{
  "_id": "6a1f071cb401979e7341bdb4",
  "Package": "tabulapdf",
  "Type": "Package",
  "Title": "Extract Tables from PDF Documents",
  "Description": "Bindings for the 'Tabula' <https://tabula.technology/>\n'Java' library, which can extract tables from PDF files. This\ntool can reduce time and effort in data extraction processes in\nfields like investigative journalism. It allows for automatic\nand manual table extraction, the latter facilitated through a\n'Shiny' interface, enabling manual areas selection\\ with a\ncomputer mouse for data retrieval.",
  "Version": "1.0.5-5",
  "Authors@R": "c(\nperson(\"Thomas J.\", \"Leeper\",\nrole = \"aut\",\nemail = \"thosjleeper@gmail.com\",\ncomment = c(ORCID = \"0000-0003-4097-6326\")),\nperson(\"Mauricio\", \"Vargas Sepulveda\",\nrole = c(\"aut\",\"cre\"),\nemail = \"m.sepulveda@mail.utoronto.ca\",\ncomment = c(ORCID = \"0000-0003-1017-7574\")),\nperson(\"Tom\", \"Paskhalis\",\nrole = \"aut\",\nemail = \"tpaskhalis@gmail.com\",\ncomment = c(ORCID = \"0000-0001-9298-8850\")),\nperson(\"Manuel\", \"Aristaran\",\nrole = \"ctb\"),\nperson(\"David\", \"Gohel\",\nrole = \"ctb\",\ncomment = \"rOpenSci reviewer\"),\nperson(\"Lincoln\", \"Mullen\",\nrole = \"ctb\",\ncomment = \"rOpenSci reviewer\"),\nperson(\"Munk School of Global Affairs and Public Policy\",\nrole = \"fnd\")\n)",
  "License": "Apache License (>= 2)",
  "URL": "https://docs.ropensci.org/tabulapdf/ (website)\nhttps://github.com/ropensci/tabulapdf/",
  "BugReports": "https://github.com/ropensci/tabulapdf/issues/",
  "SystemRequirements": "Java (>= 7.0): openjdk-11-jdk (deb),\njava-11-openjdk.x86_64 (rpm), openjdk@11 (brew)",
  "VignetteBuilder": "knitr",
  "Encoding": "UTF-8",
  "RoxygenNote": "7.3.2",
  "NeedsCompilation": "no",
  "Packaged": {
    "Date": "2026-05-18 06:50:13 UTC",
    "User": "root"
  },
  "Author": "Thomas J. Leeper [aut]\n(<https://orcid.org/0000-0003-4097-6326>), Mauricio Vargas\nSepulveda [aut, cre] (<https://orcid.org/0000-0003-1017-7574>),\nTom Paskhalis [aut] (<https://orcid.org/0000-0001-9298-8850>),\nManuel Aristaran [ctb], David Gohel [ctb] (rOpenSci reviewer),\nLincoln Mullen [ctb] (rOpenSci reviewer), Munk School of Global\nAffairs and Public Policy [fnd]",
  "Maintainer": "Mauricio Vargas Sepulveda <m.sepulveda@mail.utoronto.ca>",
  "Config/pak/sysreqs": "default-jdk",
  "Repository": "https://cran.r-universe.dev",
  "Date/Publication": "2024-11-15 13:00:02 UTC",
  "RemoteUrl": "https://github.com/cran/tabulapdf",
  "RemoteRef": "HEAD",
  "RemoteSha": "6b13547143722c3ce9e6434d9dc18571278310cc",
  "MD5sum": "757c7a4f332b7cec60fa81e3ac8612c7",
  "_user": "cran",
  "_type": "src",
  "_file": "tabulapdf_1.0.5-5.tar.gz",
  "_fileid": "34ce63c2f96c565d7a058d8fab0571044bdfd95653393f7470455599f5cdc831",
  "_filesize": 13035986,
  "_sha256": "34ce63c2f96c565d7a058d8fab0571044bdfd95653393f7470455599f5cdc831",
  "_created": "2026-05-18T06:50:13.000Z",
  "_published": "2026-06-02T16:38:52.228Z",
  "_distro": "noble",
  "_jobs": [
    {
      "job": 79122434614,
      "time": 166,
      "config": "linux-devel-x86_64",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "7051248211"
    },
    {
      "job": 79122435133,
      "time": 161,
      "config": "linux-release-x86_64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7051247189"
    },
    {
      "job": 79122433917,
      "time": 222,
      "config": "source",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7051206859"
    },
    {
      "job": 79122434056,
      "time": 149,
      "config": "wasm-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7363991308"
    }
  ],
  "_buildurl": "https://github.com/r-universe/cran/actions/runs/26017853300",
  "_status": "success",
  "_host": "GitHub-Actions",
  "_upstream": "https://github.com/cran/tabulapdf",
  "_commit": {
    "id": "6b13547143722c3ce9e6434d9dc18571278310cc",
    "author": "Mauricio Vargas Sepulveda <m.sepulveda@mail.utoronto.ca>",
    "committer": "cran-robot <csardi.gabor+cran@gmail.com>",
    "message": "version 1.0.5-5\n",
    "time": 1731675602
  },
  "_maintainer": {
    "name": "Mauricio Vargas Sepulveda",
    "email": "m.sepulveda@mail.utoronto.ca",
    "login": "pachadotdev",
    "orcid": "0000-0003-1017-7574",
    "description": "Statistician interested in applying statistical methods to address specific policy-relevant questions, particularly in international trade.",
    "uuid": 10091065
  },
  "_registered": true,
  "_dependencies": [
    {
      "package": "png",
      "role": "Imports"
    },
    {
      "package": "readr",
      "role": "Imports"
    },
    {
      "package": "rJava",
      "role": "Imports"
    },
    {
      "package": "tools",
      "role": "Imports"
    },
    {
      "package": "utils",
      "role": "Imports"
    },
    {
      "package": "graphics",
      "role": "Suggests"
    },
    {
      "package": "grDevices",
      "role": "Suggests"
    },
    {
      "package": "knitr",
      "role": "Suggests"
    },
    {
      "package": "miniUI",
      "role": "Suggests"
    },
    {
      "package": "shiny",
      "role": "Suggests"
    },
    {
      "package": "testthat",
      "role": "Suggests"
    },
    {
      "package": "rmarkdown",
      "role": "Suggests"
    },
    {
      "package": "covr",
      "role": "Suggests"
    }
  ],
  "_owner": "cran",
  "_selfowned": false,
  "_usedby": 2,
  "_updates": [],
  "_tags": [],
  "_stars": 0,
  "_contributors": [
    {
      "user": "pachadotdev",
      "count": 2,
      "uuid": 10091065
    }
  ],
  "_userbio": {
    "uuid": 6899542,
    "type": "organization",
    "name": "cran",
    "description": "Unofficial read-only mirror of all CRAN R packages"
  },
  "_downloads": {
    "count": 1925,
    "source": "https://cranlogs.r-pkg.org/downloads/total/last-month/tabulapdf"
  },
  "_devurl": "https://github.com/ropensci/tabulapdf",
  "_pkgdown": "https://docs.ropensci.org/tabulapdf/",
  "_searchresults": 250,
  "_topics": [
    "openjdk"
  ],
  "_rbuild": "4.6.0",
  "_assets": [
    "extra/citation.cff",
    "extra/citation.html",
    "extra/citation.json",
    "extra/citation.txt",
    "extra/contents.json",
    "extra/NEWS.html",
    "extra/NEWS.txt",
    "extra/readme.html",
    "extra/readme.md",
    "extra/tabulapdf.html",
    "manual.pdf"
  ],
  "_homeurl": "https://github.com/ropensci/tabulapdf",
  "_realowner": "ropensci",
  "_cranurl": false,
  "_releases": [
    {
      "version": "1.0.5-3",
      "date": "2024-05-21"
    },
    {
      "version": "1.0.5-5",
      "date": "2024-11-15"
    }
  ],
  "_exports": [
    "extract_areas",
    "extract_metadata",
    "extract_tables",
    "extract_text",
    "get_n_pages",
    "get_page_dims",
    "locate_areas",
    "make_thumbnails",
    "merge_pdfs",
    "split_pdf",
    "stop_logging"
  ],
  "_help": [
    {
      "page": "tabulapdf-package",
      "title": "tabulapdf",
      "topics": [
        "tabulapdf-package",
        "tabulapdf"
      ]
    },
    {
      "page": "extract_metadata",
      "title": "extract_metadata",
      "topics": [
        "extract_metadata"
      ]
    },
    {
      "page": "extract_tables",
      "title": "extract_tables",
      "topics": [
        "extract_tables"
      ]
    },
    {
      "page": "extract_text",
      "title": "extract_text",
      "topics": [
        "extract_text"
      ]
    },
    {
      "page": "get_page_dims",
      "title": "Page length and dimensions",
      "topics": [
        "get_n_pages",
        "get_page_dims"
      ]
    },
    {
      "page": "extract_areas",
      "title": "extract_areas",
      "topics": [
        "extract_areas",
        "locate_areas"
      ]
    },
    {
      "page": "make_thumbnails",
      "title": "make_thumbnails",
      "topics": [
        "make_thumbnails"
      ]
    },
    {
      "page": "split_merge",
      "title": "Split and merge PDFs",
      "topics": [
        "merge_pdfs",
        "split_pdf"
      ]
    },
    {
      "page": "stop_logging",
      "title": "rJava logging",
      "topics": [
        "stop_logging"
      ]
    }
  ],
  "_pkglogo": "https://github.com/cran/tabulapdf/raw/HEAD/man/figures/logo.svg",
  "_readme": "https://github.com/cran/tabulapdf/raw/HEAD/README.md",
  "_rundeps": [
    "bit",
    "bit64",
    "cli",
    "clipr",
    "cpp11",
    "crayon",
    "glue",
    "hms",
    "lifecycle",
    "magrittr",
    "pillar",
    "pkgconfig",
    "png",
    "prettyunits",
    "progress",
    "R6",
    "readr",
    "rJava",
    "rlang",
    "tibble",
    "tidyselect",
    "tzdb",
    "utf8",
    "vctrs",
    "vroom",
    "withr"
  ],
  "_sysdeps": [
    {
      "shlib": "libjvm",
      "package": "openjdk-21-jre-headless",
      "headers": "openjdk-21-jre-headless",
      "source": "openjdk",
      "version": "21.0.10+7-1~24.04",
      "name": "openjdk",
      "homepage": "https://openjdk.java.net/",
      "description": "OpenJDK Java runtime, using Hotspot JIT (headless)"
    }
  ],
  "_vignettes": [
    {
      "source": "tabulapdf.Rmd",
      "filename": "tabulapdf.html",
      "title": "Introduction to tabulapdf",
      "engine": "knitr::rmarkdown",
      "headings": [
        "Introduction",
        "Basic usage",
        "Specifying the extraction method",
        "Extracting areas",
        "Interactive table extraction",
        "Use case: COVID-19 treatments in Italy",
        "Miscellaneous functionality"
      ],
      "created": "2024-05-22 02:41:26",
      "modified": "2024-11-15 13:00:02",
      "commits": 2
    }
  ],
  "_score": 5.15949199723622,
  "_indexed": false,
  "_nocasepkg": "tabulapdf",
  "_universes": [
    "cran"
  ],
  "_indexurl": "https://ropensci.r-universe.dev/tabulapdf",
  "_binaries": [
    {
      "r": "4.7.0",
      "os": "linux",
      "version": "1.0.5-5",
      "date": "2026-05-18T06:52:50.000Z",
      "distro": "noble",
      "commit": "6b13547143722c3ce9e6434d9dc18571278310cc",
      "fileid": "1dfb04923ff8d4cb06569b288f636e8c61c03ba61d3045f885f127aed3fe58e4",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/cran/actions/runs/26017853300"
    },
    {
      "r": "4.6.0",
      "os": "linux",
      "version": "1.0.5-5",
      "date": "2026-05-18T06:52:44.000Z",
      "distro": "noble",
      "commit": "6b13547143722c3ce9e6434d9dc18571278310cc",
      "fileid": "44a497e3c3a6f3fecc6d6d5535f87b21766de73ab6b1acfb2c30a681c2e70146",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/cran/actions/runs/26017853300"
    },
    {
      "r": "4.6.0",
      "os": "wasm",
      "version": "1.0.5-5",
      "date": "2026-06-02T16:38:28.000Z",
      "commit": "6b13547143722c3ce9e6434d9dc18571278310cc",
      "fileid": "4915569dfde0b9e30115c42a5eba75199167a4992ad11670a7c134dd92892c5b",
      "status": "success",
      "buildurl": "https://github.com/r-universe/cran/actions/runs/26017853300"
    }
  ]
}