{
  "_id": "6a1f2c7bb401979e734260eb",
  "Package": "tabulapdf",
  "Type": "Package",
  "Title": "Extract Tables from PDF Documents",
  "Description": "Bindings for the 'Tabula' <https://tabula.technology/>\n'Java' library, which can extract tables from PDF files. This\ntool can reduce time and effort in data extraction processes in\nfields like investigative journalism. It allows for automatic\nand manual table extraction, the latter facilitated through a\n'Shiny' interface, enabling manual areas selection with a\ncomputer mouse for data retrieval.",
  "Version": "1.0.5-5",
  "Authors@R": "c(\nperson(\"Thomas J.\", \"Leeper\",\nrole = \"aut\",\nemail = \"thosjleeper@gmail.com\",\ncomment = c(ORCID = \"0000-0003-4097-6326\")),\nperson(\"Mauricio\", \"Vargas Sepulveda\",\nrole = c(\"aut\",\"cre\"),\nemail = \"m.sepulveda@mail.utoronto.ca\",\ncomment = c(ORCID = \"0000-0003-1017-7574\")),\nperson(\"Tom\", \"Paskhalis\",\nrole = \"aut\",\nemail = \"tpaskhalis@gmail.com\",\ncomment = c(ORCID = \"0000-0001-9298-8850\")),\nperson(\"Manuel\", \"Aristaran\",\nrole = \"ctb\"),\nperson(\"David\", \"Gohel\",\nrole = \"ctb\",\ncomment = \"rOpenSci reviewer\"),\nperson(\"Lincoln\", \"Mullen\",\nrole = \"ctb\",\ncomment = \"rOpenSci reviewer\"),\nperson(\"Munk School of Global Affairs and Public Policy\",\nrole = \"fnd\")\n)",
  "License": "Apache License (>= 2)",
  "URL": "https://docs.ropensci.org/tabulapdf/ (website)\nhttps://github.com/ropensci/tabulapdf/",
  "BugReports": "https://github.com/ropensci/tabulapdf/issues/",
  "SystemRequirements": "Java (>= 7.0): openjdk-11-jdk (deb),\njava-11-openjdk.x86_64 (rpm), openjdk@11 (brew)",
  "VignetteBuilder": "knitr",
  "Encoding": "UTF-8",
  "RoxygenNote": "7.3.2",
  "Config/pak/sysreqs": "make default-jdk libpng-dev libx11-dev",
  "Repository": "https://ropensci.r-universe.dev",
  "Date/Publication": "2025-01-03 08:31:08 UTC",
  "RemoteUrl": "https://github.com/ropensci/tabulapdf",
  "RemoteRef": "main",
  "RemoteSha": "03cabea1c4cd5fec818a9539115d773c5cb4ff0b",
  "NeedsCompilation": "no",
  "Packaged": {
    "Date": "2026-05-15 09:54:19 UTC",
    "User": "root"
  },
  "Author": "Thomas J. Leeper [aut] (ORCID: <https://orcid.org/0000-0003-4097-6326>),\nMauricio Vargas Sepulveda [aut, cre] (ORCID:\n<https://orcid.org/0000-0003-1017-7574>),\nTom Paskhalis [aut] (ORCID: <https://orcid.org/0000-0001-9298-8850>),\nManuel Aristaran [ctb],\nDavid Gohel [ctb] (rOpenSci reviewer),\nLincoln Mullen [ctb] (rOpenSci reviewer),\nMunk School of Global Affairs and Public Policy [fnd]",
  "Maintainer": "Mauricio Vargas Sepulveda <m.sepulveda@mail.utoronto.ca>",
  "MD5sum": "827e62023d0fe2729805dbde43ffcb49",
  "_user": "ropensci",
  "_type": "src",
  "_file": "tabulapdf_1.0.5-5.tar.gz",
  "_fileid": "c5439853044c91c167aebf040573be8b8dfe30374fe802ac0c26858221b13583",
  "_filesize": 13038175,
  "_sha256": "c5439853044c91c167aebf040573be8b8dfe30374fe802ac0c26858221b13583",
  "_created": "2026-05-15T09:54:19.000Z",
  "_published": "2026-06-02T19:18:19.950Z",
  "_distro": "noble",
  "_jobs": [
    {
      "job": 79152625465,
      "time": 172,
      "config": "linux-devel-x86_64",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "7014556077"
    },
    {
      "job": 79152625506,
      "time": 158,
      "config": "linux-release-x86_64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7014552080"
    },
    {
      "job": 79152625592,
      "time": 127,
      "config": "macos-oldrel-arm64",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "7014764260"
    },
    {
      "job": 79152625456,
      "time": 129,
      "config": "macos-release-arm64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7014772589"
    },
    {
      "job": 79152624824,
      "time": 157,
      "config": "pkgdown",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7014492878"
    },
    {
      "job": 79152625130,
      "time": 199,
      "config": "source",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7014504113"
    },
    {
      "job": 79152624629,
      "time": 127,
      "config": "wasm-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7367538498"
    },
    {
      "job": 79152625171,
      "time": 112,
      "config": "windows-devel",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "7014538076"
    },
    {
      "job": 79152625445,
      "time": 123,
      "config": "windows-oldrel",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "7014542184"
    },
    {
      "job": 79152625510,
      "time": 96,
      "config": "windows-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7014533475"
    }
  ],
  "_buildurl": "https://github.com/r-universe/ropensci/actions/runs/25911546367",
  "_status": "success",
  "_host": "GitHub-Actions",
  "_upstream": "https://github.com/ropensci/tabulapdf",
  "_commit": {
    "id": "03cabea1c4cd5fec818a9539115d773c5cb4ff0b",
    "author": "Mauricio 'Pacha' Vargas Sepulveda <m.sepulveda@mail.utoronto.ca>",
    "committer": "Mauricio 'Pacha' Vargas Sepulveda <m.sepulveda@mail.utoronto.ca>",
    "message": "add CRAN changes to repo\n",
    "time": 1735893068
  },
  "_maintainer": {
    "name": "Mauricio Vargas Sepulveda",
    "email": "m.sepulveda@mail.utoronto.ca",
    "login": "pachadotdev",
    "orcid": "0000-0003-1017-7574",
    "uuid": 10091065
  },
  "_registered": true,
  "_dependencies": [
    {
      "package": "png",
      "role": "Imports"
    },
    {
      "package": "readr",
      "role": "Imports"
    },
    {
      "package": "rJava",
      "role": "Imports"
    },
    {
      "package": "tools",
      "role": "Imports"
    },
    {
      "package": "utils",
      "role": "Imports"
    },
    {
      "package": "graphics",
      "role": "Suggests"
    },
    {
      "package": "grDevices",
      "role": "Suggests"
    },
    {
      "package": "knitr",
      "role": "Suggests"
    },
    {
      "package": "miniUI",
      "role": "Suggests"
    },
    {
      "package": "shiny",
      "role": "Suggests"
    },
    {
      "package": "testthat",
      "role": "Suggests"
    },
    {
      "package": "rmarkdown",
      "role": "Suggests"
    },
    {
      "package": "covr",
      "role": "Suggests"
    }
  ],
  "_owner": "ropensci",
  "_selfowned": true,
  "_usedby": 2,
  "_updates": [],
  "_tags": [],
  "_topics": [
    "java",
    "pdf",
    "pdf-document",
    "peer-reviewed",
    "ropensci",
    "tabula",
    "tabular-data",
    "openjdk"
  ],
  "_stars": 564,
  "_contributors": [
    {
      "user": "leeper",
      "count": 76,
      "uuid": 3505428
    },
    {
      "user": "tpaskhalis",
      "count": 59,
      "uuid": 2973437
    },
    {
      "user": "pachadotdev",
      "count": 36,
      "uuid": 10091065
    },
    {
      "user": "jeroen",
      "count": 4,
      "uuid": 216319
    },
    {
      "user": "aqlt",
      "count": 2,
      "uuid": 24825189
    },
    {
      "user": "albansagouis",
      "count": 1,
      "uuid": 25483578
    },
    {
      "user": "b-rodrigues",
      "count": 1,
      "uuid": 2998834
    },
    {
      "user": "karthik",
      "count": 1,
      "uuid": 138494
    },
    {
      "user": "uribo",
      "count": 1,
      "uuid": 228649
    }
  ],
  "_userbio": {
    "uuid": 1200269,
    "type": "organization",
    "name": "rOpenSci",
    "description": "Tools and R Packages for Open Science"
  },
  "_downloads": {
    "count": 1949,
    "source": "https://cranlogs.r-pkg.org/downloads/total/last-month/tabulapdf"
  },
  "_devurl": "https://github.com/ropensci/tabulapdf",
  "_pkgdown": "https://docs.ropensci.org/tabulapdf/",
  "_searchresults": 250,
  "_metadata": {
    "review": {
      "id": 42,
      "status": "reviewed",
      "version": "0.1.11",
      "organization": "rOpenSci Software Review",
      "url": "https://github.com/ropensci/software-review/issues/42"
    },
    "ropensci_category": "data-extraction"
  },
  "_rbuild": "4.6.0",
  "_assets": [
    "extra/citation.cff",
    "extra/citation.html",
    "extra/citation.json",
    "extra/citation.txt",
    "extra/contents.json",
    "extra/NEWS.html",
    "extra/NEWS.txt",
    "extra/readme.html",
    "extra/readme.md",
    "extra/tabulapdf.html",
    "manual.pdf"
  ],
  "_homeurl": "https://github.com/ropensci/tabulapdf",
  "_realowner": "ropensci",
  "_cranurl": true,
  "_releases": [
    {
      "version": "1.0.5-3",
      "date": "2024-05-21"
    },
    {
      "version": "1.0.5-5",
      "date": "2024-11-15"
    }
  ],
  "_exports": [
    "extract_areas",
    "extract_metadata",
    "extract_tables",
    "extract_text",
    "get_n_pages",
    "get_page_dims",
    "locate_areas",
    "make_thumbnails",
    "merge_pdfs",
    "split_pdf",
    "stop_logging"
  ],
  "_help": [
    {
      "page": "tabulapdf-package",
      "title": "tabulapdf",
      "topics": [
        "tabulapdf-package",
        "tabulapdf"
      ]
    },
    {
      "page": "extract_metadata",
      "title": "extract_metadata",
      "topics": [
        "extract_metadata"
      ]
    },
    {
      "page": "extract_tables",
      "title": "extract_tables",
      "topics": [
        "extract_tables"
      ]
    },
    {
      "page": "extract_text",
      "title": "extract_text",
      "topics": [
        "extract_text"
      ]
    },
    {
      "page": "get_page_dims",
      "title": "Page length and dimensions",
      "topics": [
        "get_n_pages",
        "get_page_dims"
      ]
    },
    {
      "page": "extract_areas",
      "title": "extract_areas",
      "topics": [
        "extract_areas",
        "locate_areas"
      ]
    },
    {
      "page": "make_thumbnails",
      "title": "make_thumbnails",
      "topics": [
        "make_thumbnails"
      ]
    },
    {
      "page": "split_merge",
      "title": "Split and merge PDFs",
      "topics": [
        "merge_pdfs",
        "split_pdf"
      ]
    },
    {
      "page": "stop_logging",
      "title": "rJava logging",
      "topics": [
        "stop_logging"
      ]
    }
  ],
  "_pkglogo": "https://github.com/ropensci/tabulapdf/raw/main/man/figures/logo.svg",
  "_readme": "https://github.com/ropensci/tabulapdf/raw/main/README.md",
  "_rundeps": [
    "bit",
    "bit64",
    "cli",
    "clipr",
    "cpp11",
    "crayon",
    "glue",
    "hms",
    "lifecycle",
    "magrittr",
    "pillar",
    "pkgconfig",
    "png",
    "prettyunits",
    "progress",
    "R6",
    "readr",
    "rJava",
    "rlang",
    "tibble",
    "tidyselect",
    "tzdb",
    "utf8",
    "vctrs",
    "vroom",
    "withr"
  ],
  "_sysdeps": [
    {
      "shlib": "libjvm",
      "package": "openjdk-21-jre-headless",
      "headers": "openjdk-21-jre-headless",
      "source": "openjdk",
      "version": "21.0.10+7-1~24.04",
      "name": "openjdk",
      "homepage": "https://openjdk.java.net/",
      "description": "OpenJDK Java runtime, using Hotspot JIT (headless)"
    }
  ],
  "_vignettes": [
    {
      "source": "tabulapdf.Rmd",
      "filename": "tabulapdf.html",
      "title": "Introduction to tabulapdf",
      "engine": "knitr::rmarkdown",
      "headings": [
        "Introduction",
        "Basic usage",
        "Specifying the extraction method",
        "Extracting areas",
        "Interactive table extraction",
        "Use case: COVID-19 treatments in Italy",
        "Miscellaneous functionality"
      ],
      "created": "2024-04-11 02:55:08",
      "modified": "2024-09-19 19:14:11",
      "commits": 7
    }
  ],
  "_score": 9.819242193484609,
  "_indexed": true,
  "_nocasepkg": "tabulapdf",
  "_universes": [
    "ropensci",
    "pachadotdev"
  ],
  "_binaries": [
    {
      "r": "4.7.0",
      "os": "linux",
      "version": "1.0.5-5",
      "date": "2026-05-15T09:56:58.000Z",
      "distro": "noble",
      "commit": "03cabea1c4cd5fec818a9539115d773c5cb4ff0b",
      "fileid": "5ea9ae5ac460c5dc7be0d677f6b09ed7293158fa143c364351856ec685ea7922",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/25911546367"
    },
    {
      "r": "4.6.0",
      "os": "linux",
      "version": "1.0.5-5",
      "date": "2026-05-15T09:56:47.000Z",
      "distro": "noble",
      "commit": "03cabea1c4cd5fec818a9539115d773c5cb4ff0b",
      "fileid": "59030c939473662858cdaf8dac2fccc1c5bdb5cb3e8253e204b09cf5aa7be763",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/25911546367"
    },
    {
      "r": "4.5.3",
      "os": "mac",
      "version": "1.0.5-5",
      "date": "2026-05-15T10:09:11.000Z",
      "commit": "03cabea1c4cd5fec818a9539115d773c5cb4ff0b",
      "fileid": "9ae836b68b84d22e2ce0ccf71dda28311a8d091f3f3573841b4ec0efb89a5e4b",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/25911546367"
    },
    {
      "r": "4.6.0",
      "os": "mac",
      "version": "1.0.5-5",
      "date": "2026-05-15T10:09:39.000Z",
      "commit": "03cabea1c4cd5fec818a9539115d773c5cb4ff0b",
      "fileid": "715cbbb314467a47f2d73e6a3ed85ad7e7ffd7caa6aa20354dc3feaf49fb284f",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/25911546367"
    },
    {
      "r": "4.7.0",
      "os": "win",
      "version": "1.0.5-5",
      "date": "2026-05-15T09:55:42.000Z",
      "commit": "03cabea1c4cd5fec818a9539115d773c5cb4ff0b",
      "fileid": "84bf2124b5275c94d07159bbbf5b0ed239de9db8f399a18efda641c516754e9b",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/25911546367"
    },
    {
      "r": "4.5.3",
      "os": "win",
      "version": "1.0.5-5",
      "date": "2026-05-15T09:56:03.000Z",
      "commit": "03cabea1c4cd5fec818a9539115d773c5cb4ff0b",
      "fileid": "9b3a2fbbd15af47f7372acae34bbe82e6601f39680406330087a66118b91365b",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/25911546367"
    },
    {
      "r": "4.6.0",
      "os": "win",
      "version": "1.0.5-5",
      "date": "2026-05-15T09:55:37.000Z",
      "commit": "03cabea1c4cd5fec818a9539115d773c5cb4ff0b",
      "fileid": "fdc75c1036b228281787fef9ac5aaa89cfaad1b99bc902f93bb53f7b503c8429",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/25911546367"
    },
    {
      "r": "4.6.0",
      "os": "wasm",
      "version": "1.0.5-5",
      "date": "2026-06-02T19:17:55.000Z",
      "commit": "03cabea1c4cd5fec818a9539115d773c5cb4ff0b",
      "fileid": "bbec22f22286bf30ac43364a8a0c62b867961c2de0c95a92624f228c30da75ca",
      "status": "success",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/25911546367"
    }
  ]
}