{
  "_id": "6a44ceaf6ff6f2357551ba80",
  "Package": "tabulapdf",
  "Type": "Package",
  "Title": "Extract Tables from PDF Documents",
  "Description": "Bindings for the 'Tabula' <https://tabula.technology/>\n'Java' library, which can extract tables from PDF files. This\ntool can reduce time and effort in data extraction processes in\nfields like investigative journalism. It allows for automatic\nand manual table extraction, the latter facilitated through a\n'Shiny' interface, enabling manual areas selection\\ with a\ncomputer mouse for data retrieval.",
  "Version": "1.0.5-5",
  "Authors@R": "c(\nperson(\"Thomas J.\", \"Leeper\",\nrole = \"aut\",\nemail = \"thosjleeper@gmail.com\",\ncomment = c(ORCID = \"0000-0003-4097-6326\")),\nperson(\"Mauricio\", \"Vargas Sepulveda\",\nrole = c(\"aut\",\"cre\"),\nemail = \"m.sepulveda@mail.utoronto.ca\",\ncomment = c(ORCID = \"0000-0003-1017-7574\")),\nperson(\"Tom\", \"Paskhalis\",\nrole = \"aut\",\nemail = \"tpaskhalis@gmail.com\",\ncomment = c(ORCID = \"0000-0001-9298-8850\")),\nperson(\"Manuel\", \"Aristaran\",\nrole = \"ctb\"),\nperson(\"David\", \"Gohel\",\nrole = \"ctb\",\ncomment = \"rOpenSci reviewer\"),\nperson(\"Lincoln\", \"Mullen\",\nrole = \"ctb\",\ncomment = \"rOpenSci reviewer\"),\nperson(\"Munk School of Global Affairs and Public Policy\",\nrole = \"fnd\")\n)",
  "License": "Apache License (>= 2)",
  "URL": "https://docs.ropensci.org/tabulapdf/ (website)\nhttps://github.com/ropensci/tabulapdf/",
  "BugReports": "https://github.com/ropensci/tabulapdf/issues/",
  "SystemRequirements": "Java (>= 7.0): openjdk-11-jdk (deb),\njava-11-openjdk.x86_64 (rpm), openjdk@11 (brew)",
  "VignetteBuilder": "knitr",
  "Encoding": "UTF-8",
  "RoxygenNote": "7.3.2",
  "Config/pak/sysreqs": "make default-jdk libpng-dev libx11-dev",
  "Repository": "https://ropensci.r-universe.dev",
  "Date/Publication": "2025-01-03 08:31:08 UTC",
  "RemoteUrl": "https://github.com/ropensci/tabulapdf",
  "RemoteRef": "main",
  "RemoteSha": "03cabea1c4cd5fec818a9539115d773c5cb4ff0b",
  "NeedsCompilation": "no",
  "Packaged": {
    "Date": "2026-07-01 08:16:10 UTC",
    "User": "root"
  },
  "Author": "Thomas J. Leeper [aut] (ORCID: <https://orcid.org/0000-0003-4097-6326>),\nMauricio Vargas Sepulveda [aut, cre] (ORCID:\n<https://orcid.org/0000-0003-1017-7574>),\nTom Paskhalis [aut] (ORCID: <https://orcid.org/0000-0001-9298-8850>),\nManuel Aristaran [ctb],\nDavid Gohel [ctb] (rOpenSci reviewer),\nLincoln Mullen [ctb] (rOpenSci reviewer),\nMunk School of Global Affairs and Public Policy [fnd]",
  "Maintainer": "Mauricio Vargas Sepulveda <m.sepulveda@mail.utoronto.ca>",
  "_user": "ropensci",
  "_type": "src",
  "_file": "tabulapdf_1.0.5-5.tar.gz",
  "_fileid": "https://r2.ropensci.org/12283c61f21683366bcefb20c79354d72f9918e95a2fa3e7048f4414a0629cdd",
  "_filesize": 13036363,
  "_sha256": "12283c61f21683366bcefb20c79354d72f9918e95a2fa3e7048f4414a0629cdd",
  "_expires": "2026-10-09T08:24:14.000Z",
  "_created": "2026-07-01T08:16:10.000Z",
  "_published": "2026-07-01T08:24:15.467Z",
  "_jobs": [
    {
      "job": 84486409633,
      "time": 160,
      "config": "linux-devel-x86_64",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "8004092454"
    },
    {
      "job": 84486409603,
      "time": 171,
      "config": "linux-release-x86_64",
      "r": "4.6.1",
      "check": "OK",
      "artifact": "8004096278"
    },
    {
      "job": 84486409606,
      "time": 133,
      "config": "macos-oldrel-arm64",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "8004144644"
    },
    {
      "job": 84486409595,
      "time": 167,
      "config": "macos-release-arm64",
      "r": "4.6.1",
      "check": "OK",
      "artifact": "8004158480"
    },
    {
      "job": 84485761468,
      "time": 156,
      "config": "pkgdown",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "8004007015"
    },
    {
      "job": 84485761481,
      "time": 215,
      "config": "source",
      "r": "4.6.1",
      "check": "OK",
      "artifact": "8004027834"
    },
    {
      "job": 84486409586,
      "time": 163,
      "config": "wasm-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "8004093769"
    },
    {
      "job": 84486409635,
      "time": 113,
      "config": "windows-devel",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "8004076986"
    },
    {
      "job": 84486409618,
      "time": 108,
      "config": "windows-oldrel",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "8004074131"
    },
    {
      "job": 84486409619,
      "time": 108,
      "config": "windows-release",
      "r": "4.6.1",
      "check": "OK",
      "artifact": "8004074677"
    }
  ],
  "_host": "GitHub-Actions",
  "_buildurl": "https://github.com/r-universe/ropensci/actions/runs/28503355484",
  "_status": "success",
  "_upstream": "https://github.com/ropensci/tabulapdf",
  "_commit": {
    "id": "03cabea1c4cd5fec818a9539115d773c5cb4ff0b",
    "author": "Mauricio 'Pacha' Vargas Sepulveda <m.sepulveda@mail.utoronto.ca>",
    "committer": "Mauricio 'Pacha' Vargas Sepulveda <m.sepulveda@mail.utoronto.ca>",
    "message": "add CRAN changes to repo\n",
    "time": 1735893068
  },
  "_maintainer": {
    "name": "Mauricio Vargas Sepulveda",
    "email": "m.sepulveda@mail.utoronto.ca",
    "login": "pachadotdev",
    "orcid": "0000-0003-1017-7574",
    "description": "Statistician interested in applying statistical methods to address specific policy-relevant questions, particularly in international trade.",
    "uuid": 10091065
  },
  "_distro": "resolute",
  "_registered": true,
  "_dependencies": [
    {
      "package": "png",
      "role": "Imports"
    },
    {
      "package": "readr",
      "role": "Imports"
    },
    {
      "package": "rJava",
      "role": "Imports"
    },
    {
      "package": "tools",
      "role": "Imports"
    },
    {
      "package": "utils",
      "role": "Imports"
    },
    {
      "package": "graphics",
      "role": "Suggests"
    },
    {
      "package": "grDevices",
      "role": "Suggests"
    },
    {
      "package": "knitr",
      "role": "Suggests"
    },
    {
      "package": "miniUI",
      "role": "Suggests"
    },
    {
      "package": "shiny",
      "role": "Suggests"
    },
    {
      "package": "testthat",
      "role": "Suggests"
    },
    {
      "package": "rmarkdown",
      "role": "Suggests"
    },
    {
      "package": "covr",
      "role": "Suggests"
    }
  ],
  "_owner": "ropensci",
  "_selfowned": true,
  "_usedby": 2,
  "_updates": [],
  "_tags": [],
  "_topics": [
    "java",
    "pdf",
    "pdf-document",
    "peer-reviewed",
    "ropensci",
    "tabula",
    "tabular-data",
    "openjdk"
  ],
  "_stars": 564,
  "_contributors": [
    {
      "user": "leeper",
      "count": 76,
      "uuid": 3505428
    },
    {
      "user": "tpaskhalis",
      "count": 59,
      "uuid": 2973437
    },
    {
      "user": "pachadotdev",
      "count": 36,
      "uuid": 10091065
    },
    {
      "user": "jeroen",
      "count": 4,
      "uuid": 216319
    },
    {
      "user": "aqlt",
      "count": 2,
      "uuid": 24825189
    },
    {
      "user": "albansagouis",
      "count": 1,
      "uuid": 25483578
    },
    {
      "user": "b-rodrigues",
      "count": 1,
      "uuid": 2998834
    },
    {
      "user": "karthik",
      "count": 1,
      "uuid": 138494
    },
    {
      "user": "uribo",
      "count": 1,
      "uuid": 228649
    }
  ],
  "_userbio": {
    "uuid": 1200269,
    "type": "organization",
    "name": "rOpenSci",
    "followers": 1106,
    "description": "Tools and R Packages for Open Science"
  },
  "_downloads": {
    "count": 1854,
    "source": "https://cranlogs.r-pkg.org/downloads/total/last-month/tabulapdf"
  },
  "_devurl": "https://github.com/ropensci/tabulapdf",
  "_pkgdown": "https://docs.ropensci.org/tabulapdf/",
  "_searchresults": 253,
  "_metadata": {
    "review": {
      "id": 42,
      "status": "reviewed",
      "version": "0.1.11",
      "organization": "rOpenSci Software Review",
      "url": "https://github.com/ropensci/software-review/issues/42"
    },
    "ropensci_category": "data-extraction"
  },
  "_rbuild": "4.6.1",
  "_assets": [
    "extra/citation.cff",
    "extra/citation.html",
    "extra/citation.json",
    "extra/citation.txt",
    "extra/contents.json",
    "extra/NEWS.html",
    "extra/NEWS.txt",
    "extra/readme.html",
    "extra/readme.md",
    "extra/tabulapdf.html",
    "manual.pdf"
  ],
  "_homeurl": "https://github.com/ropensci/tabulapdf",
  "_realowner": "ropensci",
  "_cranurl": true,
  "_releases": [
    {
      "version": "1.0.5-3",
      "date": "2024-05-21"
    },
    {
      "version": "1.0.5-5",
      "date": "2024-11-15"
    }
  ],
  "_exports": [
    "extract_areas",
    "extract_metadata",
    "extract_tables",
    "extract_text",
    "get_n_pages",
    "get_page_dims",
    "locate_areas",
    "make_thumbnails",
    "merge_pdfs",
    "split_pdf",
    "stop_logging"
  ],
  "_help": [
    {
      "page": "tabulapdf-package",
      "title": "tabulapdf",
      "topics": [
        "tabulapdf-package",
        "tabulapdf"
      ]
    },
    {
      "page": "extract_metadata",
      "title": "extract_metadata",
      "topics": [
        "extract_metadata"
      ]
    },
    {
      "page": "extract_tables",
      "title": "extract_tables",
      "topics": [
        "extract_tables"
      ]
    },
    {
      "page": "extract_text",
      "title": "extract_text",
      "topics": [
        "extract_text"
      ]
    },
    {
      "page": "get_page_dims",
      "title": "Page length and dimensions",
      "topics": [
        "get_n_pages",
        "get_page_dims"
      ]
    },
    {
      "page": "extract_areas",
      "title": "extract_areas",
      "topics": [
        "extract_areas",
        "locate_areas"
      ]
    },
    {
      "page": "make_thumbnails",
      "title": "make_thumbnails",
      "topics": [
        "make_thumbnails"
      ]
    },
    {
      "page": "split_merge",
      "title": "Split and merge PDFs",
      "topics": [
        "merge_pdfs",
        "split_pdf"
      ]
    },
    {
      "page": "stop_logging",
      "title": "rJava logging",
      "topics": [
        "stop_logging"
      ]
    }
  ],
  "_pkglogo": "https://github.com/ropensci/tabulapdf/raw/main/man/figures/logo.svg",
  "_readme": "https://github.com/ropensci/tabulapdf/raw/main/README.md",
  "_rundeps": [
    "bit",
    "bit64",
    "cli",
    "clipr",
    "cpp11",
    "crayon",
    "glue",
    "hms",
    "lifecycle",
    "magrittr",
    "pillar",
    "pkgconfig",
    "png",
    "prettyunits",
    "progress",
    "R6",
    "readr",
    "rJava",
    "rlang",
    "tibble",
    "tidyselect",
    "tzdb",
    "utf8",
    "vctrs",
    "vroom",
    "withr"
  ],
  "_sysdeps": [
    {
      "shlib": "libjvm",
      "package": "openjdk-25-jre-headless",
      "headers": "openjdk-25-jre-headless",
      "source": "openjdk",
      "version": "25.0.3+9-2~26.04.2",
      "name": "openjdk",
      "homepage": "https://openjdk.java.net/",
      "description": "OpenJDK Java runtime, using Hotspot JIT (headless)"
    }
  ],
  "_vignettes": [
    {
      "source": "tabulapdf.Rmd",
      "filename": "tabulapdf.html",
      "title": "Introduction to tabulapdf",
      "engine": "knitr::rmarkdown",
      "headings": [
        "Introduction",
        "Basic usage",
        "Specifying the extraction method",
        "Extracting areas",
        "Interactive table extraction",
        "Use case: COVID-19 treatments in Italy",
        "Miscellaneous functionality"
      ],
      "created": "2024-04-11 02:55:08",
      "modified": "2024-09-19 19:14:11",
      "commits": 7
    }
  ],
  "_score": 9.802720596679244,
  "_indexed": true,
  "_nocasepkg": "tabulapdf",
  "_universes": [
    "ropensci",
    "pachadotdev"
  ],
  "_binaries": [
    {
      "r": "4.7.0",
      "os": "linux",
      "version": "1.0.5-5",
      "date": "2026-07-01T08:18:58.000Z",
      "distro": "resolute",
      "commit": "03cabea1c4cd5fec818a9539115d773c5cb4ff0b",
      "fileid": "https://r2.ropensci.org/320539e206839316918649f685d9430125eeba3459817c73038d98799a138e5c",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/28503355484"
    },
    {
      "r": "4.6.1",
      "os": "linux",
      "version": "1.0.5-5",
      "date": "2026-07-01T08:19:05.000Z",
      "distro": "resolute",
      "commit": "03cabea1c4cd5fec818a9539115d773c5cb4ff0b",
      "fileid": "https://r2.ropensci.org/790042f6c70f7d166ec5a02aea30f8e2c6db7572fbd347653c090a8493d1fee5",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/28503355484"
    },
    {
      "r": "4.5.3",
      "os": "mac",
      "version": "1.0.5-5",
      "date": "2026-07-01T08:21:25.000Z",
      "commit": "03cabea1c4cd5fec818a9539115d773c5cb4ff0b",
      "fileid": "https://r2.ropensci.org/1a1aa3b2eb4d55b38e473e10b6ef566b4c842ddad56502ca3734f59d9fd84d4d",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/28503355484"
    },
    {
      "r": "4.6.1",
      "os": "mac",
      "version": "1.0.5-5",
      "date": "2026-07-01T08:21:38.000Z",
      "commit": "03cabea1c4cd5fec818a9539115d773c5cb4ff0b",
      "fileid": "https://r2.ropensci.org/40ad12fd97db156f0bb105af1ad0660ffa24df57da68dfb090116330da727d98",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/28503355484"
    },
    {
      "r": "4.6.0",
      "os": "wasm",
      "version": "1.0.5-5",
      "date": "2026-07-01T08:19:35.000Z",
      "commit": "03cabea1c4cd5fec818a9539115d773c5cb4ff0b",
      "fileid": "https://r2.ropensci.org/97195320c23d48f21ea51099d595bd1ca546cf72ce893a3ec652de3e3b3b45f4",
      "status": "success",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/28503355484"
    },
    {
      "r": "4.7.0",
      "os": "win",
      "version": "1.0.5-5",
      "date": "2026-07-01T08:18:04.000Z",
      "commit": "03cabea1c4cd5fec818a9539115d773c5cb4ff0b",
      "fileid": "https://r2.ropensci.org/643dfb16112af8fddbad6323245b72ede41c30f8b8cad090d51ba341598872d8",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/28503355484"
    },
    {
      "r": "4.5.3",
      "os": "win",
      "version": "1.0.5-5",
      "date": "2026-07-01T08:17:54.000Z",
      "commit": "03cabea1c4cd5fec818a9539115d773c5cb4ff0b",
      "fileid": "https://r2.ropensci.org/3c27329311af6fc5232cc9cecd3d6c60c5d9a172d011566c353e89bcf5cee0f5",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/28503355484"
    },
    {
      "r": "4.6.1",
      "os": "win",
      "version": "1.0.5-5",
      "date": "2026-07-01T08:17:56.000Z",
      "commit": "03cabea1c4cd5fec818a9539115d773c5cb4ff0b",
      "fileid": "https://r2.ropensci.org/88e2e0b74a002fe87816cf0259663f1ff7daa0a872cd809f382a8a4e33274429",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/28503355484"
    }
  ]
}