{
  "_id": "6a055b13607d4c2ebf59373e",
  "Package": "tesseract",
  "Type": "Package",
  "Title": "Open Source OCR Engine",
  "Version": "5.2.5",
  "Authors@R": "person(\"Jeroen\", \"Ooms\", role = c(\"aut\", \"cre\"), email = \"jeroenooms@gmail.com\",\ncomment = c(ORCID = \"0000-0002-4035-0289\"))",
  "Description": "Bindings to 'Tesseract': a powerful optical character\nrecognition (OCR) engine that supports over 100 languages. The\nengine is highly configurable in order to tune the detection\nalgorithms and obtain the best possible results.",
  "License": "Apache License 2.0",
  "URL": "https://docs.ropensci.org/tesseract/\nhttps://ropensci.r-universe.dev/tesseract",
  "BugReports": "https://github.com/ropensci/tesseract/issues",
  "SystemRequirements": "Tesseract >= 3.03 (libtesseract-dev /\ntesseract-devel) and Leptonica (libleptonica-dev /\nleptonica-devel). On Debian you need to install the English\ntraining data separately (tesseract-ocr-eng)",
  "RoxygenNote": "7.3.3",
  "Roxygen": "list(markdown = TRUE)",
  "Encoding": "UTF-8",
  "VignetteBuilder": "knitr",
  "Language": "en-US",
  "Config/pak/sysreqs": "libleptonica-dev libjpeg-dev libssl-dev\nlibtesseract-dev tesseract-ocr-eng zlib1g-dev",
  "Repository": "https://ropensci.r-universe.dev",
  "Date/Publication": "2026-01-26 13:10:43 UTC",
  "RemoteUrl": "https://github.com/ropensci/tesseract",
  "RemoteRef": "master",
  "RemoteSha": "eb79775ec4fd5efb1949647087f87e2216282670",
  "NeedsCompilation": "yes",
  "Packaged": {
    "Date": "2026-05-13 23:15:49 UTC",
    "User": "root"
  },
  "Author": "Jeroen Ooms [aut, cre] (ORCID: <https://orcid.org/0000-0002-4035-0289>)",
  "Maintainer": "Jeroen Ooms <jeroenooms@gmail.com>",
  "MD5sum": "f2981c5a80aaefcaf36755844ff9d9fa",
  "_user": "ropensci",
  "_type": "src",
  "_file": "tesseract_5.2.5.tar.gz",
  "_fileid": "eeb5b762220416aa6303fc2cf8c1f80cfb4cc44963a1abed20b1abda8c6bee19",
  "_filesize": 273038,
  "_sha256": "eeb5b762220416aa6303fc2cf8c1f80cfb4cc44963a1abed20b1abda8c6bee19",
  "_created": "2026-05-13T23:15:49.000Z",
  "_published": "2026-05-14T05:18:11.049Z",
  "_distro": "noble",
  "_jobs": [
    {
      "job": 75932065073,
      "time": 145,
      "config": "linux-devel-arm64",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "6983691679"
    },
    {
      "job": 75932064818,
      "time": 148,
      "config": "linux-devel-x86_64",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "6983693635"
    },
    {
      "job": 75932064815,
      "time": 137,
      "config": "linux-release-arm64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "6983689837"
    },
    {
      "job": 75932064796,
      "time": 161,
      "config": "linux-release-x86_64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "6983695097"
    },
    {
      "job": 75932064627,
      "time": 101,
      "config": "macos-oldrel-arm64",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "6987668508"
    },
    {
      "job": 75932064894,
      "time": 271,
      "config": "macos-oldrel-x86_64",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "6983723863"
    },
    {
      "job": 75932064638,
      "time": 100,
      "config": "macos-release-arm64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "6987673126"
    },
    {
      "job": 75932064975,
      "time": 237,
      "config": "macos-release-x86_64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "6983711941"
    },
    {
      "job": 75932064604,
      "time": 165,
      "config": "pkgdown",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "6983648356"
    },
    {
      "job": 75932064833,
      "time": 211,
      "config": "source",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "6983659745"
    },
    {
      "job": 75932064559,
      "time": 350,
      "config": "wasm-release",
      "r": "4.5.1",
      "check": "FAIL",
      "artifact": ""
    },
    {
      "job": 75932064814,
      "time": 145,
      "config": "windows-devel",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "6983757469"
    },
    {
      "job": 75932065035,
      "time": 130,
      "config": "windows-oldrel",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "6983688530"
    },
    {
      "job": 75932064794,
      "time": 146,
      "config": "windows-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "6983691947"
    }
  ],
  "_buildurl": "https://github.com/r-universe/ropensci/actions/runs/25831770683",
  "_status": "success",
  "_host": "GitHub-Actions",
  "_upstream": "https://github.com/ropensci/tesseract",
  "_commit": {
    "id": "eb79775ec4fd5efb1949647087f87e2216282670",
    "author": "Jeroen Ooms <jeroenooms@gmail.com>",
    "committer": "Jeroen Ooms <jeroenooms@gmail.com>",
    "message": "Wrap examples in donttest for cran policies\n",
    "time": 1769433043
  },
  "_maintainer": {
    "name": "Jeroen Ooms",
    "email": "jeroenooms@gmail.com",
    "login": "jeroen",
    "mastodon": "@jeroenooms@fosstodon.org",
    "bluesky": "@jeroenooms.bsky.social",
    "uuid": 216319,
    "orcid": "0000-0002-4035-0289"
  },
  "_registered": true,
  "_dependencies": [
    {
      "package": "Rcpp",
      "role": "LinkingTo"
    },
    {
      "package": "Rcpp",
      "version": ">= 0.12.12",
      "role": "Imports"
    },
    {
      "package": "pdftools",
      "version": ">= 1.5",
      "role": "Imports"
    },
    {
      "package": "curl",
      "role": "Imports"
    },
    {
      "package": "rappdirs",
      "role": "Imports"
    },
    {
      "package": "digest",
      "role": "Imports"
    },
    {
      "package": "magick",
      "version": ">= 1.7",
      "role": "Suggests"
    },
    {
      "package": "spelling",
      "role": "Suggests"
    },
    {
      "package": "knitr",
      "role": "Suggests"
    },
    {
      "package": "tibble",
      "role": "Suggests"
    },
    {
      "package": "rmarkdown",
      "role": "Suggests"
    }
  ],
  "_owner": "ropensci",
  "_selfowned": true,
  "_usedby": 0,
  "_updates": [
    {
      "week": "2026-01",
      "n": 5
    },
    {
      "week": "2026-05",
      "n": 1
    }
  ],
  "_tags": [],
  "_topics": [
    "ocr",
    "tesseract",
    "tesseract-ocr",
    "cpp"
  ],
  "_stars": 251,
  "_contributors": [
    {
      "user": "jeroen",
      "count": 263,
      "uuid": 216319
    },
    {
      "user": "pachadotdev",
      "count": 3,
      "uuid": 10091065
    },
    {
      "user": "samuel-rosa",
      "count": 1,
      "uuid": 10142507
    },
    {
      "user": "kant",
      "count": 1,
      "uuid": 32717
    },
    {
      "user": "dmi3kno",
      "count": 1,
      "uuid": 13419011
    },
    {
      "user": "maelle",
      "count": 1,
      "uuid": 8360597
    }
  ],
  "_userbio": {
    "uuid": 1200269,
    "type": "organization",
    "name": "rOpenSci",
    "description": "Tools and R Packages for Open Science"
  },
  "_downloads": {
    "count": 99947,
    "source": "https://cranlogs.r-pkg.org/downloads/total/last-month/tesseract"
  },
  "_mentions": 2,
  "_devurl": "https://github.com/ropensci/tesseract",
  "_pkgdown": "https://docs.ropensci.org/tesseract/",
  "_searchresults": 610,
  "_metadata": {
    "ropensci_category": "image-processing"
  },
  "_rbuild": "4.6.0",
  "_assets": [
    "extra/citation.cff",
    "extra/citation.html",
    "extra/citation.json",
    "extra/citation.txt",
    "extra/contents.json",
    "extra/NEWS.html",
    "extra/NEWS.txt",
    "extra/readme.html",
    "extra/readme.md",
    "extra/tesseract.html",
    "manual.pdf"
  ],
  "_homeurl": "https://github.com/ropensci/tesseract",
  "_realowner": "ropensci",
  "_cranurl": true,
  "_releases": [
    {
      "version": "1.0",
      "date": "2016-11-03"
    },
    {
      "version": "1.1",
      "date": "2016-11-10"
    },
    {
      "version": "1.2",
      "date": "2016-11-13"
    },
    {
      "version": "1.3",
      "date": "2016-12-07"
    },
    {
      "version": "1.4",
      "date": "2017-03-21"
    },
    {
      "version": "1.6",
      "date": "2017-08-14"
    },
    {
      "version": "1.8",
      "date": "2018-01-26"
    },
    {
      "version": "1.9",
      "date": "2018-02-16"
    },
    {
      "version": "2.0",
      "date": "2018-03-02"
    },
    {
      "version": "2.1",
      "date": "2018-05-03"
    },
    {
      "version": "2.2",
      "date": "2018-07-10"
    },
    {
      "version": "2.3",
      "date": "2018-08-10"
    },
    {
      "version": "4.0",
      "date": "2018-11-02"
    },
    {
      "version": "4.1",
      "date": "2019-07-25"
    },
    {
      "version": "4.1.1",
      "date": "2021-05-10"
    },
    {
      "version": "4.1.2",
      "date": "2021-09-18"
    },
    {
      "version": "4.2.0",
      "date": "2021-12-03"
    },
    {
      "version": "5.0.0",
      "date": "2022-01-10"
    },
    {
      "version": "5.1.0",
      "date": "2022-05-29"
    },
    {
      "version": "5.2.0",
      "date": "2023-09-26"
    },
    {
      "version": "5.2.1",
      "date": "2023-11-20"
    },
    {
      "version": "5.2.2",
      "date": "2024-10-04"
    },
    {
      "version": "5.2.3",
      "date": "2025-03-23"
    },
    {
      "version": "5.2.4",
      "date": "2025-12-29"
    },
    {
      "version": "5.2.5",
      "date": "2026-01-26"
    }
  ],
  "_exports": [
    "ocr",
    "ocr_data",
    "tesseract",
    "tesseract_download",
    "tesseract_info",
    "tesseract_params"
  ],
  "_help": [
    {
      "page": "ocr",
      "title": "Tesseract OCR",
      "concept": [
        "tesseract"
      ],
      "topics": [
        "ocr",
        "ocr_data"
      ]
    },
    {
      "page": "tesseract",
      "title": "Tesseract Engine",
      "concept": [
        "tesseract"
      ],
      "topics": [
        "tesseract",
        "tesseract_info",
        "tesseract_params"
      ]
    },
    {
      "page": "tessdata",
      "title": "Tesseract Training Data",
      "concept": [
        "tesseract"
      ],
      "topics": [
        "tessdata",
        "tesseract_download"
      ]
    }
  ],
  "_readme": "https://github.com/ropensci/tesseract/raw/master/README.md",
  "_rundeps": [
    "askpass",
    "curl",
    "digest",
    "pdftools",
    "qpdf",
    "rappdirs",
    "Rcpp",
    "sys"
  ],
  "_sysdeps": [
    {
      "shlib": "libtesseract",
      "package": "libtesseract5",
      "headers": "libtesseract-dev",
      "source": "tesseract",
      "version": "5.3.4-1build5",
      "name": "tesseract",
      "homepage": "https://github.com/tesseract-ocr/",
      "description": "Tesseract OCR library"
    },
    {
      "shlib": "libstdc++",
      "package": "libstdc++6",
      "source": "gcc",
      "version": "14.2.0-4ubuntu2~24.04.1",
      "name": "c++",
      "homepage": "http://gcc.gnu.org/",
      "description": "GNU Standard C++ Library v3"
    }
  ],
  "_vignettes": [
    {
      "source": "intro.Rmd",
      "filename": "intro.html",
      "title": "Using the Tesseract OCR engine in R",
      "engine": "knitr::rmarkdown",
      "headings": [
        "Extract Text from Images",
        "Language Data",
        "Preprocessing with Magick",
        "Read from PDF files",
        "Tesseract Control Parameters",
        "Whitelist / Blacklist characters"
      ],
      "created": "2018-02-23 22:16:20",
      "modified": "2023-11-20 14:44:32",
      "commits": 28
    }
  ],
  "_score": 11.184773319398175,
  "_indexed": true,
  "_nocasepkg": "tesseract",
  "_universes": [
    "ropensci",
    "jeroen"
  ],
  "_binaries": [
    {
      "r": "4.7.0",
      "os": "linux",
      "version": "5.2.5",
      "date": "2026-05-13T23:18:22.000Z",
      "distro": "noble",
      "arch": "aarch64",
      "commit": "eb79775ec4fd5efb1949647087f87e2216282670",
      "fileid": "747ef9156c022ccbcae183fc37d8548520dd8ef3f4f4ece48e4b7773ca9fce64",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/25831770683"
    },
    {
      "r": "4.7.0",
      "os": "linux",
      "version": "5.2.5",
      "date": "2026-05-13T23:18:28.000Z",
      "distro": "noble",
      "arch": "x86_64",
      "commit": "eb79775ec4fd5efb1949647087f87e2216282670",
      "fileid": "ef0c306a32c0cb53601ae82b3b066953980d3430f3a8381fb3b12a10312f1e86",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/25831770683"
    },
    {
      "r": "4.6.0",
      "os": "linux",
      "version": "5.2.5",
      "date": "2026-05-13T23:18:14.000Z",
      "distro": "noble",
      "arch": "aarch64",
      "commit": "eb79775ec4fd5efb1949647087f87e2216282670",
      "fileid": "aaff2cc337feb7cdb5c7753bd1877c1202618f4c649b5e6d9767b7f90e57f83a",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/25831770683"
    },
    {
      "r": "4.6.0",
      "os": "linux",
      "version": "5.2.5",
      "date": "2026-05-13T23:18:33.000Z",
      "distro": "noble",
      "arch": "x86_64",
      "commit": "eb79775ec4fd5efb1949647087f87e2216282670",
      "fileid": "ab15b9571cc78e40d46903432b95d21388ae4a4133da7ce1ed0c242473ef5c52",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/25831770683"
    },
    {
      "r": "4.5.3",
      "os": "mac",
      "version": "5.2.5",
      "date": "2026-05-14T05:16:59.000Z",
      "arch": "aarch64",
      "commit": "eb79775ec4fd5efb1949647087f87e2216282670",
      "fileid": "8cfcdbf521f5b1d1fa10fd4d55b812ac1b78c9275703fcbadc8b15baed21fa7b",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/25831770683"
    },
    {
      "r": "4.5.3",
      "os": "mac",
      "version": "5.2.5",
      "date": "2026-05-13T23:20:13.000Z",
      "arch": "x86_64",
      "commit": "eb79775ec4fd5efb1949647087f87e2216282670",
      "fileid": "e0bedd0aa2c58e0f95192cea027a7591f8fcf798823ff11d8f13a06ac7be8edc",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/25831770683"
    },
    {
      "r": "4.6.0",
      "os": "mac",
      "version": "5.2.5",
      "date": "2026-05-14T05:17:22.000Z",
      "arch": "aarch64",
      "commit": "eb79775ec4fd5efb1949647087f87e2216282670",
      "fileid": "3e841abe908f0662174de9db8ff1996bef5da99ac96c58d6ef25469bb25b0b18",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/25831770683"
    },
    {
      "r": "4.6.0",
      "os": "mac",
      "version": "5.2.5",
      "date": "2026-05-13T23:19:01.000Z",
      "arch": "x86_64",
      "commit": "eb79775ec4fd5efb1949647087f87e2216282670",
      "fileid": "e6b2b6432231ccbcf4ad435eb75118972f0f592f0d1d8ef48f9ccff1480428c8",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/25831770683"
    },
    {
      "r": "4.7.0",
      "os": "win",
      "version": "5.2.5",
      "date": "2026-05-13T23:22:24.000Z",
      "arch": "x86_64",
      "commit": "eb79775ec4fd5efb1949647087f87e2216282670",
      "fileid": "f47045bd3f547b176ccd3add8027c0300e5d29004cbe809e5fc0608bbd7510c0",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/25831770683"
    },
    {
      "r": "4.5.3",
      "os": "win",
      "version": "5.2.5",
      "date": "2026-05-13T23:17:10.000Z",
      "arch": "x86_64",
      "commit": "eb79775ec4fd5efb1949647087f87e2216282670",
      "fileid": "5575cf4d320407bbcfa3775592a9fef37e7913109b516be56770e8093adbe282",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/25831770683"
    },
    {
      "r": "4.6.0",
      "os": "win",
      "version": "5.2.5",
      "date": "2026-05-13T23:17:17.000Z",
      "arch": "x86_64",
      "commit": "eb79775ec4fd5efb1949647087f87e2216282670",
      "fileid": "1d09e7b48369cfa20b69825750ecaa3aafe376fa452f98a44254d616da63d2c0",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/ropensci/actions/runs/25831770683"
    }
  ]
}