{
  "_id": "6a197280acfb0bcc41deec31",
  "Package": "readtext",
  "Version": "0.92.1",
  "Type": "Package",
  "Title": "Import and Handling for Plain and Formatted Text Files",
  "Authors@R": "c( person(\"Kenneth\", \"Benoit\", email = \"kbenoit@lse.ac.uk\", role =\nc(\"aut\", \"cre\", \"cph\")),\nperson(\"Adam\", \"Obeng\", email = \"quanteda@binaryeagle.com\", role = \"aut\"),\nperson(\"Kohei\", \"Watanabe\", email = \"watanabe.kohei@gmail.com\", role = \"ctb\"),\nperson(\"Akitaka\", \"Matsuo\", email = \"a.matsuo@lse.ac.uk\", role = \"ctb\"),\nperson(\"Paul\", \"Nulty\", email = \"paul.nulty@gmail.com\", role = \"ctb\"),\nperson(\"Stefan\", \"Müller\", email = \"mullers@tcd.ie\", role = \"ctb\"))",
  "Description": "Functions for importing and handling text files and\nformatted text files with additional meta-data, such including\n'.csv', '.tab', '.json', '.xml', '.html', '.pdf', '.doc',\n'.docx', '.rtf', '.xls', '.xlsx', and others.",
  "License": "GPL-3",
  "URL": "https://readtext.quanteda.io/,\nhttps://github.com/quanteda/readtext",
  "Encoding": "UTF-8",
  "BugReports": "https://github.com/quanteda/readtext/issues",
  "LazyData": "TRUE",
  "VignetteBuilder": "knitr",
  "RoxygenNote": "7.3.2",
  "Roxygen": "list(markdown = TRUE)",
  "Language": "en-GB",
  "Config/pak/sysreqs": "make libicu-dev libjpeg-dev libxml2-dev libssl-dev\nlibpoppler-cpp-dev poppler-data zlib1g-dev",
  "Repository": "https://quanteda.r-universe.dev",
  "Date/Publication": "2025-07-27 09:25:32 UTC",
  "RemoteUrl": "https://github.com/quanteda/readtext",
  "RemoteRef": "HEAD",
  "RemoteSha": "f5a5d26709e5f42da7030088f191998b1774e5b9",
  "NeedsCompilation": "no",
  "Packaged": {
    "Date": "2026-05-29 09:25:20 UTC",
    "User": "root"
  },
  "Author": "Kenneth Benoit [aut, cre, cph],\nAdam Obeng [aut],\nKohei Watanabe [ctb],\nAkitaka Matsuo [ctb],\nPaul Nulty [ctb],\nStefan Müller [ctb]",
  "Maintainer": "Kenneth Benoit <kbenoit@lse.ac.uk>",
  "MD5sum": "41b2edac9cad501e5662c6f60cacf378",
  "_user": "quanteda",
  "_type": "src",
  "_file": "readtext_0.92.1.tar.gz",
  "_fileid": "8411fd88910ccb5ae80fe024a7dadce1b9e6eefea41043fdc68b5cc80edf79d7",
  "_filesize": 3328933,
  "_sha256": "8411fd88910ccb5ae80fe024a7dadce1b9e6eefea41043fdc68b5cc80edf79d7",
  "_created": "2026-05-29T09:25:20.000Z",
  "_published": "2026-05-29T11:03:28.204Z",
  "_distro": "noble",
  "_jobs": [
    {
      "job": 78474074419,
      "time": 130,
      "config": "linux-devel-x86_64",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "7287499450"
    },
    {
      "job": 78474074483,
      "time": 153,
      "config": "linux-release-x86_64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7287506645"
    },
    {
      "job": 78474074448,
      "time": 166,
      "config": "macos-oldrel-arm64",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "7289150186"
    },
    {
      "job": 78474074459,
      "time": 147,
      "config": "macos-release-arm64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7289143569"
    },
    {
      "job": 78473354738,
      "time": 280,
      "config": "source",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7287457279"
    },
    {
      "job": 78474074535,
      "time": 115,
      "config": "wasm-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7287494640"
    },
    {
      "job": 78474074541,
      "time": 97,
      "config": "windows-devel",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "7287489014"
    },
    {
      "job": 78474074489,
      "time": 90,
      "config": "windows-oldrel",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "7287486799"
    },
    {
      "job": 78474074504,
      "time": 93,
      "config": "windows-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7287487833"
    }
  ],
  "_buildurl": "https://github.com/r-universe/quanteda/actions/runs/26629147933",
  "_status": "success",
  "_host": "GitHub-Actions",
  "_upstream": "https://github.com/quanteda/readtext",
  "_commit": {
    "id": "f5a5d26709e5f42da7030088f191998b1774e5b9",
    "author": "kbenoit <kbenoit@lse.ac.uk>",
    "committer": "kbenoit <kbenoit@lse.ac.uk>",
    "message": "Update for 0.92.1 release\n",
    "time": 1753608332
  },
  "_maintainer": {
    "name": "Kenneth Benoit",
    "email": "kbenoit@lse.ac.uk",
    "login": "kbenoit",
    "bluesky": "@kenbenoit.bsky.social",
    "twitter": "@kenbenoit",
    "description": "Professor of Computational Social Science; Dean, School of Social Science, Singapore Management University;\nDirector of non-profit @quanteda Initiative",
    "uuid": 2182246
  },
  "_registered": true,
  "_dependencies": [
    {
      "package": "R",
      "version": ">= 3.6",
      "role": "Depends"
    },
    {
      "package": "antiword",
      "role": "Imports"
    },
    {
      "package": "data.table",
      "role": "Imports"
    },
    {
      "package": "digest",
      "role": "Imports"
    },
    {
      "package": "httr",
      "role": "Imports"
    },
    {
      "package": "jsonlite",
      "version": ">= 0.9.10",
      "role": "Imports"
    },
    {
      "package": "pillar",
      "role": "Imports"
    },
    {
      "package": "pdftools",
      "role": "Imports"
    },
    {
      "package": "readODS",
      "version": ">= 1.7.0",
      "role": "Imports"
    },
    {
      "package": "readxl",
      "role": "Imports"
    },
    {
      "package": "streamR",
      "role": "Imports"
    },
    {
      "package": "stringi",
      "role": "Imports"
    },
    {
      "package": "striprtf",
      "role": "Imports"
    },
    {
      "package": "xml2",
      "role": "Imports"
    },
    {
      "package": "utils",
      "role": "Imports"
    },
    {
      "package": "knitr",
      "role": "Suggests"
    },
    {
      "package": "pkgload",
      "role": "Suggests"
    },
    {
      "package": "rmarkdown",
      "role": "Suggests"
    },
    {
      "package": "quanteda",
      "version": ">= 3.0",
      "role": "Suggests"
    },
    {
      "package": "testthat",
      "role": "Suggests"
    },
    {
      "package": "covr",
      "role": "Suggests"
    },
    {
      "package": "spelling",
      "role": "Suggests"
    }
  ],
  "_owner": "quanteda",
  "_selfowned": true,
  "_usedby": 7,
  "_updates": [
    {
      "week": "2025-30",
      "n": 1
    }
  ],
  "_tags": [],
  "_topics": [
    "encoding",
    "quanteda",
    "text"
  ],
  "_stars": 121,
  "_contributors": [
    {
      "user": "kbenoit",
      "count": 271,
      "uuid": 2182246
    },
    {
      "user": "adamobeng",
      "count": 124,
      "uuid": 776593
    },
    {
      "user": "amatsuo",
      "count": 47,
      "uuid": 8436792
    },
    {
      "user": "koheiw",
      "count": 29,
      "uuid": 6572963
    },
    {
      "user": "chainsawriot",
      "count": 2,
      "uuid": 637269
    },
    {
      "user": "jirkalewandowski",
      "count": 1,
      "uuid": 7399218
    },
    {
      "user": "pmyteh",
      "count": 1,
      "uuid": 890868
    },
    {
      "user": "olivroy",
      "count": 1,
      "uuid": 52606734
    },
    {
      "user": "pnulty",
      "count": 1,
      "uuid": 654540
    }
  ],
  "_userbio": {
    "uuid": 34347233,
    "type": "organization",
    "name": "Quanteda Initiative"
  },
  "_downloads": {
    "count": 4190,
    "source": "https://cranlogs.r-pkg.org/downloads/total/last-month/readtext"
  },
  "_mentions": 1,
  "_devurl": "https://github.com/quanteda/readtext",
  "_pkgdown": "https://readtext.quanteda.io/",
  "_searchresults": 1760,
  "_rbuild": "4.6.0",
  "_assets": [
    "extra/citation.cff",
    "extra/citation.html",
    "extra/citation.json",
    "extra/citation.txt",
    "extra/contents.json",
    "extra/NEWS.html",
    "extra/NEWS.txt",
    "extra/readme.html",
    "extra/readme.md",
    "extra/readtext.html",
    "manual.pdf"
  ],
  "_homeurl": "https://github.com/quanteda/readtext",
  "_realowner": "quanteda",
  "_cranurl": true,
  "_releases": [
    {
      "version": "0.50",
      "date": "2017-05-22"
    },
    {
      "version": "0.70",
      "date": "2018-05-09"
    },
    {
      "version": "0.71",
      "date": "2018-05-10"
    },
    {
      "version": "0.74",
      "date": "2019-05-08"
    },
    {
      "version": "0.75",
      "date": "2019-06-26"
    },
    {
      "version": "0.76",
      "date": "2020-03-04"
    },
    {
      "version": "0.80",
      "date": "2020-09-22"
    },
    {
      "version": "0.81",
      "date": "2021-07-14"
    },
    {
      "version": "0.82",
      "date": "2023-04-06"
    },
    {
      "version": "0.90",
      "date": "2023-06-03"
    },
    {
      "version": "0.91",
      "date": "2024-02-23"
    },
    {
      "version": "0.92.1",
      "date": "2025-08-01"
    }
  ],
  "_exports": [
    "encoding",
    "readtext",
    "readtext_options",
    "texts"
  ],
  "_datasets": [
    {
      "name": "data_char_encodedtexts",
      "title": "encoded texts for testing",
      "object": "data_char_encodedtexts",
      "class": [
        "character"
      ],
      "fields": [],
      "table": false,
      "tojson": false
    }
  ],
  "_help": [
    {
      "page": "readtext-package",
      "title": "Import and handling for plain and formatted text files",
      "topics": [
        "readtext-package"
      ]
    },
    {
      "page": "as.character.readtext",
      "title": "return only the texts from a readtext object",
      "topics": [
        "as.character.readtext"
      ]
    },
    {
      "page": "data_char_encodedtexts",
      "title": "encoded texts for testing",
      "topics": [
        "data_char_encodedtexts"
      ]
    },
    {
      "page": "data_files_encodedtexts",
      "title": "a .zip file of texts containing a variety of differently encoded texts",
      "topics": [
        "data_files_encodedtexts"
      ]
    },
    {
      "page": "encoding",
      "title": "detect the encoding of texts",
      "topics": [
        "encoding"
      ]
    },
    {
      "page": "readtext",
      "title": "read a text file(s)",
      "topics": [
        "readtext"
      ]
    },
    {
      "page": "readtext_options",
      "title": "Get or set package options for readtext",
      "topics": [
        "readtext_options"
      ]
    }
  ],
  "_readme": "https://github.com/quanteda/readtext/raw/HEAD/README.md",
  "_rundeps": [
    "antiword",
    "askpass",
    "bitops",
    "cellranger",
    "cli",
    "cpp11",
    "crayon",
    "curl",
    "data.table",
    "digest",
    "glue",
    "hms",
    "httr",
    "jsonlite",
    "lifecycle",
    "magrittr",
    "mime",
    "minty",
    "ndjson",
    "openssl",
    "pdftools",
    "pillar",
    "pkgconfig",
    "prettyunits",
    "progress",
    "qpdf",
    "R6",
    "Rcpp",
    "RCurl",
    "readODS",
    "readxl",
    "rematch",
    "rjson",
    "rlang",
    "streamR",
    "stringi",
    "stringr",
    "striprtf",
    "sys",
    "tibble",
    "tzdb",
    "utf8",
    "vctrs",
    "withr",
    "xml2",
    "zip"
  ],
  "_vignettes": [
    {
      "source": "readtext_vignette.Rmd",
      "filename": "readtext_vignette.html",
      "title": "Reading text files with readtext",
      "engine": "knitr::rmarkdown",
      "headings": [
        "1. Introduction",
        "2. Reading one or more text files",
        "2.1 Plain text files (.txt)",
        "2.2 Comma- or tab-separated values (.csv, .tab, .tsv)",
        "2.3 JSON data (.json)",
        "2.4 PDF files",
        "2.5 Microsoft Word files (.doc, .docx)",
        "2.6 Text from URLs",
        "2.7 Text from archive files (.zip, .tar, .tar.gz, .tar.bz)",
        "3. Inter-operability with quanteda",
        "4. Solving common problems",
        "4.1 Remove page numbers using regular expressions",
        "4.2 Read files with different encodings"
      ],
      "created": "2017-04-26 17:50:16",
      "modified": "2023-04-06 06:41:47",
      "commits": 15
    }
  ],
  "_score": 10.874791347158776,
  "_indexed": true,
  "_nocasepkg": "readtext",
  "_universes": [
    "quanteda",
    "kbenoit"
  ],
  "_binaries": [
    {
      "r": "4.7.0",
      "os": "linux",
      "version": "0.92.1",
      "date": "2026-05-29T09:27:32.000Z",
      "distro": "noble",
      "commit": "f5a5d26709e5f42da7030088f191998b1774e5b9",
      "fileid": "2c28b43991ae830abc316ab5590316c415b7057e9d391f6642a18069af4e8655",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/quanteda/actions/runs/26629147933"
    },
    {
      "r": "4.6.0",
      "os": "linux",
      "version": "0.92.1",
      "date": "2026-05-29T09:27:50.000Z",
      "distro": "noble",
      "commit": "f5a5d26709e5f42da7030088f191998b1774e5b9",
      "fileid": "157d6186d101931493b6a7960d6e93241b519271c2ea4727963fd548fab9b182",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/quanteda/actions/runs/26629147933"
    },
    {
      "r": "4.5.3",
      "os": "mac",
      "version": "0.92.1",
      "date": "2026-05-29T11:02:24.000Z",
      "commit": "f5a5d26709e5f42da7030088f191998b1774e5b9",
      "fileid": "b79a2b153e407362fbc6f17bdcaab7a4c70f1c68a5ff94677865641cf91f2c88",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/quanteda/actions/runs/26629147933"
    },
    {
      "r": "4.6.0",
      "os": "mac",
      "version": "0.92.1",
      "date": "2026-05-29T11:02:00.000Z",
      "commit": "f5a5d26709e5f42da7030088f191998b1774e5b9",
      "fileid": "59edb2888c1b3562d91559af190dcc93318fb25b2c21a91b6e21503137943e64",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/quanteda/actions/runs/26629147933"
    },
    {
      "r": "4.6.0",
      "os": "wasm",
      "version": "0.92.1",
      "date": "2026-05-29T09:27:35.000Z",
      "commit": "f5a5d26709e5f42da7030088f191998b1774e5b9",
      "fileid": "c592ef8a16eec6f41996b0fbe88ae73f4ec14be6e39c4d754f8b8b446187c66c",
      "status": "success",
      "buildurl": "https://github.com/r-universe/quanteda/actions/runs/26629147933"
    },
    {
      "r": "4.7.0",
      "os": "win",
      "version": "0.92.1",
      "date": "2026-05-29T09:26:46.000Z",
      "commit": "f5a5d26709e5f42da7030088f191998b1774e5b9",
      "fileid": "73b5a4deb8c93f083d065bfce1988ea17f0295247438aad070bf24ca8582e549",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/quanteda/actions/runs/26629147933"
    },
    {
      "r": "4.5.3",
      "os": "win",
      "version": "0.92.1",
      "date": "2026-05-29T09:26:38.000Z",
      "commit": "f5a5d26709e5f42da7030088f191998b1774e5b9",
      "fileid": "f9bb4158f62e1274bd89b0549b9b671824c5538895a7e1f2d05ab9b2d384bf83",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/quanteda/actions/runs/26629147933"
    },
    {
      "r": "4.6.0",
      "os": "win",
      "version": "0.92.1",
      "date": "2026-05-29T09:26:41.000Z",
      "commit": "f5a5d26709e5f42da7030088f191998b1774e5b9",
      "fileid": "69189445a5c2495bdf237f37d24ebef60ceb0b365f60545de949197d7c1ccbf0",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/quanteda/actions/runs/26629147933"
    }
  ]
}