{
  "_id": "6a107001acfb0bcc41cab85d",
  "Package": "docxtractr",
  "Title": "Extract Data Tables and Comments from 'Microsoft' 'Word'\nDocuments",
  "Version": "0.6.5",
  "Authors@R": "c(\nperson(\"Bob\", \"Rudis\", email = \"bob@rud.is\", role = c(\"aut\", \"cre\"),\ncomment = c(ORCID = \"0000-0001-5670-2640\")),\nperson(\"Mark\", \"Dulhunty\", role = c(\"ctb\")),\nperson(\"Karlo\", \"Guidoni-Martins\", role = c(\"ctb\"), email = \"kguidonimartins@gmail.com\"),\nperson(\"Chris\", \"Muir\", email = \"chrismuirrva@gmail.com\", role = c(\"aut\", \"ctb\"))\n)",
  "Maintainer": "Bob Rudis <bob@rud.is>",
  "Description": "'Microsoft Word' 'docx' files provide an 'XML' structure\nthat is fairly straightforward to navigate, especially when it\napplies to 'Word' tables and comments. Tools are provided to\ndetermine table count/structure, comment count and also to\nextract/clean tables and comments from 'Microsoft Word' 'docx'\ndocuments. There is also nascent support for '.doc' files.",
  "SystemRequirements": "LibreOffice (<https://www.libreoffice.org/>)\nrequired to extract data from .doc files or perform .pptx\nconversion.",
  "URL": "http://gitlab.com/hrbrmstr/docxtractr",
  "BugReports": "https://gitlab.com/hrbrmstr/docxtractr/issues",
  "Encoding": "UTF-8",
  "License": "MIT + file LICENSE",
  "RoxygenNote": "7.1.0",
  "Config/pak/sysreqs": "libxml2-dev libssl-dev",
  "Repository": "https://hrbrmstr.r-universe.dev",
  "Date/Publication": "2020-07-04 12:32:47 UTC",
  "RemoteUrl": "https://github.com/hrbrmstr/docxtractr",
  "RemoteRef": "HEAD",
  "RemoteSha": "a2855a442d4bbe87232ebd3b023002d9e73bbc5b",
  "NeedsCompilation": "no",
  "Packaged": {
    "Date": "2026-05-07 07:25:00 UTC",
    "User": "root"
  },
  "Author": "Bob Rudis [aut, cre] (ORCID: <https://orcid.org/0000-0001-5670-2640>),\nMark Dulhunty [ctb],\nKarlo Guidoni-Martins [ctb],\nChris Muir [aut, ctb]",
  "MD5sum": "2b92e9611f6a4d001c30227901bef85f",
  "_user": "hrbrmstr",
  "_type": "src",
  "_file": "docxtractr_0.6.5.tar.gz",
  "_fileid": "99dc5e1b476a62a95276603db882455c000494adcb5b1be554c74314cd68c44d",
  "_filesize": 621274,
  "_sha256": "99dc5e1b476a62a95276603db882455c000494adcb5b1be554c74314cd68c44d",
  "_created": "2026-05-07T07:25:00.000Z",
  "_published": "2026-05-22T15:02:25.425Z",
  "_distro": "noble",
  "_jobs": [
    {
      "job": 77406047973,
      "time": 151,
      "config": "linux-devel-x86_64",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "6849290680"
    },
    {
      "job": 77406047971,
      "time": 125,
      "config": "linux-release-x86_64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "6849281539"
    },
    {
      "job": 77406048978,
      "time": 79,
      "config": "macos-oldrel-arm64",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "6849268359"
    },
    {
      "job": 77406048039,
      "time": 75,
      "config": "macos-release-arm64",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "6849267187"
    },
    {
      "job": 77406047628,
      "time": 167,
      "config": "source",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "6849245381"
    },
    {
      "job": 77406047548,
      "time": 132,
      "config": "wasm-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7163688497"
    },
    {
      "job": 77406048685,
      "time": 88,
      "config": "windows-devel",
      "r": "4.7.0",
      "check": "OK",
      "artifact": "6849271115"
    },
    {
      "job": 77406049135,
      "time": 80,
      "config": "windows-oldrel",
      "r": "4.5.3",
      "check": "OK",
      "artifact": "6849268487"
    },
    {
      "job": 77406048783,
      "time": 66,
      "config": "windows-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "6849264676"
    }
  ],
  "_buildurl": "https://github.com/r-universe/hrbrmstr/actions/runs/25481966510",
  "_status": "success",
  "_host": "GitHub-Actions",
  "_upstream": "https://github.com/hrbrmstr/docxtractr",
  "_commit": {
    "id": "a2855a442d4bbe87232ebd3b023002d9e73bbc5b",
    "author": "hrbrmstr <bob@rud.is>",
    "committer": "hrbrmstr <bob@rud.is>",
    "message": "cran check errors fixes\n",
    "time": 1593865967
  },
  "_maintainer": {
    "name": "Bob Rudis",
    "email": "bob@rud.is",
    "login": "hrbrmstr",
    "mastodon": "@hrbrmstr@mastodon.social",
    "bluesky": "@hrbrmstr.dev",
    "orcid": "0000-0001-5670-2640",
    "uuid": 509878
  },
  "_registered": true,
  "_dependencies": [
    {
      "package": "R",
      "version": ">= 3.6.0",
      "role": "Depends"
    },
    {
      "package": "tools",
      "role": "Imports"
    },
    {
      "package": "xml2",
      "role": "Imports"
    },
    {
      "package": "purrr",
      "role": "Imports"
    },
    {
      "package": "dplyr",
      "role": "Imports"
    },
    {
      "package": "utils",
      "role": "Imports"
    },
    {
      "package": "httr",
      "role": "Imports"
    },
    {
      "package": "magrittr",
      "role": "Imports"
    },
    {
      "package": "covr",
      "role": "Suggests"
    },
    {
      "package": "tinytest",
      "role": "Suggests"
    }
  ],
  "_owner": "hrbrmstr",
  "_selfowned": true,
  "_usedby": 0,
  "_updates": [],
  "_tags": [],
  "_topics": [
    "docx",
    "extract-tables",
    "microsoft-word",
    "table-extraction"
  ],
  "_stars": 178,
  "_contributors": [
    {
      "user": "hrbrmstr",
      "count": 47,
      "uuid": 509878
    },
    {
      "user": "muschellij2",
      "count": 18,
      "uuid": 1075118
    },
    {
      "user": "chrismuir",
      "count": 7,
      "uuid": 13386824
    },
    {
      "user": "markdly",
      "count": 4,
      "uuid": 8509894
    },
    {
      "user": "jimhester",
      "count": 1,
      "uuid": 205275
    },
    {
      "user": "kguidonimartins",
      "count": 1,
      "uuid": 8163542
    },
    {
      "user": "ironholds",
      "count": 1,
      "uuid": 2487262
    },
    {
      "user": "sangeetabhatia03",
      "count": 1,
      "uuid": 15316049
    }
  ],
  "_userbio": {
    "uuid": 509878,
    "type": "user",
    "name": "boB Rudis",
    "description": "🇺🇦 Pampa • Don't look at me…I do what he does—just slower. #rstats avuncular•👨‍🍳•✝️• 💤• Distinguished Engineer @ Censys + CMU Lecturer"
  },
  "_downloads": {
    "count": 1136,
    "source": "https://cranlogs.r-pkg.org/downloads/total/last-month/docxtractr"
  },
  "_devurl": "https://gitlab.com/hrbrmstr/docxtractr",
  "_searchresults": 222,
  "_rbuild": "4.6.0",
  "_assets": [
    "extra/citation.cff",
    "extra/citation.html",
    "extra/citation.json",
    "extra/citation.txt",
    "extra/contents.json",
    "extra/docxtractr.html",
    "extra/NEWS.html",
    "extra/NEWS.txt",
    "extra/readme.html",
    "extra/readme.md",
    "manual.pdf"
  ],
  "_homeurl": "https://github.com/hrbrmstr/docxtractr",
  "_realowner": "hrbrmstr",
  "_cranurl": true,
  "_releases": [
    {
      "version": "0.1.0.9000",
      "date": "2015-08-29"
    },
    {
      "version": "0.2.0",
      "date": "2016-07-20"
    },
    {
      "version": "0.5.0",
      "date": "2018-09-18"
    },
    {
      "version": "0.6.1",
      "date": "2019-01-09"
    },
    {
      "version": "0.6.2",
      "date": "2020-06-13"
    },
    {
      "version": "0.6.3",
      "date": "2020-06-13"
    },
    {
      "version": "0.6.5",
      "date": "2020-07-05"
    }
  ],
  "_exports": [
    "%>%",
    "assign_colnames",
    "convert_to_pdf",
    "docx_cmnt_count",
    "docx_describe_cmnts",
    "docx_describe_tbls",
    "docx_extract_all",
    "docx_extract_all_cmnts",
    "docx_extract_all_tbls",
    "docx_extract_tbl",
    "docx_tbl_count",
    "mcga",
    "read_docx",
    "set_libreoffice_path"
  ],
  "_help": [
    {
      "page": "assign_colnames",
      "title": "Make a specific row the column names for the specified data.frame",
      "topics": [
        "assign_colnames"
      ]
    },
    {
      "page": "convert_to_pdf",
      "title": "Convert a Document (usually PowerPoint) to a PDF",
      "topics": [
        "convert_to_pdf"
      ]
    },
    {
      "page": "docx_cmnt_count",
      "title": "Get number of comments in a Word document",
      "topics": [
        "docx_cmnt_count"
      ]
    },
    {
      "page": "docx_describe_cmnts",
      "title": "Returns information about the comments in the Word document",
      "topics": [
        "docx_describe_cmnts"
      ]
    },
    {
      "page": "docx_describe_tbls",
      "title": "Returns a description of all the tables in the Word document",
      "topics": [
        "docx_describe_tbls"
      ]
    },
    {
      "page": "docx_extract_all",
      "title": "Extract all tables from a Word document",
      "topics": [
        "docx_extract_all"
      ]
    },
    {
      "page": "docx_extract_all_cmnts",
      "title": "Extract all comments from a Word document",
      "topics": [
        "docx_extract_all_cmnts"
      ]
    },
    {
      "page": "docx_extract_all_tbls",
      "title": "Extract all tables from a Word document",
      "topics": [
        "docx_extract_all_tbls"
      ]
    },
    {
      "page": "docx_extract_tbl",
      "title": "Extract a table from a Word document",
      "topics": [
        "docx_extract_tbl"
      ]
    },
    {
      "page": "docx_tbl_count",
      "title": "Get number of tables in a Word document",
      "topics": [
        "docx_tbl_count"
      ]
    },
    {
      "page": "docxtractr",
      "title": "Extract Data Tables and Comments from 'Microsoft' 'Word' Documents",
      "topics": [
        "docxtractr"
      ]
    },
    {
      "page": "mcga",
      "title": "Make Column Names Great Again",
      "topics": [
        "mcga"
      ]
    },
    {
      "page": "print.docx",
      "title": "Display information about the document",
      "topics": [
        "print.docx"
      ]
    },
    {
      "page": "read_docx",
      "title": "Read in a Word document for table extraction",
      "topics": [
        "read_docx"
      ]
    },
    {
      "page": "set_libreoffice_path",
      "title": "Point to Local soffice.exe File",
      "topics": [
        "set_libreoffice_path"
      ]
    }
  ],
  "_readme": "https://github.com/hrbrmstr/docxtractr/raw/HEAD/README.md",
  "_rundeps": [
    "askpass",
    "cli",
    "curl",
    "dplyr",
    "generics",
    "glue",
    "httr",
    "jsonlite",
    "lifecycle",
    "magrittr",
    "mime",
    "openssl",
    "pillar",
    "pkgconfig",
    "purrr",
    "R6",
    "rlang",
    "sys",
    "tibble",
    "tidyselect",
    "utf8",
    "vctrs",
    "withr",
    "xml2"
  ],
  "_score": 7.196219352484808,
  "_indexed": true,
  "_nocasepkg": "docxtractr",
  "_universes": [
    "hrbrmstr",
    "gitlab-hrbrmstr"
  ],
  "_binaries": [
    {
      "r": "4.7.0",
      "os": "linux",
      "version": "0.6.5",
      "date": "2026-05-07T07:27:35.000Z",
      "distro": "noble",
      "commit": "a2855a442d4bbe87232ebd3b023002d9e73bbc5b",
      "fileid": "4ca2751b807bf152718947361b1faa1d895024f6472447e6f9de5ba65253a98b",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/hrbrmstr/actions/runs/25481966510"
    },
    {
      "r": "4.6.0",
      "os": "linux",
      "version": "0.6.5",
      "date": "2026-05-07T07:27:02.000Z",
      "distro": "noble",
      "commit": "a2855a442d4bbe87232ebd3b023002d9e73bbc5b",
      "fileid": "9e133ecdff33c17fc4035110841ed169429bb7fe06efc1b5ecedd9be5838a100",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/hrbrmstr/actions/runs/25481966510"
    },
    {
      "r": "4.5.3",
      "os": "mac",
      "version": "0.6.5",
      "date": "2026-05-07T07:26:25.000Z",
      "commit": "a2855a442d4bbe87232ebd3b023002d9e73bbc5b",
      "fileid": "838a521e22cafdfc1964a6f220c4f3bf1500969e63d4985964b46363aac56e65",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/hrbrmstr/actions/runs/25481966510"
    },
    {
      "r": "4.6.0",
      "os": "mac",
      "version": "0.6.5",
      "date": "2026-05-07T07:26:20.000Z",
      "commit": "a2855a442d4bbe87232ebd3b023002d9e73bbc5b",
      "fileid": "cae666e963b4b85b1785b189b5e1dfbced23837d73ed0c9cc608ca4befda296b",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/hrbrmstr/actions/runs/25481966510"
    },
    {
      "r": "4.7.0",
      "os": "win",
      "version": "0.6.5",
      "date": "2026-05-07T07:26:13.000Z",
      "commit": "a2855a442d4bbe87232ebd3b023002d9e73bbc5b",
      "fileid": "1054c55af4bf26cff7e6aac3e3219f33801f3c7c3e37e78793c004b870c35dc0",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/hrbrmstr/actions/runs/25481966510"
    },
    {
      "r": "4.5.3",
      "os": "win",
      "version": "0.6.5",
      "date": "2026-05-07T07:26:09.000Z",
      "commit": "a2855a442d4bbe87232ebd3b023002d9e73bbc5b",
      "fileid": "dbb0243dc579ee556f5b2933a835f99d1a9697ab70660467ba1bb8e9e03ba5b1",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/hrbrmstr/actions/runs/25481966510"
    },
    {
      "r": "4.6.0",
      "os": "win",
      "version": "0.6.5",
      "date": "2026-05-07T07:26:01.000Z",
      "commit": "a2855a442d4bbe87232ebd3b023002d9e73bbc5b",
      "fileid": "690445c6ca8238777637a85b62164968592d08141875a9e92ee2cb5667ac4b3d",
      "status": "success",
      "check": "OK",
      "buildurl": "https://github.com/r-universe/hrbrmstr/actions/runs/25481966510"
    },
    {
      "r": "4.6.0",
      "os": "wasm",
      "version": "0.6.5",
      "date": "2026-05-22T15:02:08.000Z",
      "commit": "a2855a442d4bbe87232ebd3b023002d9e73bbc5b",
      "fileid": "b372bc3ae5ac2188484cc5b276b1a4fad8af3836a2731bc7b0d9a13e05e7d1f6",
      "status": "success",
      "buildurl": "https://github.com/r-universe/hrbrmstr/actions/runs/25481966510"
    }
  ]
}