{
  "_id": "6a1f2fdbb401979e73427611",
  "Package": "repboxDoc",
  "Type": "Package",
  "Title": "Heuristically prepare PDF or HTML articles or appendices for\nfurther repbox analysis",
  "Version": "0.1.0",
  "Author": "Sebastian Kranz",
  "Maintainer": "Sebastian Kranz <sebastian.kranz@uni-ulm.de>",
  "Description": "Heuristically prepare PDF or HTML articles or appendices\nfor further repbox analysis",
  "License": "GPL >= 2.0",
  "Encoding": "UTF-8",
  "Config/pak/sysreqs": "cmake libfontconfig1-dev libfreetype6-dev\nlibfribidi-dev git make libharfbuzz-dev libgit2-dev libicu-dev\nlibjpeg-dev libpng-dev libtiff-dev libuv1-dev libwebp-dev\nlibxml2-dev libssl-dev libx11-dev zlib1g-dev",
  "Repository": "https://skranz.r-universe.dev",
  "Date/Publication": "2026-04-15 09:20:28 UTC",
  "RemoteUrl": "https://github.com/repboxr/repboxDoc",
  "RemoteRef": "main",
  "RemoteSha": "e0f14b8502cc1b0d57d0ff83e33db74fe27b2bf5",
  "NeedsCompilation": "no",
  "Packaged": {
    "Date": "2026-05-15 09:05:57 UTC",
    "User": "root"
  },
  "MD5sum": "6f5659386308cdb5dfd33a939f4a1074",
  "_user": "skranz",
  "_type": "src",
  "_file": "repboxDoc_0.1.0.tar.gz",
  "_fileid": "ab51967630024db69b35180d335817a69f1cfdb90d548201b50a5cc3c222d8c8",
  "_filesize": 147132,
  "_sha256": "ab51967630024db69b35180d335817a69f1cfdb90d548201b50a5cc3c222d8c8",
  "_created": "2026-05-15T09:05:57.000Z",
  "_published": "2026-06-02T19:32:43.436Z",
  "_distro": "noble",
  "_jobs": [
    {
      "job": 79155290758,
      "time": 163,
      "config": "linux-devel-x86_64",
      "r": "4.7.0",
      "check": "WARNING",
      "artifact": "7013716685"
    },
    {
      "job": 79155290817,
      "time": 141,
      "config": "linux-release-x86_64",
      "r": "4.6.0",
      "check": "WARNING",
      "artifact": "7013712396"
    },
    {
      "job": 79155291688,
      "time": 78,
      "config": "macos-oldrel-arm64",
      "r": "4.5.3",
      "check": "WARNING",
      "artifact": "7013692909"
    },
    {
      "job": 79155291320,
      "time": 98,
      "config": "macos-release-arm64",
      "r": "4.6.0",
      "check": "WARNING",
      "artifact": "7013698745"
    },
    {
      "job": 79155290376,
      "time": 206,
      "config": "source",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7013670139"
    },
    {
      "job": 79155290341,
      "time": 135,
      "config": "wasm-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7367851536"
    },
    {
      "job": 79155291447,
      "time": 101,
      "config": "windows-devel",
      "r": "4.7.0",
      "check": "WARNING",
      "artifact": "7013699290"
    },
    {
      "job": 79155290932,
      "time": 127,
      "config": "windows-oldrel",
      "r": "4.5.3",
      "check": "WARNING",
      "artifact": "7013707121"
    },
    {
      "job": 79155291065,
      "time": 81,
      "config": "windows-release",
      "r": "4.6.0",
      "check": "WARNING",
      "artifact": "7013694014"
    }
  ],
  "_buildurl": "https://github.com/r-universe/skranz/actions/runs/25909538326",
  "_status": "success",
  "_host": "GitHub-Actions",
  "_upstream": "https://github.com/repboxr/repboxDoc",
  "_commit": {
    "id": "e0f14b8502cc1b0d57d0ff83e33db74fe27b2bf5",
    "author": "skranz-auto <xsx50@uni-ulm.de>",
    "committer": "skranz-auto <xsx50@uni-ulm.de>",
    "message": "Update from server\n",
    "time": 1776244828
  },
  "_maintainer": {
    "name": "Sebastian Kranz",
    "email": "sebastian.kranz@uni-ulm.de",
    "login": "skranz",
    "bluesky": "@sebkranz.bsky.social",
    "uuid": 1413022
  },
  "_registered": true,
  "_dependencies": [
    {
      "package": "R",
      "version": ">= 3.5.0",
      "role": "Depends"
    },
    {
      "package": "repboxUtils",
      "role": "Depends"
    },
    {
      "package": "restorepoint",
      "role": "Depends"
    },
    {
      "package": "stringi",
      "role": "Depends"
    },
    {
      "package": "tidyr",
      "role": "Depends"
    },
    {
      "package": "dplyr",
      "role": "Depends"
    },
    {
      "package": "stringtools",
      "role": "Depends"
    },
    {
      "package": "ExtractSciTab",
      "role": "Depends"
    },
    {
      "package": "repboxTableTools",
      "role": "Depends"
    }
  ],
  "_owner": "repboxr",
  "_selfowned": true,
  "_usedby": 1,
  "_updates": [
    {
      "week": "2025-26",
      "n": 1
    },
    {
      "week": "2025-27",
      "n": 1
    },
    {
      "week": "2025-52",
      "n": 1
    },
    {
      "week": "2026-13",
      "n": 2
    },
    {
      "week": "2026-16",
      "n": 1
    }
  ],
  "_tags": [],
  "_stars": 0,
  "_contributors": [
    {
      "user": "skranz-auto",
      "count": 12,
      "uuid": 124874982
    },
    {
      "user": "skranz",
      "count": 1,
      "uuid": 1413022
    }
  ],
  "_userbio": {
    "uuid": 1413022,
    "type": "user",
    "name": "Sebastian Kranz"
  },
  "_downloads": {
    "count": 0,
    "source": "https://cranlogs.r-pkg.org/downloads/total/last-month/repboxDoc"
  },
  "_devurl": "https://github.com/repboxr/repboxdoc",
  "_searchresults": 8,
  "_rbuild": "4.6.0",
  "_assets": [
    "extra/citation.cff",
    "extra/citation.html",
    "extra/citation.json",
    "extra/citation.txt",
    "extra/contents.json",
    "extra/readme.html",
    "extra/readme.md",
    "extra/repboxDoc.html",
    "manual.pdf"
  ],
  "_cranurl": false,
  "_exports": [
    "bind_rows_with_parent_fields",
    "cell_df_join",
    "cell_df_to_tabhtml",
    "change_file_ext",
    "check_and_repair_footnote_candidates",
    "combine_short_paragraphs",
    "combine_text_lines",
    "doc_dir_to_artid",
    "doc_dir_to_project_dir",
    "ecta_parse_html",
    "ecta_parse_html_table",
    "ends.with.text",
    "ensure_empty_types",
    "example",
    "example_mocr_make",
    "extract_all_to_index_df",
    "extract_num_from_sequence_text",
    "extract_order_num_from_sequence_text",
    "find_wrong_mocr",
    "first_repair_rdoc_pdf_text",
    "first.non.null",
    "from_to",
    "get_phrases_def",
    "guess_journ_from_artid",
    "html_tab_cell_row_panel_df",
    "html_table_cells_from_all_tr",
    "html_table_cells_from_tr",
    "html_text_part_df_standardize",
    "identify_figure_lines_on_page",
    "is_aer_pandp",
    "is_really_a_note_line",
    "is.true",
    "jpe_parse_html",
    "jpe_parse_html_table",
    "keep.overlapping.loc",
    "left_join_overlap",
    "line_df_find_figures",
    "line_df_find_footnotes",
    "line_df_find_junk_lines",
    "line_df_find_page_header_footer",
    "line_df_find_section_cands",
    "line_df_find_sections",
    "line_df_to_part_df",
    "lines_to_pages",
    "lines_to_plines",
    "load_phrases_def",
    "loc_sep_lines",
    "loc_to_df",
    "locate_all_as_df",
    "locate_col_refs_in_txt",
    "locate_sentences_in_txt",
    "locate_tab_fig_refs_in_txt",
    "make_phrases_def",
    "map_loc_to_parent_loc",
    "match_overlap",
    "mocr_copy_to_ejs",
    "mocr_html_extract_tables",
    "mocr_make_ocr",
    "mocr_md_to_html_by_page",
    "mocr_md_to_html_mono",
    "mocr_parse_html_parts",
    "most.common",
    "ms_parse_html",
    "ms_parse_html_table",
    "my_pandoc",
    "my_rank",
    "na.false",
    "na.remove",
    "na.val",
    "pdf_to_txt_pages",
    "plines_to_lines",
    "rdoc_document_url",
    "rdoc_find_in_text_fixed",
    "rdoc_form",
    "rdoc_guess_journ",
    "rdoc_has_art_mocr",
    "rdoc_has_html",
    "rdoc_has_pdf",
    "rdoc_has_two_col",
    "rdoc_html_file",
    "rdoc_html_process",
    "rdoc_html_tab_standardize",
    "rdoc_html_to_parts",
    "rdoc_is_processed",
    "rdoc_load_art_meta_data",
    "rdoc_load_page_df",
    "rdoc_load_part_df",
    "rdoc_load_ref_li",
    "rdoc_load_sent_df",
    "rdoc_load_tab_df",
    "rdoc_load_with_cache",
    "rdoc_mocr_process",
    "rdoc_options",
    "rdoc_opts",
    "rdoc_pdf_extract_raw_tabs",
    "rdoc_pdf_extract_tabs",
    "rdoc_pdf_file",
    "rdoc_pdf_pages_to_parts",
    "rdoc_pdf_process",
    "rdoc_pdf_to_txt_pages",
    "rdoc_phrase_analysis",
    "rdoc_process",
    "rdoc_refs_analysis",
    "rdoc_repair_two_col",
    "rdoc_repair_two_col_aer_pandp",
    "rdoc_sent_df",
    "rdoc_steps_from",
    "rdoc_tab_fig_refs",
    "rdoc_tab_phrase_analysis",
    "rdoc_tab_ref_text",
    "rdoc_tabs_file",
    "rdoc_text_parts_phrase_analysis",
    "rdoc_type",
    "rdoc_update_project",
    "readRDS.or.null",
    "refine_cell_df_and_add_panel_info",
    "remove_nested_html_elements",
    "remove.cols",
    "remove.overlapping.loc",
    "repair_ejd_files_art_mocr",
    "repbox_all_pdf_file",
    "repbox_doc_dirs",
    "repbox_doc_file_select",
    "repbox_doc_files_info",
    "repbox_doc_types",
    "repbox_journ_list",
    "repbox_pdf_file",
    "repbox_process_all_docs",
    "repbox_rdoc_opts",
    "restat_parse_html",
    "restud_parse_html",
    "restud_parse_html_table",
    "rle_block",
    "rle_cummax_block",
    "rle_table",
    "save_rds_create_dir",
    "sentences_merge_with_next",
    "seq_rows",
    "show_cell_df_html",
    "substitute_wrong_pdf_txt_chars",
    "text_df_add_section_cols",
    "text_parts_tab_fig_references",
    "text_parts_to_loc",
    "txt_locate_keywords",
    "txt_locate_rx_keywords",
    "txt_locate_typed_keywords",
    "txt_phrase_analysis"
  ],
  "_help": [],
  "_readme": "https://github.com/repboxr/repboxDoc/raw/main/README.md",
  "_rundeps": [
    "askpass",
    "base64enc",
    "brew",
    "brio",
    "bslib",
    "cachem",
    "callr",
    "cli",
    "clipr",
    "commonmark",
    "cpp11",
    "crayon",
    "credentials",
    "curl",
    "data.table",
    "desc",
    "devtools",
    "diffobj",
    "digest",
    "downlit",
    "dplyr",
    "ellipsis",
    "evaluate",
    "ExtractSciTab",
    "fansi",
    "fastmap",
    "fontawesome",
    "fs",
    "generics",
    "gert",
    "gh",
    "gitcreds",
    "glue",
    "highr",
    "htmltools",
    "htmlwidgets",
    "httpuv",
    "httr",
    "httr2",
    "ini",
    "jquerylib",
    "jsonlite",
    "knitr",
    "later",
    "lifecycle",
    "magrittr",
    "memoise",
    "mime",
    "miniUI",
    "openssl",
    "otel",
    "pak",
    "pillar",
    "pkgbuild",
    "pkgconfig",
    "pkgdown",
    "pkgload",
    "praise",
    "prettyunits",
    "processx",
    "profvis",
    "promises",
    "ps",
    "purrr",
    "R6",
    "ragg",
    "rappdirs",
    "rcmdcheck",
    "Rcpp",
    "repboxDB",
    "repboxTableTools",
    "repboxUtils",
    "restorepoint",
    "rlang",
    "rmarkdown",
    "roxygen2",
    "rprojroot",
    "rstudioapi",
    "rversions",
    "rvest",
    "sass",
    "selectr",
    "sessioninfo",
    "shiny",
    "sourcetools",
    "stringi",
    "stringr",
    "stringtools",
    "sys",
    "systemfonts",
    "testthat",
    "textshaping",
    "tibble",
    "tidyr",
    "tidyselect",
    "tinytex",
    "urlchecker",
    "usethis",
    "utf8",
    "vctrs",
    "waldo",
    "whisker",
    "withr",
    "xfun",
    "xml2",
    "xopen",
    "xtable",
    "yaml",
    "zip"
  ],
  "_score": 2.8750612633917,
  "_indexed": false,
  "_nocasepkg": "repboxdoc",
  "_universes": [
    "skranz"
  ],
  "_indexurl": "https://repboxr.r-universe.dev/repboxDoc",
  "_binaries": [
    {
      "r": "4.7.0",
      "os": "linux",
      "version": "0.1.0",
      "date": "2026-05-15T09:08:36.000Z",
      "distro": "noble",
      "commit": "e0f14b8502cc1b0d57d0ff83e33db74fe27b2bf5",
      "fileid": "466cf7af486966b08702a118177623020b320d74741ba8cc7861c048102bfda5",
      "status": "success",
      "check": "WARNING",
      "buildurl": "https://github.com/r-universe/skranz/actions/runs/25909538326"
    },
    {
      "r": "4.6.0",
      "os": "linux",
      "version": "0.1.0",
      "date": "2026-05-15T09:08:26.000Z",
      "distro": "noble",
      "commit": "e0f14b8502cc1b0d57d0ff83e33db74fe27b2bf5",
      "fileid": "c70194406fd5dea112c8cb1be57af353bf344860ba76adeae8f3ee29cfeb5089",
      "status": "success",
      "check": "WARNING",
      "buildurl": "https://github.com/r-universe/skranz/actions/runs/25909538326"
    },
    {
      "r": "4.5.3",
      "os": "mac",
      "version": "0.1.0",
      "date": "2026-05-15T09:07:22.000Z",
      "commit": "e0f14b8502cc1b0d57d0ff83e33db74fe27b2bf5",
      "fileid": "70a657c8d4d8cbaa65cb0484481fa62f80125a1b2d0575b1f7c743e52d8c69f1",
      "status": "success",
      "check": "WARNING",
      "buildurl": "https://github.com/r-universe/skranz/actions/runs/25909538326"
    },
    {
      "r": "4.6.0",
      "os": "mac",
      "version": "0.1.0",
      "date": "2026-05-15T09:07:40.000Z",
      "commit": "e0f14b8502cc1b0d57d0ff83e33db74fe27b2bf5",
      "fileid": "f41372c801c76ac1c71511dd154a4323565b69ecd9f50a4e7dcb116a7954e82e",
      "status": "success",
      "check": "WARNING",
      "buildurl": "https://github.com/r-universe/skranz/actions/runs/25909538326"
    },
    {
      "r": "4.7.0",
      "os": "win",
      "version": "0.1.0",
      "date": "2026-05-15T09:07:32.000Z",
      "commit": "e0f14b8502cc1b0d57d0ff83e33db74fe27b2bf5",
      "fileid": "c053b1777a3fe96a2e889e7d99f3772ad13cebdc6b77664ac2cac44bb85c5e12",
      "status": "success",
      "check": "WARNING",
      "buildurl": "https://github.com/r-universe/skranz/actions/runs/25909538326"
    },
    {
      "r": "4.5.3",
      "os": "win",
      "version": "0.1.0",
      "date": "2026-05-15T09:08:04.000Z",
      "commit": "e0f14b8502cc1b0d57d0ff83e33db74fe27b2bf5",
      "fileid": "e6e8d48ea3206fe4534f095e4d79e46552f94a41a54d34927720660f1a0c7e1e",
      "status": "success",
      "check": "WARNING",
      "buildurl": "https://github.com/r-universe/skranz/actions/runs/25909538326"
    },
    {
      "r": "4.6.0",
      "os": "win",
      "version": "0.1.0",
      "date": "2026-05-15T09:07:14.000Z",
      "commit": "e0f14b8502cc1b0d57d0ff83e33db74fe27b2bf5",
      "fileid": "76520032ba17966c6924520573a013ff2ef7162c07b1894f2a79191340a737e7",
      "status": "success",
      "check": "WARNING",
      "buildurl": "https://github.com/r-universe/skranz/actions/runs/25909538326"
    },
    {
      "r": "4.6.0",
      "os": "wasm",
      "version": "0.1.0",
      "date": "2026-06-02T19:32:27.000Z",
      "commit": "e0f14b8502cc1b0d57d0ff83e33db74fe27b2bf5",
      "fileid": "ebfbf13a9a0518cf52c4a0b85381beaa7334cb10c76fe264f574383c63dd66eb",
      "status": "success",
      "buildurl": "https://github.com/r-universe/skranz/actions/runs/25909538326"
    }
  ]
}