{
  "_id": "6a0f6a6bacfb0bcc41c5e1ee",
  "Package": "eHDPrep",
  "Type": "Package",
  "Title": "Quality Control and Semantic Enrichment of Datasets",
  "Version": "1.4.0",
  "Authors@R": "c(person(\"Tom\", \"Toner\", role = c(\"aut\"),\nemail = \"ttoner03@qub.ac.uk\",\ncomment = c(ORCID = \"0000-0001-8059-5822\")),\nperson(\"Ian\", \"Overton\", role = c(\"aut\", \"cre\"),\nemail = \"I.Overton@qub.ac.uk\",\ncomment = c(ORCID = \"0000-0003-1158-8527\"))\n)",
  "Maintainer": "Ian Overton <I.Overton@qub.ac.uk>",
  "Description": "A tool for the preparation and enrichment of health\ndatasets for analysis (Toner et al. (2023)\n<doi:10.1093/gigascience/giad030>). Provides functionality for\nassessing data quality and for improving the reliability and\nmachine interpretability of a dataset. 'eHDPrep' also enables\nsemantic enrichment of a dataset where metavariables are\ndiscovered from the relationships between input variables\ndetermined from user-provided ontologies.",
  "License": "GPL-3",
  "URL": "https://github.com/overton-group/eHDPrep",
  "BugReports": "https://github.com/overton-group/eHDPrep/issues",
  "Encoding": "UTF-8",
  "LazyData": "true",
  "RoxygenNote": "7.3.3",
  "BuildVignettes": "true",
  "VignetteBuilder": "knitr",
  "Config/testthat/edition": "3",
  "Config/pak/sysreqs": "cmake libfontconfig1-dev libfreetype6-dev\nlibfribidi-dev libglpk-dev make libharfbuzz-dev libicu-dev\nlibpng-dev libuv1-dev libxml2-dev libx11-dev",
  "Repository": "https://overton-group.r-universe.dev",
  "Date/Publication": "2026-02-20 15:17:59 UTC",
  "RemoteUrl": "https://github.com/overton-group/ehdprep",
  "RemoteRef": "HEAD",
  "RemoteSha": "887f3b12c191e883c394bbd0cb8c6ca90393c6bc",
  "NeedsCompilation": "no",
  "Packaged": {
    "Date": "2026-05-21 08:46:55 UTC",
    "User": "root"
  },
  "Author": "Tom Toner [aut] (ORCID: <https://orcid.org/0000-0001-8059-5822>),\nIan Overton [aut, cre] (ORCID: <https://orcid.org/0000-0003-1158-8527>)",
  "MD5sum": "cc708aadcabd8526b6c68a55beadfb0b",
  "_user": "overton-group",
  "_type": "src",
  "_file": "eHDPrep_1.4.0.tar.gz",
  "_fileid": "7279b0b4f06e816517cc05f526e6f579b5154d595829d394eaf4665ae2a14975",
  "_filesize": 3929896,
  "_sha256": "7279b0b4f06e816517cc05f526e6f579b5154d595829d394eaf4665ae2a14975",
  "_created": "2026-05-21T08:46:55.000Z",
  "_published": "2026-05-21T20:26:19.868Z",
  "_distro": "noble",
  "_jobs": [
    {
      "job": 77261823771,
      "time": 237,
      "config": "linux-devel-x86_64",
      "r": "4.7.0",
      "check": "NOTE",
      "artifact": "7131342310"
    },
    {
      "job": 77261824138,
      "time": 231,
      "config": "linux-release-x86_64",
      "r": "4.6.0",
      "check": "NOTE",
      "artifact": "7131339884"
    },
    {
      "job": 77261823861,
      "time": 207,
      "config": "macos-oldrel-arm64",
      "r": "4.5.3",
      "check": "NOTE",
      "artifact": "7131319505"
    },
    {
      "job": 77261824445,
      "time": 183,
      "config": "macos-release-arm64",
      "r": "4.6.0",
      "check": "NOTE",
      "artifact": "7131313692"
    },
    {
      "job": 77261823685,
      "time": 284,
      "config": "source",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7131259282"
    },
    {
      "job": 77261823563,
      "time": 150,
      "config": "wasm-release",
      "r": "4.6.0",
      "check": "OK",
      "artifact": "7146401841"
    },
    {
      "job": 77261823888,
      "time": 187,
      "config": "windows-devel",
      "r": "4.7.0",
      "check": "NOTE",
      "artifact": "7131324816"
    },
    {
      "job": 77261823916,
      "time": 155,
      "config": "windows-oldrel",
      "r": "4.5.3",
      "check": "NOTE",
      "artifact": "7131313841"
    },
    {
      "job": 77261824032,
      "time": 180,
      "config": "windows-release",
      "r": "4.6.0",
      "check": "NOTE",
      "artifact": "7131322095"
    }
  ],
  "_buildurl": "https://github.com/r-universe/overton-group/actions/runs/26215360756",
  "_status": "success",
  "_host": "GitHub-Actions",
  "_upstream": "https://github.com/overton-group/ehdprep",
  "_commit": {
    "id": "887f3b12c191e883c394bbd0cb8c6ca90393c6bc",
    "author": "kboakyeduah <kluivertboakyejnr@gmail.com>",
    "committer": "kboakyeduah <kluivertboakyejnr@gmail.com>",
    "message": "updates to r.yml\n",
    "time": 1771600679
  },
  "_maintainer": {
    "name": "Ian Overton",
    "email": "i.overton@qub.ac.uk",
    "login": "ianoverton",
    "description": "",
    "uuid": 46562629,
    "orcid": "0000-0003-1158-8527"
  },
  "_registered": true,
  "_dependencies": [
    {
      "package": "R",
      "version": ">= 3.6.0",
      "role": "Depends"
    },
    {
      "package": "ggplot2",
      "version": ">= 3.3.3",
      "role": "Imports"
    },
    {
      "package": "dplyr",
      "version": ">= 1.1.0",
      "role": "Imports"
    },
    {
      "package": "forcats",
      "version": ">= 0.5.0",
      "role": "Imports"
    },
    {
      "package": "stringr",
      "version": ">= 1.4.0",
      "role": "Imports"
    },
    {
      "package": "purrr",
      "version": ">= 0.3.4",
      "role": "Imports"
    },
    {
      "package": "tidyr",
      "version": ">= 1.1.2",
      "role": "Imports"
    },
    {
      "package": "kableExtra",
      "version": ">= 1.3.1",
      "role": "Imports"
    },
    {
      "package": "magrittr",
      "version": ">= 2.0.1",
      "role": "Imports"
    },
    {
      "package": "tibble",
      "version": ">= 3.0.5",
      "role": "Imports"
    },
    {
      "package": "scales",
      "version": ">= 1.1.1",
      "role": "Imports"
    },
    {
      "package": "rlang",
      "version": ">= 0.4.10",
      "role": "Imports"
    },
    {
      "package": "quanteda",
      "version": ">= 2.1.2",
      "role": "Imports"
    },
    {
      "package": "tm",
      "version": ">= 0.7-8",
      "role": "Imports"
    },
    {
      "package": "pheatmap",
      "version": ">= 1.0.12",
      "role": "Imports"
    },
    {
      "package": "igraph",
      "version": ">= 1.2.6",
      "role": "Imports"
    },
    {
      "package": "tidygraph",
      "version": ">= 1.2.0",
      "role": "Imports"
    },
    {
      "package": "readr",
      "version": ">= 1.4.0",
      "role": "Imports"
    },
    {
      "package": "readxl",
      "version": ">= 1.3.1",
      "role": "Imports"
    },
    {
      "package": "knitr",
      "version": ">= 1.31",
      "role": "Imports"
    },
    {
      "package": "testthat",
      "version": ">= 2.1.0",
      "role": "Suggests"
    },
    {
      "package": "ggraph",
      "version": ">= 2.0.5",
      "role": "Suggests"
    },
    {
      "package": "rmarkdown",
      "version": ">= 2.3",
      "role": "Suggests"
    }
  ],
  "_owner": "overton-group",
  "_selfowned": true,
  "_usedby": 0,
  "_updates": [
    {
      "week": "2025-34",
      "n": 2
    },
    {
      "week": "2025-35",
      "n": 2
    },
    {
      "week": "2025-37",
      "n": 3
    },
    {
      "week": "2026-06",
      "n": 3
    },
    {
      "week": "2026-08",
      "n": 10
    }
  ],
  "_tags": [
    {
      "name": "v1.4.0",
      "date": "2026-02-20"
    }
  ],
  "_topics": [
    "data-quality",
    "health-informatics",
    "semantic-enrichment"
  ],
  "_stars": 8,
  "_contributors": [
    {
      "user": "tommtoner",
      "count": 73,
      "uuid": 68654202
    },
    {
      "user": "kboakyeduah",
      "count": 20,
      "uuid": 93317047
    },
    {
      "user": "davisvaughan",
      "count": 2,
      "uuid": 19150088
    },
    {
      "user": "hadley",
      "count": 1,
      "uuid": 4196
    }
  ],
  "_userbio": {
    "uuid": 46562691,
    "type": "organization",
    "name": "overton-group"
  },
  "_downloads": {
    "count": 228,
    "source": "https://cranlogs.r-pkg.org/downloads/total/last-month/eHDPrep"
  },
  "_devurl": "https://github.com/overton-group/ehdprep",
  "_searchresults": 12,
  "_rbuild": "4.6.0",
  "_assets": [
    "extra/citation.cff",
    "extra/citation.html",
    "extra/citation.json",
    "extra/citation.txt",
    "extra/contents.json",
    "extra/eHDPrep.html",
    "extra/NEWS.html",
    "extra/NEWS.txt",
    "extra/readme.html",
    "extra/readme.md",
    "manual.pdf"
  ],
  "_homeurl": "https://github.com/overton-group/ehdprep",
  "_realowner": "overton-group",
  "_cranurl": true,
  "_releases": [
    {
      "version": "1.2.1",
      "date": "2022-09-07"
    },
    {
      "version": "1.3.2",
      "date": "2023-02-01"
    },
    {
      "version": "1.3.3",
      "date": "2023-06-05"
    },
    {
      "version": "1.3.4",
      "date": "2025-09-03"
    },
    {
      "version": "1.4.0",
      "date": "2026-02-20"
    }
  ],
  "_exports": [
    "apply_quality_ctrl",
    "assess_completeness",
    "assess_quality",
    "assume_var_classes",
    "compare_completeness",
    "compare_info_content",
    "compare_info_content_plt",
    "completeness_heatmap",
    "count_compare",
    "edge_tbl_to_graph",
    "encode_as_num_mat",
    "encode_binary_cats",
    "encode_cats",
    "encode_genotypes",
    "encode_ordinals",
    "entropy",
    "export_dataset",
    "extract_freetext",
    "identify_inconsistency",
    "import_dataset",
    "import_var_classes",
    "information_content_contin",
    "information_content_discrete",
    "join_vars_to_ontol",
    "merge_cols",
    "metavariable_agg",
    "metavariable_info",
    "metavariable_variable_descendants",
    "mi_content_discrete",
    "mod_track",
    "node_IC_zhou",
    "nums_to_NA",
    "ordinal_label_levels",
    "plot_completeness",
    "report_var_mods",
    "review_quality_ctrl",
    "row_completeness",
    "semantic_enrichment",
    "skipgram_append",
    "skipgram_freq",
    "skipgram_identify",
    "strings_to_NA",
    "validate_consistency_tbl",
    "variable_completeness",
    "variable_entropy",
    "zero_entropy_variables"
  ],
  "_datasets": [
    {
      "name": "example_data",
      "title": "Example data for eHDPrep",
      "object": "example_data",
      "class": [
        "tbl_df",
        "tbl",
        "data.frame"
      ],
      "fields": [
        "patient_id",
        "tumoursize",
        "t_stage",
        "n_stage",
        "diabetes",
        "diabetes_type",
        "hypertension",
        "rural_urban",
        "marital_status",
        "SNP_a",
        "SNP_b",
        "free_text"
      ],
      "rows": 1000,
      "table": true,
      "tojson": true
    },
    {
      "name": "example_edge_tbl",
      "title": "Example ontology as an edge table for semantic enrichment",
      "object": "example_edge_tbl",
      "class": [
        "tbl_df",
        "tbl",
        "data.frame"
      ],
      "fields": [
        "from",
        "to"
      ],
      "rows": 25,
      "table": true,
      "tojson": true
    },
    {
      "name": "example_mapping_file",
      "title": "Example mapping file for semantic enrichment",
      "object": "example_mapping_file",
      "class": [
        "tbl_df",
        "tbl",
        "data.frame"
      ],
      "fields": [
        "variable",
        "onto_entity"
      ],
      "rows": 12,
      "table": true,
      "tojson": true
    },
    {
      "name": "example_ontology",
      "title": "Example ontology as a network graph for semantic enrichment",
      "object": "example_ontology",
      "class": [
        "tbl_graph",
        "igraph"
      ],
      "fields": [],
      "table": false,
      "tojson": false
    }
  ],
  "_help": [
    {
      "page": "apply_quality_ctrl",
      "title": "Apply quality control measures to a dataset",
      "concept": [
        "high level functionality"
      ],
      "topics": [
        "apply_quality_ctrl"
      ]
    },
    {
      "page": "assess_completeness",
      "title": "Assess completeness of a dataset",
      "concept": [
        "measures of completeness"
      ],
      "topics": [
        "assess_completeness"
      ]
    },
    {
      "page": "assess_quality",
      "title": "Assess quality of a dataset",
      "concept": [
        "high level functionality"
      ],
      "topics": [
        "assess_quality"
      ]
    },
    {
      "page": "assume_var_classes",
      "title": "Assume variable classes in data",
      "topics": [
        "assume_var_classes"
      ]
    },
    {
      "page": "cellspec_lgl",
      "title": "Kable logical data highlighting",
      "topics": [
        "cellspec_lgl"
      ]
    },
    {
      "page": "compare_completeness",
      "title": "Compare Completeness between Datasets",
      "concept": [
        "measures of completeness"
      ],
      "topics": [
        "compare_completeness"
      ]
    },
    {
      "page": "compare_info_content",
      "title": "Information Content Comparison Table",
      "topics": [
        "compare_info_content"
      ]
    },
    {
      "page": "compare_info_content_plt",
      "title": "Information Content Comparison Plot",
      "topics": [
        "compare_info_content_plt"
      ]
    },
    {
      "page": "completeness_heatmap",
      "title": "Completeness Heatmap",
      "concept": [
        "measures of completeness"
      ],
      "topics": [
        "completeness_heatmap"
      ]
    },
    {
      "page": "count_compare",
      "title": "Compare unique values before and after data modification",
      "topics": [
        "count_compare"
      ]
    },
    {
      "page": "discrete.mi",
      "title": "Calculate mutual information of a matrix of discrete values",
      "topics": [
        "discrete.mi"
      ]
    },
    {
      "page": "distant_neg_val",
      "title": "Find highly distant value for data frame",
      "topics": [
        "distant_neg_val"
      ]
    },
    {
      "page": "edge_tbl_to_graph",
      "title": "Convert edge table to tidygraph graph",
      "topics": [
        "edge_tbl_to_graph"
      ]
    },
    {
      "page": "encode_as_num_mat",
      "title": "Convert data frame to numeric matrix",
      "topics": [
        "encode_as_num_mat"
      ]
    },
    {
      "page": "encode_bin_cat_vec",
      "title": "Encode a categorical vector with binary categories",
      "topics": [
        "encode_bin_cat_vec"
      ]
    },
    {
      "page": "encode_binary_cats",
      "title": "Encode categorical variables as binary factors",
      "topics": [
        "encode_binary_cats"
      ]
    },
    {
      "page": "encode_cats",
      "title": "Encode categorical variables using one-hot encoding.",
      "topics": [
        "encode_cats"
      ]
    },
    {
      "page": "encode_genotype_vec",
      "title": "Encode a genotype/SNP vector",
      "topics": [
        "encode_genotype_vec"
      ]
    },
    {
      "page": "encode_genotypes",
      "title": "Encode genotype/SNP variables in data frame",
      "topics": [
        "encode_genotypes"
      ]
    },
    {
      "page": "encode_ordinals",
      "title": "Encode ordinal variables",
      "topics": [
        "encode_ordinals"
      ]
    },
    {
      "page": "entropy",
      "title": "Calculate Entropy of a Vector",
      "topics": [
        "entropy"
      ]
    },
    {
      "page": "exact.kde",
      "title": "Exact kernel density estimation",
      "topics": [
        "exact.kde"
      ]
    },
    {
      "page": "example_data",
      "title": "Example data for eHDPrep",
      "topics": [
        "example_data"
      ]
    },
    {
      "page": "example_edge_tbl",
      "title": "Example ontology as an edge table for semantic enrichment",
      "topics": [
        "example_edge_tbl"
      ]
    },
    {
      "page": "example_mapping_file",
      "title": "Example mapping file for semantic enrichment",
      "topics": [
        "example_mapping_file"
      ]
    },
    {
      "page": "example_ontology",
      "title": "Example ontology as a network graph for semantic enrichment",
      "topics": [
        "example_ontology"
      ]
    },
    {
      "page": "export_dataset",
      "title": "Export data to delimited file",
      "concept": [
        "import to/export from 'R' functions"
      ],
      "topics": [
        "export_dataset"
      ]
    },
    {
      "page": "extract_freetext",
      "title": "Extract information from free text",
      "concept": [
        "free text functions"
      ],
      "topics": [
        "extract_freetext"
      ]
    },
    {
      "page": "identify_inconsistency",
      "title": "Identify inconsistencies in a dataset",
      "concept": [
        "internal consistency functions"
      ],
      "topics": [
        "identify_inconsistency"
      ]
    },
    {
      "page": "import_dataset",
      "title": "Import data into 'R'",
      "concept": [
        "import to/export from 'R' functions"
      ],
      "topics": [
        "import_dataset"
      ]
    },
    {
      "page": "import_var_classes",
      "title": "Import corrected variable classes",
      "topics": [
        "import_var_classes"
      ]
    },
    {
      "page": "information_content_contin",
      "title": "Calculate Information Content (Continuous Variable)",
      "topics": [
        "information_content_contin"
      ]
    },
    {
      "page": "information_content_discrete",
      "title": "Calculate Information Content (Discrete Variable)",
      "topics": [
        "information_content_discrete"
      ]
    },
    {
      "page": "join_vars_to_ontol",
      "title": "Join Mapping Table to Ontology Network Graph",
      "concept": [
        "semantic enrichment functions"
      ],
      "topics": [
        "join_vars_to_ontol"
      ]
    },
    {
      "page": "max_catchNAs",
      "title": "Find maximum of vector safely",
      "topics": [
        "max_catchNAs"
      ]
    },
    {
      "page": "mean_catchNAs",
      "title": "Find mean of vector safely",
      "topics": [
        "mean_catchNAs"
      ]
    },
    {
      "page": "merge_cols",
      "title": "Merge columns in data frame",
      "topics": [
        "merge_cols"
      ]
    },
    {
      "page": "metavariable_agg",
      "title": "Aggregate Data by Metavariable",
      "concept": [
        "semantic enrichment functions"
      ],
      "topics": [
        "metavariable_agg"
      ]
    },
    {
      "page": "metavariable_info",
      "title": "Compute Metavariable Information",
      "concept": [
        "semantic enrichment functions"
      ],
      "topics": [
        "metavariable_info"
      ]
    },
    {
      "page": "metavariable_variable_descendants",
      "title": "Extract metavariables' descendant variables",
      "concept": [
        "semantic enrichment functions"
      ],
      "topics": [
        "metavariable_variable_descendants"
      ]
    },
    {
      "page": "mi_content_discrete",
      "title": "Calculate Mutual Information Content",
      "topics": [
        "mi_content_discrete"
      ]
    },
    {
      "page": "min_catchNAs",
      "title": "Find minimum of vector safely",
      "topics": [
        "min_catchNAs"
      ]
    },
    {
      "page": "mod_track",
      "title": "Data modification tracking",
      "topics": [
        "mod_track"
      ]
    },
    {
      "page": "node_IC_zhou",
      "title": "Calculate Node Information Content (Zhou et al 2008 method)",
      "topics": [
        "node_IC_zhou"
      ]
    },
    {
      "page": "normalize",
      "title": "Min max normalization",
      "topics": [
        "normalize"
      ]
    },
    {
      "page": "nums_to_NA",
      "title": "Replace numeric values in numeric columns with NA",
      "topics": [
        "nums_to_NA"
      ]
    },
    {
      "page": "onehot_vec",
      "title": "One hot encode a vector",
      "topics": [
        "onehot_vec"
      ]
    },
    {
      "page": "ordinal_label_levels",
      "title": "Extract labels and levels of ordinal variables in a dataset",
      "topics": [
        "ordinal_label_levels"
      ]
    },
    {
      "page": "plot_completeness",
      "title": "Plot Completeness of a Dataset",
      "concept": [
        "measures of completeness"
      ],
      "topics": [
        "plot_completeness"
      ]
    },
    {
      "page": "prod_catchNAs",
      "title": "Find product of vector safely",
      "topics": [
        "prod_catchNAs"
      ]
    },
    {
      "page": "report_var_mods",
      "title": "Track changes to dataset variables",
      "topics": [
        "report_var_mods"
      ]
    },
    {
      "page": "review_quality_ctrl",
      "title": "Review Quality Control",
      "concept": [
        "high level functionality"
      ],
      "topics": [
        "review_quality_ctrl"
      ]
    },
    {
      "page": "row_completeness",
      "title": "Calculate Row Completeness in a Data Frame",
      "concept": [
        "measures of completeness"
      ],
      "topics": [
        "row_completeness"
      ]
    },
    {
      "page": "semantic_enrichment",
      "title": "Semantic enrichment",
      "concept": [
        "high level functionality"
      ],
      "topics": [
        "semantic_enrichment"
      ]
    },
    {
      "page": "skipgram_append",
      "title": "Append Skipgram Presence Variables to Dataset",
      "concept": [
        "free text functions"
      ],
      "topics": [
        "skipgram_append"
      ]
    },
    {
      "page": "skipgram_freq",
      "title": "Report Skipgram Frequency",
      "concept": [
        "free text functions"
      ],
      "topics": [
        "skipgram_freq"
      ]
    },
    {
      "page": "skipgram_identify",
      "title": "Identify Neighbouring Words (Skipgrams) in a free-text vector",
      "concept": [
        "free text functions"
      ],
      "topics": [
        "skipgram_identify"
      ]
    },
    {
      "page": "strings_to_NA",
      "title": "Replace values in non-numeric columns with NA",
      "topics": [
        "strings_to_NA"
      ]
    },
    {
      "page": "sum_catchNAs",
      "title": "Sum vector safely for semantic enrichment",
      "topics": [
        "sum_catchNAs"
      ]
    },
    {
      "page": "validate_consistency_tbl",
      "title": "Validate internal consistency table",
      "concept": [
        "internal consistency functions"
      ],
      "topics": [
        "validate_consistency_tbl"
      ]
    },
    {
      "page": "validate_mapping_tbl",
      "title": "Validate mapping table for semantic enrichment",
      "topics": [
        "validate_mapping_tbl"
      ]
    },
    {
      "page": "validate_ontol_nw",
      "title": "Validate ontology network for semantic enrichment",
      "topics": [
        "validate_ontol_nw"
      ]
    },
    {
      "page": "variable_completeness",
      "title": "Calculate Variable Completeness in a Data Frame",
      "concept": [
        "measures of completeness"
      ],
      "topics": [
        "variable_completeness"
      ]
    },
    {
      "page": "variable_entropy",
      "title": "Calculate Entropy of Each Variable in Data Frame",
      "topics": [
        "variable_entropy"
      ]
    },
    {
      "page": "variable.bw.kde",
      "title": "Variable bandwidth Kernel Density Estimation",
      "topics": [
        "variable.bw.kde"
      ]
    },
    {
      "page": "warn_missing_dots",
      "title": "Missing dots warning",
      "topics": [
        "warn_missing_dots"
      ]
    },
    {
      "page": "zero_entropy_variables",
      "title": "Identify variables with zero entropy",
      "topics": [
        "zero_entropy_variables"
      ]
    }
  ],
  "_readme": "https://github.com/overton-group/ehdprep/raw/HEAD/README.md",
  "_rundeps": [
    "base64enc",
    "BH",
    "bit",
    "bit64",
    "bslib",
    "cachem",
    "cellranger",
    "cli",
    "clipr",
    "cpp11",
    "crayon",
    "digest",
    "dplyr",
    "evaluate",
    "farver",
    "fastmap",
    "fastmatch",
    "fontawesome",
    "forcats",
    "fs",
    "generics",
    "ggplot2",
    "glue",
    "gtable",
    "highr",
    "hms",
    "htmltools",
    "igraph",
    "isoband",
    "ISOcodes",
    "jquerylib",
    "jsonlite",
    "kableExtra",
    "knitr",
    "labeling",
    "lattice",
    "lifecycle",
    "magrittr",
    "Matrix",
    "memoise",
    "mime",
    "NLP",
    "pheatmap",
    "pillar",
    "pkgconfig",
    "prettyunits",
    "progress",
    "purrr",
    "quanteda",
    "R6",
    "rappdirs",
    "RColorBrewer",
    "Rcpp",
    "readr",
    "readxl",
    "rematch",
    "rlang",
    "rmarkdown",
    "rstudioapi",
    "S7",
    "sass",
    "scales",
    "slam",
    "SnowballC",
    "stopwords",
    "stringi",
    "stringr",
    "svglite",
    "systemfonts",
    "textshaping",
    "tibble",
    "tidygraph",
    "tidyr",
    "tidyselect",
    "tinytex",
    "tm",
    "tzdb",
    "utf8",
    "vctrs",
    "viridisLite",
    "vroom",
    "withr",
    "xfun",
    "xml2",
    "yaml"
  ],
  "_vignettes": [
    {
      "source": "Introduction_to_eHDPrep.Rmd",
      "filename": "Introduction_to_eHDPrep.pdf",
      "title": "'eHDPrep': an 'R' package for Electronic Health Data Quality Control and Semantic Enrichment",
      "author": "Tom Toner, Ian Overton",
      "engine": "knitr::rmarkdown",
      "headings": [
        "Quick Start",
        "Introduction",
        "Data",
        "Quality control",
        "High level functions",
        "Data Import",
        "Assess input data quality",
        "Apply quality control",
        "Review of all quality control",
        "Low level functions",
        "Measure completeness",
        "show_rownames is passed to pheatmap() through the ... parameter",
        "Merge variables",
        "Encoding categorical data",
        "Encoding ordinal data",
        "Encoding genotype (SNP) data",
        "Extract information from free text variables",
        "Review quality control",
        "value level modifications showing which exact missingness values",
        "were removed",
        "plot value level modifications",
        "Semantic enrichment",
        "Required inputs",
        "Example data",
        "High level functionality",
        "Low level functionality",
        "Convert edge table to ontology",
        "Join ontology and data variable names",
        "Compute meta-variable information",
        "annotations are also considered a set. This isn't helpful for this visualisation",
        "Therefore, the sets of non-meta-variables are removed below",
        "Generate semantic aggregations",
        "References"
      ],
      "created": "2022-07-26 10:54:44",
      "modified": "2023-06-01 15:58:03",
      "commits": 10
    }
  ],
  "_score": 5.857332496431268,
  "_indexed": true,
  "_nocasepkg": "ehdprep",
  "_universes": [
    "overton-group",
    "ianoverton"
  ],
  "_binaries": [
    {
      "r": "4.7.0",
      "os": "linux",
      "version": "1.4.0",
      "date": "2026-05-21T08:50:09.000Z",
      "distro": "noble",
      "commit": "887f3b12c191e883c394bbd0cb8c6ca90393c6bc",
      "fileid": "f4e08b8057fe57012bad7177b8c0fb0185a56df1b97523c1ab9289a53e15ad36",
      "status": "success",
      "check": "NOTE",
      "buildurl": "https://github.com/r-universe/overton-group/actions/runs/26215360756"
    },
    {
      "r": "4.6.0",
      "os": "linux",
      "version": "1.4.0",
      "date": "2026-05-21T08:50:07.000Z",
      "distro": "noble",
      "commit": "887f3b12c191e883c394bbd0cb8c6ca90393c6bc",
      "fileid": "c09471b06e2d50dd3784a9d5066a4e36ae7a52a947b15159e2601ee65dfbedc4",
      "status": "success",
      "check": "NOTE",
      "buildurl": "https://github.com/r-universe/overton-group/actions/runs/26215360756"
    },
    {
      "r": "4.5.3",
      "os": "mac",
      "version": "1.4.0",
      "date": "2026-05-21T08:49:30.000Z",
      "commit": "887f3b12c191e883c394bbd0cb8c6ca90393c6bc",
      "fileid": "a9241e25851f8f966ae6702592a0952f39a7a0d2445a928f99bba04e6e80d0a7",
      "status": "success",
      "check": "NOTE",
      "buildurl": "https://github.com/r-universe/overton-group/actions/runs/26215360756"
    },
    {
      "r": "4.6.0",
      "os": "mac",
      "version": "1.4.0",
      "date": "2026-05-21T08:49:04.000Z",
      "commit": "887f3b12c191e883c394bbd0cb8c6ca90393c6bc",
      "fileid": "e598f71ca98466bef422557176b9120ebfb8cc91cee3872a4dea421911221870",
      "status": "success",
      "check": "NOTE",
      "buildurl": "https://github.com/r-universe/overton-group/actions/runs/26215360756"
    },
    {
      "r": "4.6.0",
      "os": "wasm",
      "version": "1.4.0",
      "date": "2026-05-21T20:25:59.000Z",
      "commit": "887f3b12c191e883c394bbd0cb8c6ca90393c6bc",
      "fileid": "109c47862b3aa39b70ec123d6b8bc5e5ac76703a1f691df2cbfb37567bd0e1bb",
      "status": "success",
      "buildurl": "https://github.com/r-universe/overton-group/actions/runs/26215360756"
    },
    {
      "r": "4.7.0",
      "os": "win",
      "version": "1.4.0",
      "date": "2026-05-21T08:49:12.000Z",
      "commit": "887f3b12c191e883c394bbd0cb8c6ca90393c6bc",
      "fileid": "2f0202291a47805ba6e6ade88c03f16e0d66176170d7c7967c98cb5d27017793",
      "status": "success",
      "check": "NOTE",
      "buildurl": "https://github.com/r-universe/overton-group/actions/runs/26215360756"
    },
    {
      "r": "4.5.3",
      "os": "win",
      "version": "1.4.0",
      "date": "2026-05-21T08:48:40.000Z",
      "commit": "887f3b12c191e883c394bbd0cb8c6ca90393c6bc",
      "fileid": "11372450b83a3ce4be848c05f3e251538efc758367ae82a16eb11f93d04075f2",
      "status": "success",
      "check": "NOTE",
      "buildurl": "https://github.com/r-universe/overton-group/actions/runs/26215360756"
    },
    {
      "r": "4.6.0",
      "os": "win",
      "version": "1.4.0",
      "date": "2026-05-21T08:49:03.000Z",
      "commit": "887f3b12c191e883c394bbd0cb8c6ca90393c6bc",
      "fileid": "2003fc81cd1d4835e9a2606ed4d3aa6791383257340714d67985c66014de67df",
      "status": "success",
      "check": "NOTE",
      "buildurl": "https://github.com/r-universe/overton-group/actions/runs/26215360756"
    }
  ]
}