AMR/data-raw/internals.R

86 lines
4.7 KiB
R
Raw Normal View History

# ==================================================================== #
# TITLE #
# Antimicrobial Resistance (AMR) Analysis #
# #
# SOURCE #
# https://github.com/msberends/AMR #
# #
# LICENCE #
# (c) 2018-2020 Berends MS, Luz CF et al. #
# #
# This R package is free software; you can freely use and distribute #
# it for both personal and commercial purposes under the terms of the #
# GNU General Public License version 2.0 (GNU GPL-2), as published by #
# the Free Software Foundation. #
# #
# We created this package for both routine data analysis and academic #
# research and it was publicly released in the hope that it will be #
# useful, but it comes WITHOUT ANY WARRANTY OR LIABILITY. #
# Visit our website for more info: https://msberends.github.io/AMR. #
# ==================================================================== #
# Run this file to update the package using: -------------------------------
# source("data-raw/internals.R")
# --------------------------------------------------------------------------
# See 'data-raw/eucast_rules.tsv' for the EUCAST reference file
2019-11-15 15:25:03 +01:00
eucast_rules_file <- utils::read.delim(file = "data-raw/eucast_rules.tsv",
skip = 10,
2019-06-01 20:40:49 +02:00
sep = "\t",
stringsAsFactors = FALSE,
header = TRUE,
strip.white = TRUE,
2019-11-15 15:25:03 +01:00
na = c(NA, "", NULL))
2020-02-17 14:38:01 +01:00
# take the order of the reference.rule_group column in the original data file
2019-11-15 15:25:03 +01:00
eucast_rules_file$reference.rule_group <- factor(eucast_rules_file$reference.rule_group,
levels = unique(eucast_rules_file$reference.rule_group),
ordered = TRUE)
eucast_rules_file <- dplyr::arrange(eucast_rules_file,
2019-06-01 20:40:49 +02:00
reference.rule_group,
reference.rule)
eucast_rules_file$reference.rule_group <- as.character(eucast_rules_file$reference.rule_group)
# Translations ----
translations_file <- utils::read.delim(file = "data-raw/translations.tsv",
2019-06-01 20:40:49 +02:00
sep = "\t",
stringsAsFactors = FALSE,
header = TRUE,
blank.lines.skip = TRUE,
fill = TRUE,
strip.white = TRUE,
encoding = "UTF-8",
fileEncoding = "UTF-8",
na.strings = c(NA, "", NULL),
allowEscapes = TRUE, # else "\\1" will be imported as "\\\\1"
quote = "")
2019-06-01 20:40:49 +02:00
2019-09-18 15:46:09 +02:00
# Old microorganism codes -------------------------------------------------
microorganisms.translation <- readRDS("data-raw/microorganisms.translation.rds")
2019-06-01 20:40:49 +02:00
# Export to package as internal data ----
2019-09-18 15:46:09 +02:00
usethis::use_data(eucast_rules_file, translations_file, microorganisms.translation,
2019-06-01 20:40:49 +02:00
internal = TRUE,
overwrite = TRUE,
version = 2)
# Remove from global environment ----
rm(eucast_rules_file)
rm(translations_file)
2019-09-18 15:46:09 +02:00
rm(microorganisms.translation)
2020-02-01 15:09:36 +01:00
# Save to raw data to repository ----
usethis::ui_done(paste0("Saving raw data to {usethis::ui_value('/data-raw/')}"))
devtools::load_all(quiet = TRUE)
2020-02-14 19:54:13 +01:00
# give official names to ABs and MOs
2020-05-16 13:05:47 +02:00
write.table(dplyr::mutate(rsi_translation, ab = ab_name(ab), mo = mo_name(mo)),
2020-02-01 15:09:36 +01:00
"data-raw/rsi_translation.txt", sep = "\t", na = "", row.names = FALSE)
2020-05-16 13:05:47 +02:00
write.table(dplyr::mutate_if(microorganisms, ~!is.numeric(.), as.character),
2020-02-01 15:09:36 +01:00
"data-raw/microorganisms.txt", sep = "\t", na = "", row.names = FALSE)
2020-05-16 13:05:47 +02:00
write.table(dplyr::mutate_if(antibiotics, ~!is.numeric(.), as.character),
2020-02-01 15:09:36 +01:00
"data-raw/antibiotics.txt", sep = "\t", na = "", row.names = FALSE)
2020-05-16 13:05:47 +02:00
write.table(dplyr::mutate_all(antivirals, as.character),
2020-02-01 15:09:36 +01:00
"data-raw/antivirals.txt", sep = "\t", na = "", row.names = FALSE)
write.table(intrinsic_resistant,
"data-raw/intrinsic_resistant.txt", sep = "\t", na = "", row.names = FALSE)