2021-05-15 21:36:22 +02:00
|
|
|
# ==================================================================== #
|
|
|
|
# TITLE #
|
|
|
|
# Antimicrobial Resistance (AMR) Data Analysis for R #
|
|
|
|
# #
|
|
|
|
# SOURCE #
|
|
|
|
# https://github.com/msberends/AMR #
|
|
|
|
# #
|
|
|
|
# LICENCE #
|
2021-12-23 18:56:28 +01:00
|
|
|
# (c) 2018-2022 Berends MS, Luz CF et al. #
|
2021-05-15 21:36:22 +02:00
|
|
|
# Developed at the University of Groningen, the Netherlands, in #
|
|
|
|
# collaboration with non-profit organisations Certe Medical #
|
2022-08-28 10:31:50 +02:00
|
|
|
# Diagnostics & Advice, and University Medical Center Groningen. #
|
2021-05-15 21:36:22 +02:00
|
|
|
# #
|
|
|
|
# This R package is free software; you can freely use and distribute #
|
|
|
|
# it for both personal and commercial purposes under the terms of the #
|
|
|
|
# GNU General Public License version 2.0 (GNU GPL-2), as published by #
|
|
|
|
# the Free Software Foundation. #
|
|
|
|
# We created this package for both routine data analysis and academic #
|
|
|
|
# research and it was publicly released in the hope that it will be #
|
|
|
|
# useful, but it comes WITHOUT ANY WARRANTY OR LIABILITY. #
|
|
|
|
# #
|
|
|
|
# Visit our website for the full manual and a complete tutorial about #
|
|
|
|
# how to conduct AMR data analysis: https://msberends.github.io/AMR/ #
|
|
|
|
# ==================================================================== #
|
|
|
|
|
2021-05-16 10:50:00 +02:00
|
|
|
# Run the package's own integrity check on the bundled data sets
# (check_dataset_integrity() lives in misc.R).
expect_true(AMR:::check_dataset_integrity())

# Identifier columns must be unique and carry their dedicated S3 class.
mo_codes <- microorganisms$mo
expect_identical(nrow(microorganisms), length(unique(mo_codes)))
expect_identical(class(mo_codes), c("mo", "character"))

ab_codes <- antibiotics$ab
expect_identical(nrow(antibiotics), length(unique(ab_codes)))

# Any ATC value that shows up as a duplicate must be NA, i.e. only missing
# ATC codes are allowed to repeat.
atc_codes <- antibiotics$atc
expect_true(all(is.na(atc_codes[duplicated(atc_codes)])))

expect_identical(class(ab_codes), c("ab", "character"))
|
|
|
|
|
2021-06-23 10:03:17 +02:00
|
|
|
|
2021-05-15 21:36:22 +02:00
|
|
|
# Referential integrity between the data sets: every code used in a
# secondary table has to exist in its reference table.
known_mo <- microorganisms$mo
known_ab <- antibiotics$ab

expect_true(all(microorganisms.codes$mo %in% known_mo))
expect_true(all(example_isolates$mo %in% known_mo))
expect_true(all(rsi_translation$mo %in% known_mo))
expect_true(all(rsi_translation$ab %in% known_ab))
expect_true(all(intrinsic_resistant$mo %in% known_mo))
expect_true(all(intrinsic_resistant$ab %in% known_ab))

# The code translation table may not contain missing values in either column.
expect_false(any(is.na(microorganisms.codes$code)))
expect_false(any(is.na(microorganisms.codes$mo)))

# Dosage entries must point to an existing antibiotic, by code and by name.
expect_true(all(dosage$ab %in% known_ab))
expect_true(all(dosage$name %in% antibiotics$name))
|
2021-12-13 11:57:34 +01:00
|
|
|
# Every breakpoint must be coercible by the converter that matches its
# method: as.mic() for "MIC" rows, as.disk() for "DISK" rows. A value that
# comes back as NA fails the check.
mic_rows <- which(rsi_translation$method == "MIC")
disk_rows <- which(rsi_translation$method == "DISK")

expect_false(any(is.na(as.mic(rsi_translation[mic_rows, "breakpoint_S", drop = TRUE]))))
expect_false(any(is.na(as.mic(rsi_translation[mic_rows, "breakpoint_R", drop = TRUE]))))
expect_false(any(is.na(as.disk(rsi_translation[disk_rows, "breakpoint_S", drop = TRUE]))))
expect_false(any(is.na(as.disk(rsi_translation[disk_rows, "breakpoint_R", drop = TRUE]))))
|
2021-05-15 21:36:22 +02:00
|
|
|
|
|
|
|
# Round trip: coercing each official antibiotic name with as.ab() has to
# give back exactly the AB code stored on the same row.
codes_from_names <- as.ab(antibiotics$name)
expect_identical(codes_from_names, antibiotics$ab)
|
|
|
|
|
2022-08-28 19:34:04 +02:00
|
|
|
# Only run when the 'tibble' package is available (it is not loaded here).
if (AMR:::pkg_is_available("tibble", also_load = FALSE)) {
  # CRAN policy: the bundled data sets may not contain non-ASCII characters
  # such as diacritics. Each data set must therefore be identical to its
  # ASCII-converted version.
  amr_namespace <- asNamespace("AMR")
  datasets <- data(package = "AMR", envir = amr_namespace)$results[, "Item", drop = TRUE]
  for (idx in seq_along(datasets)) {
    dataset <- get(datasets[idx], envir = amr_namespace)
    # 'info' carries the data set name so a failure can be traced back
    expect_identical(
      AMR:::dataset_UTF8_to_ASCII(dataset),
      dataset,
      info = datasets[idx]
    )
  }
}
|
|
|
|
|
|
|
|
# Structural checks on the internal microorganism lookup tables.
df <- AMR:::MO_lookup

# Row counts must strictly increase from prevalence group 1 to 2 to 3.
n_prevalence_1 <- nrow(df[which(df$prevalence == 1), , drop = FALSE])
n_prevalence_2 <- nrow(df[which(df$prevalence == 2), , drop = FALSE])
n_prevalence_3 <- nrow(df[which(df$prevalence == 3), , drop = FALSE])
expect_true(n_prevalence_1 < n_prevalence_2)
expect_true(n_prevalence_2 < n_prevalence_3)

# Columns that must be present in MO_lookup.
mo_lookup_columns <- c(
  "mo", "fullname",
  "kingdom", "phylum", "class", "order", "family", "genus", "species", "subspecies",
  "rank", "ref", "species_id", "source", "prevalence", "snomed",
  "kingdom_index", "fullname_lower", "g_species"
)
expect_true(all(mo_lookup_columns %in% colnames(df)))

# Columns that must be present in MO.old_lookup.
mo_old_lookup_columns <- c(
  "fullname", "fullname_new", "ref", "prevalence",
  "fullname_lower", "g_species"
)
expect_true(all(mo_old_lookup_columns %in% colnames(AMR:::MO.old_lookup)))
|
2021-05-15 21:36:22 +02:00
|
|
|
|
|
|
|
# The internal MO_CONS vector must carry the 'mo' class.
expect_inherits(AMR:::MO_CONS, "mo")

# catalogue_of_life_version() must return a classed list ...
expected_version_class <- c("catalogue_of_life_version", "list")
expect_identical(class(catalogue_of_life_version()), expected_version_class)

# ... and printing it must write something to stdout.
expect_stdout(print(catalogue_of_life_version()))
|
|
|
|
|
2022-08-28 10:31:50 +02:00
|
|
|
# Select every Staphylococcus row that has a species other than "" or
# "aureus" and whose code appears in neither AMR:::MO_CONS nor AMR:::MO_COPS.
# The expectation below requires this selection to be empty.
uncategorised <- subset(
  microorganisms,
  genus == "Staphylococcus" &
    !species %in% c("", "aureus") &
    !mo %in% c(AMR:::MO_CONS, AMR:::MO_COPS)
)

# Build the diagnostic message with a scalar if/else. ifelse() shapes its
# result after the (length-1) test, so it would silently keep only the first
# offending species; collapsing the vector reports all of them at once.
uncategorised_info <- if (NROW(uncategorised) == 0) {
  "All staphylococcal species categorised as CoNS/CoPS."
} else {
  paste0(
    "Staphylococcal species not categorised as CoNS/CoPS: ",
    paste0(
      "S. ", uncategorised$species, " (", uncategorised$mo, ")",
      collapse = ", "
    )
  )
}

expect_true(NROW(uncategorised) == 0, info = uncategorised_info)
|
2021-12-14 22:39:23 +01:00
|
|
|
|
|
|
|
# THIS WILL CHECK NON-ASCII STRINGS IN ALL FILES:
|
|
|
|
|
|
|
|
# check_non_ascii <- function() {
|
|
|
|
# purrr::map_df(
|
|
|
|
# .id = "file",
|
|
|
|
# # list common text files
|
|
|
|
# .x = fs::dir_ls(
|
|
|
|
# recurse = TRUE,
|
|
|
|
# type = "file",
|
|
|
|
# # ignore images, compressed
|
|
|
|
# regexp = "\\.(png|ico|rda|ai|tar.gz|zip|xlsx|csv|pdf|psd)$",
|
|
|
|
# invert = TRUE
|
|
|
|
# ),
|
|
|
|
# .f = function(path) {
|
|
|
|
# x <- readLines(path, warn = FALSE)
|
|
|
|
# # from tools::showNonASCII()
|
|
|
|
# asc <- iconv(x, "latin1", "ASCII")
|
|
|
|
# ind <- is.na(asc) | asc != x
|
|
|
|
# # make data frame
|
|
|
|
# if (any(ind)) {
|
|
|
|
# tibble::tibble(
|
|
|
|
# row = which(ind),
|
|
|
|
# line = iconv(x[ind], "latin1", "ASCII", sub = "byte")
|
|
|
|
# )
|
|
|
|
# } else {
|
|
|
|
# tibble::tibble()
|
|
|
|
# }
|
|
|
|
# }
|
|
|
|
# )
|
|
|
|
# }
|
2022-08-28 10:31:50 +02:00
|
|
|
# x <- check_non_ascii() %>%
|
2021-12-14 22:39:23 +01:00
|
|
|
# filter(file %unlike% "^(data-raw|docs|git_)")
|