# ==================================================================== #
# TITLE                                                                #
# Antimicrobial Resistance (AMR) Analysis                              #
#                                                                      #
# SOURCE                                                               #
# https://gitlab.com/msberends/AMR                                     #
#                                                                      #
# LICENCE                                                              #
# (c) 2019 Berends MS (m.s.berends@umcg.nl), Luz CF (c.f.luz@umcg.nl)  #
#                                                                      #
# This R package is free software; you can freely use and distribute   #
# it for both personal and commercial purposes under the terms of the  #
# GNU General Public License version 2.0 (GNU GPL-2), as published by  #
# the Free Software Foundation.                                        #
#                                                                      #
# This R package was created for academic research and was publicly    #
# released in the hope that it will be useful, but it comes WITHOUT    #
# ANY WARRANTY OR LIABILITY.                                           #
# Visit our website for more info: https://msberends.gitlab.io/AMR.    #
# ==================================================================== #
#' Class 'mic'
#'
#' This transforms a vector to a new class \code{mic}, which is an ordered factor with valid MIC values as levels. Invalid MIC values will be translated as \code{NA} with a warning.
#' @rdname as.mic
#' @param x vector
#' @param na.rm a logical indicating whether missing values should be removed
#' @details Interpret MIC values as RSI values with \code{\link{as.rsi}}. It supports guidelines from EUCAST and CLSI.
#'
#' Before validation the input is cleaned: decimal commas become periods, spaces between an operator and the number are removed, \code{=>} and \code{=<} are rewritten to \code{>=} and \code{<=}, and redundant trailing zeroes are dropped (so \code{"1.0"} and \code{"1.00"} both become \code{"1"}).
#' @return Ordered factor with new class \code{mic}
#' @aliases MIC
#' @export
#' @importFrom dplyr %>%
#' @seealso \code{\link{as.rsi}}
#' @inheritSection AMR Read more on our website!
#' @examples
#' mic_data <- as.mic(c(">=32", "1.0", "1", "1.00", 8, "<=0.128", "8", "16", "16"))
#' is.mic(mic_data)
#'
#' # this can also coerce combined MIC/RSI values:
#' as.mic("<=0.002; S") # will return <=0.002
#'
#' # interpret MIC values
#' as.rsi(x = as.mic(2),
#'        mo = as.mo("S. pneumoniae"),
#'        ab = "AMX",
#'        guideline = "EUCAST")
#' as.rsi(x = as.mic(4),
#'        mo = as.mo("S. pneumoniae"),
#'        ab = "AMX",
#'        guideline = "EUCAST")
#'
#' plot(mic_data)
#' barplot(mic_data)
#' freq(mic_data)
as.mic <- function(x, na.rm = FALSE) {
  # objects that already are 'mic' are returned untouched
  if (is.mic(x)) {
    return(x)
  }

  x <- unlist(x)
  if (na.rm == TRUE) {
    x <- x[!is.na(x)]
  }
  # untouched copy of the input, used to detect and report invalid values
  x.bak <- x

  # comma to period
  x <- gsub(",", ".", x, fixed = TRUE)
  # remove space between operator and number ("<= 0.002" -> "<=0.002")
  x <- gsub("(<|=|>) +", "\\1", x)
  # transform => to >= and =< to <=
  x <- gsub("=>", ">=", x, fixed = TRUE)
  x <- gsub("=<", "<=", x, fixed = TRUE)
  # starting dots must start with 0
  x <- gsub("^[.]+", "0.", x)
  # <=0.2560.512 should be 0.512
  x <- gsub(".*[.].*[.]", "0.", x)
  # remove ending .0
  x <- gsub("[.]+0$", "", x)
  # remove all after last digit
  x <- gsub("[^0-9]+$", "", x)
  # keep only one zero before dot
  x <- gsub("0+[.]", "0.", x)
  # starting 00 is probably 0.0 if there's no dot yet
  x[!x %like% "[.]"] <- gsub("^00", "0.0", x[!x %like% "[.]"])
  # remove last zeroes
  x <- gsub("([.].?)0+$", "\\1", x)
  x <- gsub("(.*[.])0+$", "\\10", x)
  # remove ending .0 again
  x[x %like% "[.]"] <- gsub("0+$", "", x[x %like% "[.]"])
  # never end with a dot: the zero stripping above turns "1.00" into "1.",
  # which is not a valid level and would otherwise be reported as invalid
  x <- gsub("[.]$", "", x)
  # force to be character
  x <- as.character(x)
  # trim it
  x <- trimws(x)

  ## previously unempty values now empty - should return a warning later on
  x[x.bak != "" & x == ""] <- "invalid"

  # these are allowed MIC values and will become factor levels; every value is
  # combined with every operator, and t() + c() keep all operator variants of
  # one value next to each other so that the levels stay ordered by value
  ops <- c("<", "<=", "", ">=", ">")
  lvls <- c(
    # 0.001 - 0.009
    c(t(sapply(ops, function(x) paste0(x, "0.00", 1:9)))),
    # 0.01 - 0.099 plus common dilutions such as 0.0125 and 0.0625
    unique(c(t(sapply(ops, function(x) {
      paste0(x, sort(as.double(paste0("0.0", sort(c(1:99, 125, 128, 256, 512, 625))))))
    })))),
    # 0.1 - 0.99 plus 0.125, 0.128, 0.256 and 0.512
    unique(c(t(sapply(ops, function(x) {
      paste0(x, sort(as.double(paste0("0.", c(1:99, 125, 128, 256, 512)))))
    })))),
    # 1 - 9 and 1.5
    c(t(sapply(ops, function(x) paste0(x, sort(c(1:9, 1.5)))))),
    # the logical index selects the even numbers 10, 12, ..., 98
    c(t(sapply(ops, function(x) paste0(x, c(10:98)[9:98 %% 2 == TRUE])))),
    # 128 - 1024 (powers of two) and 160 - 960 (multiples of 80)
    c(t(sapply(ops, function(x) paste0(x, sort(c(2 ^ c(7:10), 80 * c(2:12)))))))
  )

  # count missing/empty values before and after validation; the difference is
  # the number of values that were rejected as invalid MICs
  na_before <- sum(is.na(x) | x == "")
  x[!x %in% lvls] <- NA
  na_after <- sum(is.na(x) | x == "")

  if (na_before != na_after) {
    list_missing <- sort(unique(x.bak[is.na(x) & !is.na(x.bak) & x.bak != ""]))
    list_missing <- paste0('"', list_missing, '"', collapse = ", ")
    warning(na_after - na_before, " results truncated (",
            round(((na_after - na_before) / length(x)) * 100),
            "%) that were invalid MICs: ",
            list_missing, call. = FALSE)
  }

  structure(.Data = factor(x, levels = lvls, ordered = TRUE),
            class = c("mic", "ordered", "factor"))
}
#' @rdname as.mic
#' @export
#' @importFrom dplyr %>%
is.mic <- function(x) {
  # inherits() instead of an exact comparison of the class vector: objects
  # that carry an additional class next to "mic" are still recognised, and
  # everything the exact comparison accepted is accepted here as well
  inherits(x, "mic")
}
#' @exportMethod as.double.mic
#' @export
#' @noRd
as.double.mic <- function(x, ...) {
  # strip every run of '<', '=' and '>' so only the numeric part is left
  bare_values <- gsub("(<|=|>)+", "", as.character(x))
  as.double(bare_values)
}
#' @exportMethod as.integer.mic
#' @export
#' @noRd
as.integer.mic <- function(x, ...) {
  # strip every run of '<', '=' and '>' so only the numeric part is left
  bare_values <- gsub("(<|=|>)+", "", as.character(x))
  as.integer(bare_values)
}
#' @exportMethod as.numeric.mic
#' @export
#' @noRd
as.numeric.mic <- function(x, ...) {
  # strip every run of '<', '=' and '>' so only the numeric part is left
  bare_values <- gsub("(<|=|>)+", "", as.character(x))
  as.numeric(bare_values)
}
#' @exportMethod droplevels.mic
#' @export
#' @noRd
# Drops unused levels like the factor method does, then restores the 'mic'
# class that the factor method does not keep.
#
# The default for `exclude` uses a scalar if/else: ifelse() cannot return
# NULL, so the previous ifelse(anyNA(levels(x)), NULL, NA) raised an error as
# soon as the levels contained NA.
droplevels.mic <- function(x, exclude = if (anyNA(levels(x))) NULL else NA, ...) {
  x <- droplevels.factor(x, exclude = exclude, ...)
  class(x) <- c("mic", "ordered", "factor")
  x
}
#' @exportMethod print.mic
#' @export
#' @importFrom dplyr %>% tibble group_by summarise pull
#' @noRd
print.mic <- function(x, ...) {
  # show the MIC values as plain, unquoted text below a class header
  values <- as.character(x)
  cat("Class 'mic'\n")
  print(values, quote = FALSE)
}
#' @exportMethod summary.mic
#' @export
#' @importFrom dplyr %>%
#' @noRd
summary.mic <- function(object, ...) {
  n_total <- length(object)
  # only non-missing values take part in the minimum and maximum
  present <- object[!is.na(object)]
  n_present <- length(present)
  in_order <- sort(present)
  # c() coerces the count of missing values to character as well
  c(
    "Class" = "mic",
    "<NA>" = n_total - n_present,
    "Min." = as.character(in_order[1]),
    "Max." = as.character(in_order[n_present])
  )
}
#' @exportMethod plot.mic
#' @export
#' @importFrom graphics barplot axis par
#' @noRd
plot.mic <- function(x,
                     main = paste("MIC values of", deparse(substitute(x))),
                     ylab = "Frequency",
                     xlab = "MIC value",
                     axes = FALSE,
                     ...) {
  # frequency of every MIC value that actually occurs in x
  counts <- table(droplevels.factor(x))
  barplot(counts,
          main = main,
          xlab = xlab,
          ylab = ylab,
          axes = axes,
          ...)
  # draw the y axis by hand, with one tick per whole count
  axis(2, seq(0, max(counts)))
}
#' @exportMethod barplot.mic
#' @export
#' @importFrom graphics barplot axis
#' @noRd
barplot.mic <- function(height,
                        main = paste("MIC values of", deparse(substitute(height))),
                        ylab = "Frequency",
                        xlab = "MIC value",
                        axes = FALSE,
                        ...) {
  # frequency of every MIC value that actually occurs in height
  counts <- table(droplevels.factor(height))
  barplot(counts,
          main = main,
          xlab = xlab,
          ylab = ylab,
          axes = axes,
          ...)
  # draw the y axis by hand, with one tick per whole count
  axis(2, seq(0, max(counts)))
}
#' @importFrom pillar type_sum
#' @export
type_sum.mic <- function(x) {
  # fixed type label for this class; x itself is not inspected
  mic_label <- "mic"
  mic_label
}
#' @importFrom pillar pillar_shaft
#' @export
pillar_shaft.mic <- function(x, ...) {
  # formatted values without padding; missing ones get pillar's NA styling
  missing_idx <- is.na(x)
  labels <- trimws(format(x))
  labels[missing_idx] <- pillar::style_na(NA)
  pillar::new_pillar_shaft_simple(labels, align = "right", min_width = 4)
}