AMR/R/disk.R

# ==================================================================== #
# TITLE                                                                #
# Antimicrobial Resistance (AMR) Data Analysis for R                   #
#                                                                      #
# SOURCE                                                               #
# https://github.com/msberends/AMR                                     #
#                                                                      #
# LICENCE                                                              #
# (c) 2018-2022 Berends MS, Luz CF et al.                              #
# Developed at the University of Groningen, the Netherlands, in        #
# collaboration with non-profit organisations Certe Medical            #
# Diagnostics & Advice, and University Medical Center Groningen.       # 
#                                                                      #
# This R package is free software; you can freely use and distribute   #
# it for both personal and commercial purposes under the terms of the  #
# GNU General Public License version 2.0 (GNU GPL-2), as published by  #
# the Free Software Foundation.                                        #
# We created this package for both routine data analysis and academic  #
# research and it was publicly released in the hope that it will be    #
# useful, but it comes WITHOUT ANY WARRANTY OR LIABILITY.              #
#                                                                      #
# Visit our website for the full manual and a complete tutorial about  #
# how to conduct AMR data analysis: https://msberends.github.io/AMR/   #
# ==================================================================== #

#' Transform Input to Disk Diffusion Diameters
#'
#' This transforms a vector to a new class [`disk`], which is a disk diffusion growth zone size (around an antibiotic disk) in millimetres between 6 and 50.
#' @inheritSection lifecycle Stable Lifecycle
#' @rdname as.disk
#' @param x vector
#' @param na.rm a [logical] indicating whether missing values should be removed
#' @details Interpret disk values as RSI values with [as.rsi()]. It supports guidelines from EUCAST and CLSI.
#' @return An [integer] with additional class [`disk`]
#' @aliases disk
#' @export
#' @seealso [as.rsi()]
#' @inheritSection AMR Read more on Our Website!
#' @examples
#' \donttest{
#' # transform existing disk zones to the `disk` class
#' df <- data.frame(microorganism = "E. coli",
#'                  AMP = 20,
#'                  CIP = 14,
#'                  GEN = 18,
#'                  TOB = 16)
#' df[, 2:5] <- lapply(df[, 2:5], as.disk)
#' # same with dplyr:
#' # df %>% mutate(across(AMP:TOB, as.disk))
#' 
#' # interpret disk values, see ?as.rsi
#' as.rsi(x = as.disk(18),
#'        mo = "Strep pneu",  # `mo` will be coerced with as.mo()
#'        ab = "ampicillin",  # and `ab` with as.ab()
#'        guideline = "EUCAST")
#'        
#' as.rsi(df)
#' }
as.disk <- function(x, na.rm = FALSE) {
  # Coerce `x` to an integer vector of class <disk>.
  #
  # x:     a disk, character, numeric or integer vector (missing values allowed)
  # na.rm: a single logical; when TRUE, missing values in the input are removed
  #
  # Values that cannot be read as a number, or that fall outside 6-50 after
  # rounding up, become NA and are reported in one warning.
  meet_criteria(x, allow_class = c("disk", "character", "numeric", "integer"), allow_NA = TRUE)
  meet_criteria(na.rm, allow_class = "logical", has_length = 1)

  if (is.disk(x)) {
    # Values of an existing <disk> need no cleaning, but `na.rm` still has to
    # be honoured (it used to be silently ignored for this kind of input).
    # The filtering is done on the bare integers.
    x <- as.integer(x)
    if (isTRUE(na.rm)) {
      x <- x[!is.na(x)]
    }
  } else {
    x <- unlist(x)
    if (isTRUE(na.rm)) {
      x <- x[!is.na(x)]
    }
    # keep the raw input so the warning below can list the rejected values
    x.bak <- x

    na_before <- sum(is.na(x))

    # heavily based on cleaner::clean_double():
    clean_double2 <- function(x, remove = "[^0-9.,-]", fixed = FALSE) {
      # treat a comma as decimal separator
      x <- gsub(",", ".", x)
      # remove ending dot/comma
      x <- gsub("[,.]$", "", x)
      # only keep last dot/comma: reverse the text, replace the first dot
      # (the last one of the original) by a reversed placeholder, reverse
      # back, drop all remaining dots and turn the placeholder into a dot
      reverse <- function(x) vapply(FUN.VALUE = character(1), lapply(strsplit(x, NULL), rev), paste, collapse = "")
      x <- sub("{{dot}}", ".",
               gsub(".", "",
                    reverse(sub(".", "}}tod{{",
                                reverse(x),
                                fixed = TRUE)),
                    fixed = TRUE),
               fixed = TRUE)
      x_clean <- gsub(remove, "", x, ignore.case = TRUE, fixed = fixed)
      # remove everything that is not a number or dot
      # NOTE(review): this also strips a minus sign that `remove` kept, so
      # "-20" is read as 20 - confirm that this is intended
      as.double(gsub("[^0-9.]+", "", x_clean))
    }

    # round up and make it an integer
    x <- as.integer(ceiling(clean_double2(x)))

    # disks can never be less than 6 mm (size of smallest disk) or more than 50 mm
    x[x < 6 | x > 50] <- NA_integer_
    na_after <- sum(is.na(x))

    if (na_before != na_after) {
      # report the distinct input values that were lost during conversion
      list_missing <- x.bak[is.na(x) & !is.na(x.bak)] %pm>%
        unique() %pm>%
        sort() %pm>%
        vector_and(quotes = TRUE)
      warning_(na_after - na_before, " results truncated (",
               round(((na_after - na_before) / length(x)) * 100),
               "%) that were invalid disk zones: ",
               list_missing, call = FALSE)
    }
  }
  set_clean_class(as.integer(x),
                  new_class = c("disk", "integer"))
}

all_valid_disks <- function(x) {
  # TRUE only when `x` has a supported class, holds at least one non-missing
  # value and every non-missing value survives conversion with as.disk().
  supported <- c("disk", "character", "numeric", "integer")
  if (!inherits(x, supported)) {
    return(FALSE)
  }
  # a failing conversion counts as "not valid", warnings are irrelevant here
  converted <- tryCatch(
    suppressWarnings(as.disk(x[!is.na(x)])),
    error = function(e) NA
  )
  !(any(is.na(converted)) || all(is.na(x)))
}

#' @rdname as.disk
#' @details `NA_disk_` is a missing value of the new `<disk>` class.
#' @export
NA_disk_ <- set_clean_class(
  NA_integer_, # integer missing value, identical to as.integer(NA_real_)
  new_class = c("disk", "integer")
)

#' @rdname as.disk
#' @export
is.disk <- function(x) {
  # TRUE when "disk" is one of the classes of `x`, FALSE otherwise
  inherits(x, what = "disk", which = FALSE)
}

# will be exported using s3_register() in R/zzz.R
pillar_shaft.disk <- function(x, ...) {
  # Build the right-aligned, 2-character-wide column used to show <disk>
  # values; missing values are replaced by the output of font_na(NA).
  is_missing <- is.na(x)
  labels <- trimws(format(x))
  labels[is_missing] <- font_na(NA)
  create_pillar_column(labels, align = "right", width = 2)
}

# will be exported using s3_register() in R/zzz.R
type_sum.disk <- function(x, ...) {
  # fixed type label for <disk> vectors; the arguments are not inspected
  c("disk")
}

#' @method print disk
#' @export
#' @noRd
print.disk <- function(x, ...) {
  # Print a header line followed by the plain integer values.
  # Returns `x` invisibly, as print methods are expected to do, so that the
  # result of print() is still the <disk> object and not a stripped integer.
  cat("Class <disk>\n")
  print(as.integer(x), quote = FALSE)
  invisible(x)
}

#' @method [ disk
#' @export
#' @noRd
"[.disk" <- function(x, ...) {
  y <- NextMethod()
  # Re-attach the class (and any other custom attribute) of `x` to the subset.
  # names, dim and dimnames are deliberately not copied: the default method
  # already set them for the selected elements, and copying the ones of the
  # full vector failed for shorter subsets and mislabelled reordered ones.
  restore <- attributes(x)
  restore <- restore[setdiff(names(restore), c("names", "dim", "dimnames"))]
  for (nm in names(restore)) {
    attr(y, nm) <- restore[[nm]]
  }
  y
}
#' @method [[ disk
#' @export
#' @noRd
"[[.disk" <- function(x, ...) {
  y <- NextMethod()
  # Re-attach the class (and any other custom attribute) of `x` to the
  # extracted element. names, dim and dimnames describe the full vector and
  # are not copied; copying them raised an error for named vectors.
  restore <- attributes(x)
  restore <- restore[setdiff(names(restore), c("names", "dim", "dimnames"))]
  for (nm in names(restore)) {
    attr(y, nm) <- restore[[nm]]
  }
  y
}
#' @method [<- disk
#' @export
#' @noRd
"[<-.disk" <- function(i, j, ..., value) {
  # coerce the replacement to <disk> before it is assigned
  value <- as.disk(value)
  y <- NextMethod()
  # Re-attach the class (and any other custom attribute) of the original
  # vector `i`. names, dim and dimnames are left as the default method set
  # them: copying the old names failed when the assignment extended a named
  # vector.
  restore <- attributes(i)
  restore <- restore[setdiff(names(restore), c("names", "dim", "dimnames"))]
  for (nm in names(restore)) {
    attr(y, nm) <- restore[[nm]]
  }
  y
}
#' @method [[<- disk
#' @export
#' @noRd
"[[<-.disk" <- function(i, j, ..., value) {
  # coerce the replacement to <disk> before it is assigned
  value <- as.disk(value)
  y <- NextMethod()
  # Re-attach the class (and any other custom attribute) of the original
  # vector `i`. names, dim and dimnames are left as the default method set
  # them: copying the old names failed when the assignment extended a named
  # vector.
  restore <- attributes(i)
  restore <- restore[setdiff(names(restore), c("names", "dim", "dimnames"))]
  for (nm in names(restore)) {
    attr(y, nm) <- restore[[nm]]
  }
  y
}
#' @method c disk
#' @export
#' @noRd
c.disk <- function(...) {
  # convert every argument to character, flatten them into one vector and
  # let as.disk() validate the combined result
  parts <- lapply(list(...), as.character)
  flattened <- unlist(parts)
  as.disk(flattened)
}

#' @method unique disk
#' @export
#' @noRd
unique.disk <- function(x, incomparables = FALSE, ...) {
  y <- NextMethod()
  # Re-attach the class (and any other custom attribute) of `x` to the
  # de-duplicated values. names, dim and dimnames belong to the full vector
  # and are not copied; copying them raised an error for named vectors that
  # contain duplicates.
  restore <- attributes(x)
  restore <- restore[setdiff(names(restore), c("names", "dim", "dimnames"))]
  for (nm in names(restore)) {
    attr(y, nm) <- restore[[nm]]
  }
  y
}

#' @method rep disk
#' @export
#' @noRd
rep.disk <- function(x, ...) {
  y <- NextMethod()
  # Re-attach the class (and any other custom attribute) of `x` to the
  # repeated values. names, dim and dimnames are not copied: the default
  # method already repeats the names, and copying the original ones raised an
  # error as soon as the length changed.
  restore <- attributes(x)
  restore <- restore[setdiff(names(restore), c("names", "dim", "dimnames"))]
  for (nm in names(restore)) {
    attr(y, nm) <- restore[[nm]]
  }
  y
}

# will be exported using s3_register() in R/zzz.R
get_skimmers.disk <- function(column) {
  # Returns the skimr function list for the skim type "disk".
  # Each statistic is given as a one-sided formula in which `.` stands for the
  # column values; `column` itself is not used in this body.
  skimr::sfl(
    skim_type = "disk",
    # values are converted with as.double() and missing values are left out
    min = ~min(as.double(.), na.rm = TRUE),
    max = ~max(as.double(.), na.rm = TRUE),
    median = ~stats::median(as.double(.), na.rm = TRUE),
    # number of distinct non-missing values
    n_unique = ~length(unique(stats::na.omit(.))),
    # inline histogram of the non-missing values
    hist = ~skimr::inline_hist(stats::na.omit(as.double(.)))
  )
}
new antibiotics 2019-05-10 16:44:59 +02:00			`# ==================================================================== #`
			`# TITLE #`
(v1.5.0.9014) only_rsi_columns, is.rsi.eligible improvement 2021-02-02 23:57:35 +01:00			`# Antimicrobial Resistance (AMR) Data Analysis for R #`
new antibiotics 2019-05-10 16:44:59 +02:00			`# #`
			`# SOURCE #`
(v1.2.0.9026) move to github 2020-07-08 14:48:06 +02:00			`# https://github.com/msberends/AMR #`
new antibiotics 2019-05-10 16:44:59 +02:00			`# #`
			`# LICENCE #`
(v1.8.0) prerelease 1.8.0 2021-12-23 18:56:28 +01:00			`# (c) 2018-2022 Berends MS, Luz CF et al. #`
(v1.4.0) matching score update 2020-10-08 11:16:03 +02:00			`# Developed at the University of Groningen, the Netherlands, in #`
			`# collaboration with non-profit organisations Certe Medical #`
			`# Diagnostics & Advice, and University Medical Center Groningen. #`
new antibiotics 2019-05-10 16:44:59 +02:00			`# #`
			`# This R package is free software; you can freely use and distribute #`
			`# it for both personal and commercial purposes under the terms of the #`
			`# GNU General Public License version 2.0 (GNU GPL-2), as published by #`
			`# the Free Software Foundation. #`
(v0.9.0.9008) Happy new year! Add lifecycles 2020-01-05 17:22:09 +01:00			`# We created this package for both routine data analysis and academic #`
			`# research and it was publicly released in the hope that it will be #`
			`# useful, but it comes WITHOUT ANY WARRANTY OR LIABILITY. #`
(v1.4.0) matching score update 2020-10-08 11:16:03 +02:00			`# #`
			`# Visit our website for the full manual and a complete tutorial about #`
(v1.5.0.9014) only_rsi_columns, is.rsi.eligible improvement 2021-02-02 23:57:35 +01:00			`# how to conduct AMR data analysis: https://msberends.github.io/AMR/ #`
new antibiotics 2019-05-10 16:44:59 +02:00			`# ==================================================================== #`

(v1.5.0.9006) major documentation update 2021-01-18 16:57:56 +01:00			`#' Transform Input to Disk Diffusion Diameters`
new antibiotics 2019-05-10 16:44:59 +02:00			`#'`
(v1.3.0.9014) as.mo() speed improvement 2020-09-03 12:31:48 +02:00			#' This transforms a vector to a new class [`disk`], which is a disk diffusion growth zone size (around an antibiotic disk) in millimetres between 6 and 50.
(v1.5.0.9006) major documentation update 2021-01-18 16:57:56 +01:00			`#' @inheritSection lifecycle Stable Lifecycle`
new antibiotics 2019-05-10 16:44:59 +02:00			`#' @rdname as.disk`
			`#' @param x vector`
(v1.6.0.9021) join functions update 2021-05-12 18:15:03 +02:00			`#' @param na.rm a [logical] indicating whether missing values should be removed`
(v0.8.0.9036) complete documentation rewrite 2019-11-28 22:32:17 +01:00			`#' @details Interpret disk values as RSI values with [as.rsi()]. It supports guidelines from EUCAST and CLSI.`
(v1.3.0.9022) mo_matching_score(), poorman update, as.rsi() fix 2020-09-18 16:05:53 +02:00			#' @return An [integer] with additional class [`disk`]
(v0.8.0.9017) keywords update 2019-11-06 14:43:23 +01:00			`#' @aliases disk`
new antibiotics 2019-05-10 16:44:59 +02:00			`#' @export`
(v0.8.0.9036) complete documentation rewrite 2019-11-28 22:32:17 +01:00			`#' @seealso [as.rsi()]`
(v1.5.0.9006) major documentation update 2021-01-18 16:57:56 +01:00			`#' @inheritSection AMR Read more on Our Website!`
new antibiotics 2019-05-10 16:44:59 +02:00			`#' @examples`
(v1.3.0.9035) mdro() for EUCAST 3.2, examples cleanup 2020-09-29 23:35:46 +02:00			`#' \donttest{`
(v0.9.0.9026) update documentation 2020-02-17 14:38:01 +01:00			#' # transform existing disk zones to the `disk` class
			`#' df <- data.frame(microorganism = "E. coli",`
			`#' AMP = 20,`
			`#' CIP = 14,`
			`#' GEN = 18,`
			`#' TOB = 16)`
(v1.3.0.9035) mdro() for EUCAST 3.2, examples cleanup 2020-09-29 23:35:46 +02:00			`#' df[, 2:5] <- lapply(df[, 2:5], as.disk)`
			`#' # same with dplyr:`
			`#' # df %>% mutate(across(AMP:TOB, as.disk))`
(v0.9.0.9026) update documentation 2020-02-17 14:38:01 +01:00			`#'`
			`#' # interpret disk values, see ?as.rsi`
			`#' as.rsi(x = as.disk(18),`
			#' mo = "Strep pneu", # `mo` will be coerced with as.mo()
			#' ab = "ampicillin", # and `ab` with as.ab()
new antibiotics 2019-05-10 16:44:59 +02:00			`#' guideline = "EUCAST")`
(v0.9.0.9026) update documentation 2020-02-17 14:38:01 +01:00			`#'`
			`#' as.rsi(df)`
(v1.1.0.9007) lose dependencies 2020-05-16 21:40:50 +02:00			`#' }`
new antibiotics 2019-05-10 16:44:59 +02:00			`as.disk <- function(x, na.rm = FALSE) {`
(v1.4.0.9001) is_gram_positive(), is_gram_negative(), parameter hardening 2020-10-19 17:09:19 +02:00			`meet_criteria(x, allow_class = c("disk", "character", "numeric", "integer"), allow_NA = TRUE)`
			`meet_criteria(na.rm, allow_class = "logical", has_length = 1)`

(v1.1.0.9012) lose dependencies 2020-05-19 12:08:49 +02:00			`if (!is.disk(x)) {`
(v1.5.0.9010) MDRO vignette update, get_episode for < day 2021-01-24 14:48:56 +01:00			`x <- unlist(x)`
new antibiotics 2019-05-10 16:44:59 +02:00			`if (na.rm == TRUE) {`
			`x <- x[!is.na(x)]`
			`}`
			`x.bak <- x`
(v1.2.0.9034) code cleaning 2020-07-13 09:17:24 +02:00
new antibiotics 2019-05-10 16:44:59 +02:00			`na_before <- length(x[is.na(x)])`
(v1.2.0.9034) code cleaning 2020-07-13 09:17:24 +02:00
(v1.4.0.9052) replaced all sapply's with type-safe vapply's 2020-12-28 22:24:33 +01:00			`# heavily based on cleaner::clean_double():`
(v1.3.0.9004) data sets, as.disk() improvement 2020-08-16 21:38:42 +02:00			`clean_double2 <- function(x, remove = "[^0-9.,-]", fixed = FALSE) {`
			`x <- gsub(",", ".", x)`
			`# remove ending dot/comma`
			`x <- gsub("[,.]$", "", x)`
			`# only keep last dot/comma`
(v1.4.0.9052) replaced all sapply's with type-safe vapply's 2020-12-28 22:24:33 +01:00			`reverse <- function(x) vapply(FUN.VALUE = character(1), lapply(strsplit(x, NULL), rev), paste, collapse = "")`
(v1.3.0.9004) data sets, as.disk() improvement 2020-08-16 21:38:42 +02:00			`x <- sub("{{dot}}", ".",`
			`gsub(".", "",`
			`reverse(sub(".", "}}tod{{",`
			`reverse(x),`
			`fixed = TRUE)),`
			`fixed = TRUE),`
			`fixed = TRUE)`
			`x_clean <- gsub(remove, "", x, ignore.case = TRUE, fixed = fixed)`
			`# remove everything that is not a number or dot`
(v1.6.0.9062) code consistency 2021-05-24 00:06:28 +02:00			`as.double(gsub("[^0-9.]+", "", x_clean))`
(v1.3.0.9004) data sets, as.disk() improvement 2020-08-16 21:38:42 +02:00			`}`

			`# round up and make it an integer`
			`x <- as.integer(ceiling(clean_double2(x)))`
(v1.2.0.9034) code cleaning 2020-07-13 09:17:24 +02:00
(v0.9.0.9005) as.mo for G. species 2019-12-21 10:56:06 +01:00			`# disks can never be less than 6 mm (size of smallest disk) or more than 50 mm`
			`x[x < 6 \| x > 50] <- NA_integer_`
new antibiotics 2019-05-10 16:44:59 +02:00			`na_after <- length(x[is.na(x)])`
(v1.2.0.9034) code cleaning 2020-07-13 09:17:24 +02:00
new antibiotics 2019-05-10 16:44:59 +02:00			`if (na_before != na_after) {`
(v1.3.0.9022) mo_matching_score(), poorman update, as.rsi() fix 2020-09-18 16:05:53 +02:00			`list_missing <- x.bak[is.na(x) & !is.na(x.bak)] %pm>%`
			`unique() %pm>%`
(v1.5.0.9015) unit test fix, grouped first isolates 2021-02-04 16:48:16 +01:00			`sort() %pm>%`
			`vector_and(quotes = TRUE)`
(v1.4.0.9015) bugfix 2020-11-10 16:35:56 +01:00			`warning_(na_after - na_before, " results truncated (",`
			`round(((na_after - na_before) / length(x)) * 100),`
			`"%) that were invalid disk zones: ",`
			`list_missing, call = FALSE)`
new antibiotics 2019-05-10 16:44:59 +02:00			`}`
			`}`
(v1.4.0.9021) more robust class setting 2020-11-16 16:57:55 +01:00			`set_clean_class(as.integer(x),`
			`new_class = c("disk", "integer"))`
new antibiotics 2019-05-10 16:44:59 +02:00			`}`

(v0.9.0.9029) add uti to as.rsi() 2020-02-20 13:19:23 +01:00			`all_valid_disks <- function(x) {`
(v1.4.0.9001) is_gram_positive(), is_gram_negative(), parameter hardening 2020-10-19 17:09:19 +02:00			`if (!inherits(x, c("disk", "character", "numeric", "integer"))) {`
			`return(FALSE)`
			`}`
(v1.4.0.9041) updates based on review 2020-12-17 16:22:25 +01:00			`x_disk <- tryCatch(suppressWarnings(as.disk(x[!is.na(x)])),`
			`error = function(e) NA)`
			`!any(is.na(x_disk)) && !all(is.na(x))`
(v0.9.0.9029) add uti to as.rsi() 2020-02-20 13:19:23 +01:00			`}`

(v1.7.1.9054) mdro() update - fixes #49, first_isolate() speedup 2021-11-28 23:01:26 +01:00			`#' @rdname as.disk`
			#' @details `NA_disk_` is a missing value of the new `<disk>` class.
			`#' @export`
			`NA_disk_ <- set_clean_class(as.integer(NA_real_),`
			`new_class = c("disk", "integer"))`

new antibiotics 2019-05-10 16:44:59 +02:00			`#' @rdname as.disk`
			`#' @export`
			`is.disk <- function(x) {`
(v0.9.0.9022) inheritance fix 2020-02-10 14:18:15 +01:00			`inherits(x, "disk")`
new antibiotics 2019-05-10 16:44:59 +02:00			`}`

(v1.3.0.9010) S3 extensions without dependencies 2020-08-28 21:55:47 +02:00			`# will be exported using s3_register() in R/zzz.R`
(v1.3.0.9007) tibble printing 2020-08-26 11:33:54 +02:00			`pillar_shaft.disk <- function(x, ...) {`
			`out <- trimws(format(x))`
(v1.3.0.9010) S3 extensions without dependencies 2020-08-28 21:55:47 +02:00			`out[is.na(x)] <- font_na(NA)`
			`create_pillar_column(out, align = "right", width = 2)`
(v1.3.0.9007) tibble printing 2020-08-26 11:33:54 +02:00			`}`

(v1.3.0.9010) S3 extensions without dependencies 2020-08-28 21:55:47 +02:00			`# will be exported using s3_register() in R/zzz.R`
(v1.3.0.9007) tibble printing 2020-08-26 11:33:54 +02:00			`type_sum.disk <- function(x, ...) {`
			`"disk"`
			`}`

v1.2.0 2020-05-28 16:48:55 +02:00			`#' @method print disk`
new antibiotics 2019-05-10 16:44:59 +02:00			`#' @export`
			`#' @noRd`
			`print.disk <- function(x, ...) {`
(v1.1.0.9020) updated taxonomy 2020-05-27 16:37:49 +02:00			`cat("Class <disk>\n")`
new antibiotics 2019-05-10 16:44:59 +02:00			`print(as.integer(x), quote = FALSE)`
			`}`
(v0.7.1.9036) preserve ab/mo classes in subsetting 2019-08-12 14:48:09 +02:00
v1.2.0 2020-05-28 16:48:55 +02:00			`#' @method [ disk`
(v1.0.1.9004) Support dplyr 1.0.0 2020-03-14 14:05:43 +01:00			`#' @export`
			`#' @noRd`
			`"[.disk" <- function(x, ...) {`
			`y <- NextMethod()`
			`attributes(y) <- attributes(x)`
			`y`
			`}`
v1.2.0 2020-05-28 16:48:55 +02:00			`#' @method [[ disk`
(v1.0.1.9004) Support dplyr 1.0.0 2020-03-14 14:05:43 +01:00			`#' @export`
			`#' @noRd`
			`"[[.disk" <- function(x, ...) {`
			`y <- NextMethod()`
			`attributes(y) <- attributes(x)`
			`y`
			`}`
v1.2.0 2020-05-28 16:48:55 +02:00			`#' @method [<- disk`
(v1.0.1.9004) Support dplyr 1.0.0 2020-03-14 14:05:43 +01:00			`#' @export`
			`#' @noRd`
			`"[<-.disk" <- function(i, j, ..., value) {`
(v1.0.1.9005) as.mo() improvements 2020-04-13 21:09:56 +02:00			`value <- as.disk(value)`
(v1.0.1.9004) Support dplyr 1.0.0 2020-03-14 14:05:43 +01:00			`y <- NextMethod()`
			`attributes(y) <- attributes(i)`
			`y`
			`}`
v1.2.0 2020-05-28 16:48:55 +02:00			`#' @method [[<- disk`
(v1.0.1.9004) Support dplyr 1.0.0 2020-03-14 14:05:43 +01:00			`#' @export`
			`#' @noRd`
			`"[[<-.disk" <- function(i, j, ..., value) {`
(v1.0.1.9005) as.mo() improvements 2020-04-13 21:09:56 +02:00			`value <- as.disk(value)`
(v1.0.1.9004) Support dplyr 1.0.0 2020-03-14 14:05:43 +01:00			`y <- NextMethod()`
			`attributes(y) <- attributes(i)`
			`y`
			`}`
v1.2.0 2020-05-28 16:48:55 +02:00			`#' @method c disk`
(v1.0.1.9004) Support dplyr 1.0.0 2020-03-14 14:05:43 +01:00			`#' @export`
			`#' @noRd`
(v1.6.0.9016) website update and c() fixes 2021-05-03 13:06:43 +02:00			`c.disk <- function(...) {`
			`as.disk(unlist(lapply(list(...), as.character)))`
(v1.0.1.9004) Support dplyr 1.0.0 2020-03-14 14:05:43 +01:00			`}`
(v1.3.0.9029) eucast rules fix, unique() 2020-09-25 14:44:50 +02:00
			`#' @method unique disk`
			`#' @export`
			`#' @noRd`
			`unique.disk <- function(x, incomparables = FALSE, ...) {`
			`y <- NextMethod()`
			`attributes(y) <- attributes(x)`
			`y`
			`}`
(v1.3.0.9032) support skimr 2020-09-28 01:08:55 +02:00
(v1.7.1.9014) rep() for S3 classes 2021-07-06 16:35:14 +02:00			`#' @method rep disk`
			`#' @export`
			`#' @noRd`
			`rep.disk <- function(x, ...) {`
			`y <- NextMethod()`
			`attributes(y) <- attributes(x)`
			`y`
			`}`

(v1.3.0.9032) support skimr 2020-09-28 01:08:55 +02:00			`# will be exported using s3_register() in R/zzz.R`
			`get_skimmers.disk <- function(column) {`
(v1.4.0.9041) updates based on review 2020-12-17 16:22:25 +01:00			`skimr::sfl(`
(v1.3.0.9032) support skimr 2020-09-28 01:08:55 +02:00			`skim_type = "disk",`
(v1.3.0.9033) skimr fix 2020-09-28 11:00:59 +02:00			`min = ~min(as.double(.), na.rm = TRUE),`
			`max = ~max(as.double(.), na.rm = TRUE),`
(v1.3.0.9032) support skimr 2020-09-28 01:08:55 +02:00			`median = ~stats::median(as.double(.), na.rm = TRUE),`
(v1.6.0.9020) fix for skimr in dplyr 1.0.6 2021-05-06 15:17:11 +02:00			`n_unique = ~length(unique(stats::na.omit(.))),`
(v1.4.0.9041) updates based on review 2020-12-17 16:22:25 +01:00			`hist = ~skimr::inline_hist(stats::na.omit(as.double(.)))`
(v1.3.0.9032) support skimr 2020-09-28 01:08:55 +02:00			`)`
			`}`