2018-08-22 00:02:26 +02:00
# ==================================================================== #
# TITLE #
# Antimicrobial Resistance (AMR) Analysis #
# #
# AUTHORS #
# Berends MS (m.s.berends@umcg.nl), Luz CF (c.f.luz@umcg.nl) #
# #
# LICENCE #
# This program is free software; you can redistribute it and/or modify #
# it under the terms of the GNU General Public License version 2.0, #
# as published by the Free Software Foundation. #
# #
# This program is distributed in the hope that it will be useful, #
# but WITHOUT ANY WARRANTY; without even the implied warranty of #
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the #
# GNU General Public License for more details. #
# ==================================================================== #
#' Count isolates
#'
2018-08-23 00:40:36 +02:00
#' @description These functions can be used to count resistant/susceptible microbial isolates. All functions support quasiquotation with pipes, can be used in \code{dplyr}s \code{\link[dplyr]{summarise}} and support grouped variables, see \emph{Examples}.
2018-08-22 00:02:26 +02:00
#'
#' \code{count_R} and \code{count_IR} can be used to count resistant isolates, \code{count_S} and \code{count_SI} can be used to count susceptible isolates.\cr
2018-10-12 16:35:18 +02:00
#' @param ... one or more vectors (or columns) with antibiotic interpretations. They will be transformed internally with \code{\link{as.rsi}} if needed.
2018-08-22 00:02:26 +02:00
#' @inheritParams portion
2018-10-12 16:35:18 +02:00
#' @details These functions are meant to count isolates. Use the \code{\link{portion}_*} functions to calculate microbial resistance.
2018-08-22 00:02:26 +02:00
#'
2018-10-12 16:35:18 +02:00
#' \code{n_rsi} is an alias of \code{count_all}. They can be used to count all available isolates, i.e. where all input antibiotics have an available result (S, I or R). Their use is equal to \code{\link{n_distinct}}. Their function is equal to \code{count_S(...) + count_IR(...)}.
2018-08-22 00:02:26 +02:00
#'
#' \code{count_df} takes any variable from \code{data} that has an \code{"rsi"} class (created with \code{\link{as.rsi}}) and counts the amounts of R, I and S. The resulting \emph{tidy data} (see Source) \code{data.frame} will have three rows (S/I/R) and a column for each variable with class \code{"rsi"}.
#' @source Wickham H. \strong{Tidy Data.} The Journal of Statistical Software, vol. 59, 2014. \url{http://vita.had.co.nz/papers/tidy-data.html}
2018-10-12 16:35:18 +02:00
#' @seealso \code{\link{portion}_*} to calculate microbial resistance and susceptibility.
2018-08-22 00:02:26 +02:00
#' @keywords resistance susceptibility rsi antibiotics isolate isolates
#' @return Integer
#' @rdname count
#' @name count
#' @export
#' @examples
#' # septic_patients is a data set available in the AMR package. It is true, genuine data.
#' ?septic_patients
#'
#' # Count resistant isolates
#' count_R(septic_patients$amox)
#' count_IR(septic_patients$amox)
#'
2018-12-14 07:48:12 +01:00
#' # Or susceptible isolates
2018-08-22 00:02:26 +02:00
#' count_S(septic_patients$amox)
#' count_SI(septic_patients$amox)
#'
2018-10-12 16:35:18 +02:00
#' # Count all available isolates
#' count_all(septic_patients$amox)
#' n_rsi(septic_patients$amox)
#'
2018-08-22 00:02:26 +02:00
#' # Since n_rsi counts available isolates, you can
#' # calculate back to count e.g. non-susceptible isolates.
#' # This results in the same:
#' count_IR(septic_patients$amox)
#' portion_IR(septic_patients$amox) * n_rsi(septic_patients$amox)
#'
#' library(dplyr)
#' septic_patients %>%
#' group_by(hospital_id) %>%
2018-10-12 16:35:18 +02:00
#' summarise(R = count_R(cipr),
#' I = count_I(cipr),
#' S = count_S(cipr),
#' n1 = count_all(cipr), # the actual total; sum of all three
#' n2 = n_rsi(cipr), # same - analogous to n_distinct
#' total = n()) # NOT the amount of tested isolates!
2018-08-22 00:02:26 +02:00
#'
#' # Count co-resistance between amoxicillin/clav acid and gentamicin,
#' # so we can see that combination therapy does a lot more than mono therapy.
#' # Please mind that `portion_S` calculates percentages right away instead.
2018-10-12 16:35:18 +02:00
#' count_S(septic_patients$amcl) # S = 1057 (67.1%)
#' count_all(septic_patients$amcl) # n = 1576
2018-08-22 00:02:26 +02:00
#'
2018-10-12 16:35:18 +02:00
#' count_S(septic_patients$gent) # S = 1372 (74.0%)
#' count_all(septic_patients$gent) # n = 1855
2018-08-22 00:02:26 +02:00
#'
#' with(septic_patients,
2018-10-12 16:35:18 +02:00
#' count_S(amcl, gent)) # S = 1396 (92.0%)
#' with(septic_patients, # n = 1517
2018-08-22 00:02:26 +02:00
#' n_rsi(amcl, gent))
#'
#' # Get portions S/I/R immediately of all rsi columns
#' septic_patients %>%
#' select(amox, cipr) %>%
#' count_df(translate = FALSE)
#'
#' # It also supports grouping variables
#' septic_patients %>%
#' select(hospital_id, amox, cipr) %>%
#' group_by(hospital_id) %>%
#' count_df(translate = FALSE)
#'
2018-10-19 13:53:31 +02:00
count_R <- function ( ... , also_single_tested = FALSE ) {
2018-08-23 00:40:36 +02:00
rsi_calc ( ... ,
type = " R" ,
2018-08-22 00:02:26 +02:00
include_I = FALSE ,
minimum = 0 ,
as_percent = FALSE ,
2018-10-19 13:53:31 +02:00
also_single_tested = FALSE ,
2018-08-22 00:02:26 +02:00
only_count = TRUE )
}
#' @rdname count
#' @export
2018-10-19 13:53:31 +02:00
count_IR <- function ( ... , also_single_tested = FALSE ) {
2018-08-23 00:40:36 +02:00
rsi_calc ( ... ,
type = " R" ,
2018-08-22 00:02:26 +02:00
include_I = TRUE ,
minimum = 0 ,
as_percent = FALSE ,
2018-10-19 13:53:31 +02:00
also_single_tested = FALSE ,
2018-08-22 00:02:26 +02:00
only_count = TRUE )
}
#' @rdname count
#' @export
2018-10-19 13:53:31 +02:00
count_I <- function ( ... , also_single_tested = FALSE ) {
2018-08-23 00:40:36 +02:00
rsi_calc ( ... ,
type = " I" ,
2018-08-22 00:02:26 +02:00
include_I = FALSE ,
minimum = 0 ,
as_percent = FALSE ,
2018-10-19 13:53:31 +02:00
also_single_tested = FALSE ,
2018-08-22 00:02:26 +02:00
only_count = TRUE )
}
#' @rdname count
#' @export
2018-10-19 13:53:31 +02:00
count_SI <- function ( ... , also_single_tested = FALSE ) {
2018-08-23 00:40:36 +02:00
rsi_calc ( ... ,
type = " S" ,
2018-08-22 00:02:26 +02:00
include_I = TRUE ,
minimum = 0 ,
as_percent = FALSE ,
2018-10-19 13:53:31 +02:00
also_single_tested = FALSE ,
2018-08-22 00:02:26 +02:00
only_count = TRUE )
}
#' @rdname count
#' @export
2018-10-19 13:53:31 +02:00
count_S <- function ( ... , also_single_tested = FALSE ) {
2018-08-23 00:40:36 +02:00
rsi_calc ( ... ,
type = " S" ,
2018-08-22 00:02:26 +02:00
include_I = FALSE ,
minimum = 0 ,
as_percent = FALSE ,
2018-10-19 13:53:31 +02:00
also_single_tested = FALSE ,
2018-08-22 00:02:26 +02:00
only_count = TRUE )
}
2018-10-12 16:35:18 +02:00
#' @rdname count
#' @export
count_all <- function ( ... ) {
# only print warnings once, if needed
count_S ( ... ) + suppressWarnings ( count_IR ( ... ) )
}
#' @rdname count
#' @export
n_rsi <- function ( ... ) {
# only print warnings once, if needed
count_S ( ... ) + suppressWarnings ( count_IR ( ... ) )
}
2018-08-22 00:02:26 +02:00
#' @rdname count
#' @importFrom dplyr %>% select_if bind_rows summarise_if mutate group_vars select everything
#' @export
count_df <- function ( data ,
2018-10-16 09:59:31 +02:00
translate_ab = getOption ( " get_antibiotic_names" , " official" ) ,
combine_IR = FALSE ) {
2018-08-22 00:02:26 +02:00
2018-09-16 22:11:17 +02:00
if ( ! " data.frame" %in% class ( data ) ) {
stop ( " `count_df` must be called on a data.frame" )
}
2018-08-22 00:02:26 +02:00
if ( data %>% select_if ( is.rsi ) %>% ncol ( ) == 0 ) {
stop ( " No columns with class 'rsi' found. See ?as.rsi." )
}
if ( as.character ( translate_ab ) == " TRUE" ) {
translate_ab <- " official"
}
options ( get_antibiotic_names = translate_ab )
resS <- summarise_if ( .tbl = data ,
.predicate = is.rsi ,
.funs = count_S ) %>%
mutate ( Interpretation = " S" ) %>%
select ( Interpretation , everything ( ) )
2018-10-16 09:59:31 +02:00
if ( combine_IR == FALSE ) {
resI <- summarise_if ( .tbl = data ,
.predicate = is.rsi ,
.funs = count_I ) %>%
mutate ( Interpretation = " I" ) %>%
select ( Interpretation , everything ( ) )
resR <- summarise_if ( .tbl = data ,
.predicate = is.rsi ,
.funs = count_R ) %>%
mutate ( Interpretation = " R" ) %>%
select ( Interpretation , everything ( ) )
data.groups <- group_vars ( data )
res <- bind_rows ( resS , resI , resR ) %>%
mutate ( Interpretation = factor ( Interpretation , levels = c ( " R" , " I" , " S" ) , ordered = TRUE ) ) %>%
tidyr :: gather ( Antibiotic , Value , - Interpretation , - data.groups )
} else {
resIR <- summarise_if ( .tbl = data ,
.predicate = is.rsi ,
.funs = count_IR ) %>%
mutate ( Interpretation = " IR" ) %>%
select ( Interpretation , everything ( ) )
data.groups <- group_vars ( data )
res <- bind_rows ( resS , resIR ) %>%
mutate ( Interpretation = factor ( Interpretation , levels = c ( " IR" , " S" ) , ordered = TRUE ) ) %>%
tidyr :: gather ( Antibiotic , Value , - Interpretation , - data.groups )
}
2018-08-22 00:02:26 +02:00
if ( ! translate_ab == FALSE ) {
if ( ! tolower ( translate_ab ) %in% tolower ( colnames ( AMR :: antibiotics ) ) ) {
stop ( " Parameter `translate_ab` does not occur in the `antibiotics` data set." , call. = FALSE )
}
res <- res %>% mutate ( Antibiotic = abname ( Antibiotic , from = " guess" , to = translate_ab ) )
}
res
}