AMR/man/proportion.Rd

292 lines
14 KiB
Plaintext
Raw Normal View History

2018-08-10 15:01:05 +02:00
% Generated by roxygen2: do not edit by hand
2023-01-21 23:47:20 +01:00
% Please edit documentation in R/proportion.R, R/sir_df.R
\name{proportion}
\alias{proportion}
\alias{resistance}
2018-08-10 15:01:05 +02:00
\alias{portion}
\alias{susceptibility}
2023-01-21 23:47:20 +01:00
\alias{sir_confidence_interval}
\alias{proportion_R}
\alias{proportion_IR}
\alias{proportion_I}
\alias{proportion_SI}
\alias{proportion_S}
\alias{proportion_df}
2023-01-21 23:47:20 +01:00
\alias{sir_df}
\title{Calculate Antimicrobial Resistance}
2018-08-10 15:01:05 +02:00
\source{
\strong{M39 Analysis and Presentation of Cumulative Antimicrobial Susceptibility Test Data, 5th Edition}, 2022, \emph{Clinical and Laboratory Standards Institute (CLSI)}. \url{https://clsi.org/standards/products/microbiology/documents/m39/}.
2018-08-10 15:01:05 +02:00
}
\usage{
resistance(..., minimum = 30, as_percent = FALSE, only_all_tested = FALSE)
susceptibility(..., minimum = 30, as_percent = FALSE, only_all_tested = FALSE)
2018-08-10 15:01:05 +02:00
2023-01-21 23:47:20 +01:00
sir_confidence_interval(
...,
ab_result = "R",
minimum = 30,
as_percent = FALSE,
only_all_tested = FALSE,
confidence_level = 0.95,
side = "both",
collapse = FALSE
)
proportion_R(..., minimum = 30, as_percent = FALSE, only_all_tested = FALSE)
2018-08-10 15:01:05 +02:00
proportion_IR(..., minimum = 30, as_percent = FALSE, only_all_tested = FALSE)
2018-08-10 15:01:05 +02:00
proportion_I(..., minimum = 30, as_percent = FALSE, only_all_tested = FALSE)
2018-08-10 15:01:05 +02:00
proportion_SI(..., minimum = 30, as_percent = FALSE, only_all_tested = FALSE)
2018-08-11 21:30:00 +02:00
proportion_S(..., minimum = 30, as_percent = FALSE, only_all_tested = FALSE)
proportion_df(
data,
translate_ab = "name",
language = get_AMR_locale(),
minimum = 30,
as_percent = FALSE,
combine_SI = TRUE,
confidence_level = 0.95
)
2019-06-13 14:28:46 +02:00
2023-01-21 23:47:20 +01:00
sir_df(
data,
translate_ab = "name",
language = get_AMR_locale(),
minimum = 30,
as_percent = FALSE,
combine_SI = TRUE,
confidence_level = 0.95
)
2018-08-10 15:01:05 +02:00
}
\arguments{
2023-01-21 23:47:20 +01:00
\item{...}{one or more vectors (or columns) with antibiotic interpretations. They will be transformed internally with \code{\link[=as.sir]{as.sir()}} if needed. Use multiple columns to calculate (the lack of) co-resistance: the probability where one of two drugs have a resistant or susceptible result. See \emph{Examples}.}
2018-08-10 15:01:05 +02:00
\item{minimum}{the minimum allowed number of available (tested) isolates. Any isolate count lower than \code{minimum} will return \code{NA} with a warning. The default number of \code{30} isolates is advised by the Clinical and Laboratory Standards Institute (CLSI) as best practice, see \emph{Source}.}
2018-08-10 15:01:05 +02:00
2021-05-12 18:15:03 +02:00
\item{as_percent}{a \link{logical} to indicate whether the output must be returned as a hundred fold with \% sign (a character). A value of \code{0.123456} will then be returned as \code{"12.3\%"}.}
2018-08-11 21:30:00 +02:00
2021-05-12 18:15:03 +02:00
\item{only_all_tested}{(for combination therapies, i.e. using more than one variable for \code{...}): a \link{logical} to indicate that isolates must be tested for all antibiotics, see section \emph{Combination Therapy} below}
2023-01-21 23:47:20 +01:00
\item{ab_result}{antibiotic results to test against, must be one or more values of "S", "I", or "R"}
\item{confidence_level}{the confidence level for the returned confidence interval. For the calculation, the number of S or SI isolates, and R isolates are compared with the total number of available isolates with R, S, or I by using \code{\link[=binom.test]{binom.test()}}, i.e., the Clopper-Pearson method.}
\item{side}{the side of the confidence interval to return. The default is \code{"both"} for a length 2 vector, but can also be (abbreviated as) \code{"min"}/\code{"left"}/\code{"lower"}/\code{"less"} or \code{"max"}/\code{"right"}/\code{"higher"}/\code{"greater"}.}
\item{collapse}{a \link{logical} to indicate whether the output values should be 'collapsed', i.e. be merged together into one value, or a character value to use for collapsing}
2023-01-21 23:47:20 +01:00
\item{data}{a \link{data.frame} containing columns with class \code{\link{sir}} (see \code{\link[=as.sir]{as.sir()}})}
2018-08-11 21:30:00 +02:00
2020-12-17 16:22:25 +01:00
\item{translate_ab}{a column name of the \link{antibiotics} data set to translate the antibiotic abbreviations to, using \code{\link[=ab_property]{ab_property()}}}
2019-05-10 16:44:59 +02:00
\item{language}{language of the returned text - the default is the current system language (see \code{\link[=get_AMR_locale]{get_AMR_locale()}}) and can also be set with the \link[=AMR-options]{package option} \code{\link[=AMR-options]{AMR_locale}}. Use \code{language = NULL} or \code{language = ""} to prevent translation.}
2018-10-16 09:59:31 +02:00
\item{combine_SI}{a \link{logical} to indicate whether all values of S and I must be merged into one, so the output only consists of S+I vs. R (susceptible vs. resistant) - the default is \code{TRUE}}
2018-08-10 15:01:05 +02:00
}
\value{
A \link{double} or, when \code{as_percent = TRUE}, a \link{character}.
2018-08-10 15:01:05 +02:00
}
\description{
These functions can be used to calculate the (co-)resistance or susceptibility of microbial isolates (i.e. percentage of S, SI, I, IR or R). All functions support quasiquotation with pipes, can be used in \code{summarise()} from the \code{dplyr} package and also support grouped variables, see \emph{Examples}.
2018-08-10 15:01:05 +02:00
\code{\link[=resistance]{resistance()}} should be used to calculate resistance, \code{\link[=susceptibility]{susceptibility()}} should be used to calculate susceptibility.\cr
2018-08-10 15:01:05 +02:00
}
\details{
The function \code{\link[=resistance]{resistance()}} is equal to the function \code{\link[=proportion_R]{proportion_R()}}. The function \code{\link[=susceptibility]{susceptibility()}} is equal to the function \code{\link[=proportion_SI]{proportion_SI()}}.
2018-08-10 15:01:05 +02:00
2023-01-21 23:47:20 +01:00
Use \code{\link[=sir_confidence_interval]{sir_confidence_interval()}} to calculate the confidence interval, which relies on \code{\link[=binom.test]{binom.test()}}, i.e., the Clopper-Pearson method. This function returns a vector of length 2 at default for antimicrobial \emph{resistance}. Change the \code{side} argument to "left"/"min" or "right"/"max" to return a single value, and change the \code{ab_result} argument to e.g. \code{c("S", "I")} to test for antimicrobial \emph{susceptibility}, see Examples.
\strong{Remember that you should filter your data to let it contain only first isolates!} This is needed to exclude duplicates and to reduce selection bias. Use \code{\link[=first_isolate]{first_isolate()}} to determine them in your data set with one of the four available algorithms.
2019-06-13 14:28:46 +02:00
2020-12-22 00:51:17 +01:00
These functions are not meant to count isolates, but to calculate the proportion of resistance/susceptibility. Use the \code{\link[=count]{count()}} functions to count isolates. The function \code{\link[=susceptibility]{susceptibility()}} is essentially equal to \code{count_susceptible() / count_all()}. \emph{Low counts can influence the outcome - the \code{proportion} functions may camouflage this, since they only return the proportion (albeit being dependent on the \code{minimum} argument).}
2023-01-21 23:47:20 +01:00
The function \code{\link[=proportion_df]{proportion_df()}} takes any variable from \code{data} that has an \code{\link{sir}} class (created with \code{\link[=as.sir]{as.sir()}}) and calculates the proportions S, I, and R. It also supports grouped variables. The function \code{\link[=sir_df]{sir_df()}} works exactly like \code{\link[=proportion_df]{proportion_df()}}, but adds the number of isolates.
2018-08-10 15:01:05 +02:00
}
\section{Combination Therapy}{
When using more than one variable for \code{...} (= combination therapy), use \code{only_all_tested} to only count isolates that are tested for all antibiotics/variables that you test them for. See this example for two antibiotics, Drug A and Drug B, about how \code{\link[=susceptibility]{susceptibility()}} works to calculate the \%SI:
\if{html}{\out{<div class="sourceCode">}}\preformatted{--------------------------------------------------------------------
only_all_tested = FALSE only_all_tested = TRUE
----------------------- -----------------------
Drug A Drug B include as include as include as include as
numerator denominator numerator denominator
-------- -------- ---------- ----------- ---------- -----------
S or I S or I X X X X
R S or I X X X X
<NA> S or I X X - -
S or I R X X X X
R R - X - X
<NA> R - - - -
S or I <NA> X X - -
R <NA> - - - -
<NA> <NA> - - - -
--------------------------------------------------------------------
}\if{html}{\out{</div>}}
Please note that, in combination therapies, for \code{only_all_tested = TRUE} applies that:
\if{html}{\out{<div class="sourceCode">}}\preformatted{ count_S() + count_I() + count_R() = count_all()
proportion_S() + proportion_I() + proportion_R() = 1
}\if{html}{\out{</div>}}
and that, in combination therapies, for \code{only_all_tested = FALSE} applies that:
\if{html}{\out{<div class="sourceCode">}}\preformatted{ count_S() + count_I() + count_R() >= count_all()
proportion_S() + proportion_I() + proportion_R() >= 1
}\if{html}{\out{</div>}}
Using \code{only_all_tested} has no impact when only using one antibiotic as input.
}
2023-01-21 23:47:20 +01:00
\section{Interpretation of SIR}{
2019-05-13 10:10:16 +02:00
2023-01-21 23:47:20 +01:00
In 2019, the European Committee on Antimicrobial Susceptibility Testing (EUCAST) has decided to change the definitions of susceptibility testing categories S, I, and R as shown below (\url{https://www.eucast.org/newsiandr/}):
2019-05-13 10:10:16 +02:00
\itemize{
2023-01-21 23:47:20 +01:00
\item \strong{S - Susceptible, standard dosing regimen}\cr
A microorganism is categorised as "Susceptible, standard dosing regimen", when there is a high likelihood of therapeutic success using a standard dosing regimen of the agent.
\item \strong{I - Susceptible, increased exposure} \emph{\cr
A microorganism is categorised as "Susceptible, Increased exposure}" when there is a high likelihood of therapeutic success because exposure to the agent is increased by adjusting the dosing regimen or by its concentration at the site of infection.
2019-11-29 19:43:23 +01:00
\item \strong{R = Resistant}\cr
2023-01-21 23:47:20 +01:00
A microorganism is categorised as "Resistant" when there is a high likelihood of therapeutic failure even when there is increased exposure.
\itemize{
\item \emph{Exposure} is a function of how the mode of administration, dose, dosing interval, infusion time, as well as distribution and excretion of the antimicrobial agent will influence the infecting organism at the site of infection.
}
2019-05-13 10:10:16 +02:00
}
2022-11-13 13:44:25 +01:00
This AMR package honours this insight. Use \code{\link[=susceptibility]{susceptibility()}} (equal to \code{\link[=proportion_SI]{proportion_SI()}}) to determine antimicrobial susceptibility and \code{\link[=count_susceptible]{count_susceptible()}} (equal to \code{\link[=count_SI]{count_SI()}}) to count susceptible isolates.
2019-05-13 10:10:16 +02:00
}
2018-08-10 15:01:05 +02:00
\examples{
# example_isolates is a data set available in the AMR package.
2022-08-21 16:37:20 +02:00
# run ?example_isolates for more info.
example_isolates
2022-08-21 16:37:20 +02:00
# base R ------------------------------------------------------------
# determines \%R
resistance(example_isolates$AMX)
2023-01-21 23:47:20 +01:00
sir_confidence_interval(example_isolates$AMX)
sir_confidence_interval(example_isolates$AMX,
2022-10-30 14:31:45 +01:00
confidence_level = 0.975
)
sir_confidence_interval(example_isolates$AMX,
confidence_level = 0.975,
collapse = ", "
)
# determines \%S+I:
susceptibility(example_isolates$AMX)
2023-01-21 23:47:20 +01:00
sir_confidence_interval(example_isolates$AMX,
2022-10-30 14:31:45 +01:00
ab_result = c("S", "I")
)
2018-08-10 15:01:05 +02:00
# be more specific
proportion_S(example_isolates$AMX)
proportion_SI(example_isolates$AMX)
proportion_I(example_isolates$AMX)
proportion_IR(example_isolates$AMX)
proportion_R(example_isolates$AMX)
2018-08-10 15:01:05 +02:00
2022-08-21 16:37:20 +02:00
# dplyr -------------------------------------------------------------
2021-05-24 09:00:11 +02:00
\donttest{
2020-05-16 21:40:50 +02:00
if (require("dplyr")) {
2020-05-16 20:08:21 +02:00
example_isolates \%>\%
2022-08-27 20:49:37 +02:00
group_by(ward) \%>\%
2022-08-28 10:31:50 +02:00
summarise(
r = resistance(CIP),
2023-01-21 23:47:20 +01:00
n = n_sir(CIP)
) # n_sir works like n_distinct in dplyr, see ?n_sir
}
if (require("dplyr")) {
example_isolates \%>\%
group_by(ward) \%>\%
summarise(
cipro_R = resistance(CIP),
2023-01-21 23:47:20 +01:00
ci_min = sir_confidence_interval(CIP, side = "min"),
ci_max = sir_confidence_interval(CIP, side = "max"),
)
2022-10-21 15:13:19 +02:00
}
if (require("dplyr")) {
# scoped dplyr verbs with antibiotic selectors
# (you could also use across() of course)
example_isolates \%>\%
group_by(ward) \%>\%
summarise_at(
c(aminoglycosides(), carbapenems()),
resistance
)
}
if (require("dplyr")) {
2020-05-16 20:08:21 +02:00
example_isolates \%>\%
2022-08-27 20:49:37 +02:00
group_by(ward) \%>\%
2022-08-28 10:31:50 +02:00
summarise(
R = resistance(CIP, as_percent = TRUE),
SI = susceptibility(CIP, as_percent = TRUE),
n1 = count_all(CIP), # the actual total; sum of all three
2023-01-21 23:47:20 +01:00
n2 = n_sir(CIP), # same - analogous to n_distinct
2022-08-28 10:31:50 +02:00
total = n()
) # NOT the number of tested isolates!
2020-05-16 20:08:21 +02:00
# Calculate co-resistance between amoxicillin/clav acid and gentamicin,
# so we can see that combination therapy does a lot more than mono therapy:
2022-08-28 10:31:50 +02:00
example_isolates \%>\% susceptibility(AMC) # \%SI = 76.3\%
example_isolates \%>\% count_all(AMC) # n = 1879
example_isolates \%>\% susceptibility(GEN) # \%SI = 75.4\%
example_isolates \%>\% count_all(GEN) # n = 1855
2020-05-16 20:08:21 +02:00
example_isolates \%>\% susceptibility(AMC, GEN) # \%SI = 94.1\%
2022-08-28 10:31:50 +02:00
example_isolates \%>\% count_all(AMC, GEN) # n = 1939
2020-05-16 20:08:21 +02:00
# See Details on how `only_all_tested` works. Example:
example_isolates \%>\%
2022-08-28 10:31:50 +02:00
summarise(
numerator = count_susceptible(AMC, GEN),
denominator = count_all(AMC, GEN),
proportion = susceptibility(AMC, GEN)
)
2020-05-16 20:08:21 +02:00
example_isolates \%>\%
2022-08-28 10:31:50 +02:00
summarise(
numerator = count_susceptible(AMC, GEN, only_all_tested = TRUE),
denominator = count_all(AMC, GEN, only_all_tested = TRUE),
proportion = susceptibility(AMC, GEN, only_all_tested = TRUE)
)
2020-05-16 20:08:21 +02:00
example_isolates \%>\%
2022-08-27 20:49:37 +02:00
group_by(ward) \%>\%
2022-08-28 10:31:50 +02:00
summarise(
cipro_p = susceptibility(CIP, as_percent = TRUE),
cipro_n = count_all(CIP),
genta_p = susceptibility(GEN, as_percent = TRUE),
genta_n = count_all(GEN),
combination_p = susceptibility(CIP, GEN, as_percent = TRUE),
combination_n = count_all(CIP, GEN)
)
2023-01-21 23:47:20 +01:00
# Get proportions S/I/R immediately of all sir columns
2020-05-16 20:08:21 +02:00
example_isolates \%>\%
select(AMX, CIP) \%>\%
proportion_df(translate = FALSE)
2022-08-28 10:31:50 +02:00
2020-05-16 20:08:21 +02:00
# It also supports grouping variables
2023-01-21 23:47:20 +01:00
# (use sir_df to also include the count)
2020-05-16 20:08:21 +02:00
example_isolates \%>\%
2022-08-27 20:49:37 +02:00
select(ward, AMX, CIP) \%>\%
group_by(ward) \%>\%
2023-01-21 23:47:20 +01:00
sir_df(translate = FALSE)
2020-05-16 21:40:50 +02:00
}
2018-08-10 15:01:05 +02:00
}
2021-05-24 09:00:11 +02:00
}
2018-08-10 15:01:05 +02:00
\seealso{
2020-07-08 14:48:06 +02:00
\code{\link[=count]{count()}} to count resistant and susceptible isolates.
2018-08-10 15:01:05 +02:00
}