diff --git a/DESCRIPTION b/DESCRIPTION index 696caf39..ad9c6049 100644 --- a/DESCRIPTION +++ b/DESCRIPTION @@ -1,6 +1,6 @@ Package: AMR -Version: 1.8.0.9005 -Date: 2022-03-10 +Version: 1.8.1 +Date: 2022-03-14 Title: Antimicrobial Resistance Data Analysis Description: Functions to simplify and standardise antimicrobial resistance (AMR) data analysis and to work with microbial and antimicrobial properties by diff --git a/NEWS.md b/NEWS.md index e98b492e..18f36e42 100755 --- a/NEWS.md +++ b/NEWS.md @@ -1,5 +1,5 @@ -# `AMR` 1.8.0.9005 -## Last updated: 10 March 2022 +# `AMR` 1.8.1 + All functions in this package are considered to be stable. Updates to the AMR interpretation rules (such as by EUCAST and CLSI), the microbial taxonomy, and the antibiotic dosages will all be updated every 6 to 12 months. diff --git a/R/sysdata.rda b/R/sysdata.rda index aa840ce9..e8969779 100644 Binary files a/R/sysdata.rda and b/R/sysdata.rda differ diff --git a/R/zzz.R b/R/zzz.R index c8df3be3..2d16236a 100755 --- a/R/zzz.R +++ b/R/zzz.R @@ -116,21 +116,7 @@ if (utf8_supported && !is_latex) { # Helper functions -------------------------------------------------------- create_AB_lookup <- function() { - AB_lookup <- AMR::antibiotics - AB_lookup$generalised_name <- generalise_antibiotic_name(AB_lookup$name) - AB_lookup$generalised_synonyms <- lapply(AB_lookup$synonyms, generalise_antibiotic_name) - AB_lookup$generalised_abbreviations <- lapply(AB_lookup$abbreviations, generalise_antibiotic_name) - AB_lookup$generalised_loinc <- lapply(AB_lookup$loinc, generalise_antibiotic_name) - AB_lookup$generalised_all <- unname(lapply(as.list(as.data.frame(t(AB_lookup[, - c("ab", "atc", "cid", "name", - colnames(AB_lookup)[colnames(AB_lookup) %like% "generalised"]), - drop = FALSE]), - stringsAsFactors = FALSE)), - function(x) { - x <- generalise_antibiotic_name(unname(unlist(x))) - x[x != ""] - })) - AB_lookup + cbind(AMR::antibiotics, AB_LOOKUP) } create_MO_lookup <- function() { @@ -145,12 +131,7 @@ create_MO_lookup <- function() { MO_lookup[which(is.na(MO_lookup$kingdom_index)), "kingdom_index"] <- 5 # use this paste instead of `fullname` to work with Viridans Group Streptococci, etc. - MO_lookup$fullname_lower <- tolower(trimws(paste(MO_lookup$genus, - MO_lookup$species, - MO_lookup$subspecies))) - ind <- MO_lookup$genus == "" | grepl("^[(]unknown ", MO_lookup$fullname, perl = TRUE) - MO_lookup[ind, "fullname_lower"] <- tolower(MO_lookup[ind, "fullname"]) - MO_lookup$fullname_lower <- trimws(gsub("[^.a-z0-9/ \\-]+", "", MO_lookup$fullname_lower, perl = TRUE)) + MO_lookup$fullname_lower <- MO_FULLNAME_LOWER # add a column with only "e coli" like combinations MO_lookup$g_species <- gsub("^([a-z])[a-z]+ ([a-z]+) ?.*", "\\1 \\2", MO_lookup$fullname_lower, perl = TRUE) diff --git a/data-raw/AMR_latest.tar.gz b/data-raw/AMR_latest.tar.gz index ef69a073..94158329 100644 Binary files a/data-raw/AMR_latest.tar.gz and b/data-raw/AMR_latest.tar.gz differ diff --git a/data-raw/_internals.R b/data-raw/_internals.R index 5bd82ed5..cf7198c4 100644 --- a/data-raw/_internals.R +++ b/data-raw/_internals.R @@ -122,9 +122,21 @@ create_species_cons_cops <- function(type = c("CoNS", "CoPS")) { "mo", drop = TRUE] } } +create_MO_fullname_lower <- function() { + MO_lookup <- AMR::microorganisms + # use this paste instead of `fullname` to work with Viridans Group Streptococci, etc. + MO_lookup$fullname_lower <- tolower(trimws(paste(MO_lookup$genus, + MO_lookup$species, + MO_lookup$subspecies))) + ind <- MO_lookup$genus == "" | grepl("^[(]unknown ", MO_lookup$fullname, perl = TRUE) + MO_lookup[ind, "fullname_lower"] <- tolower(MO_lookup[ind, "fullname"]) + MO_lookup$fullname_lower <- trimws(gsub("[^.a-z0-9/ \\-]+", "", MO_lookup$fullname_lower, perl = TRUE)) + MO_lookup$fullname_lower +} MO_CONS <- create_species_cons_cops("CoNS") MO_COPS <- create_species_cons_cops("CoPS") MO_STREP_ABCG <- as.mo(MO_lookup[which(MO_lookup$genus == "Streptococcus"), "mo", drop = TRUE], Lancefield = TRUE) %in% c("B_STRPT_GRPA", "B_STRPT_GRPB", "B_STRPT_GRPC", "B_STRPT_GRPG") +MO_FULLNAME_LOWER <- create_MO_fullname_lower() # antibiotic groups # (these will also be used for eucast_rules() and understanding data-raw/eucast_rules.tsv) @@ -160,6 +172,24 @@ AB_BETALACTAMS <- c(AB_PENICILLINS, AB_CEPHALOSPORINS, AB_CARBAPENEMS) # this will be used for documentation: DEFINED_AB_GROUPS <- ls(envir = globalenv()) DEFINED_AB_GROUPS <- DEFINED_AB_GROUPS[!DEFINED_AB_GROUPS %in% globalenv_before_ab] +create_AB_lookup <- function() { + AB_lookup <- AMR::antibiotics + AB_lookup$generalised_name <- generalise_antibiotic_name(AB_lookup$name) + AB_lookup$generalised_synonyms <- lapply(AB_lookup$synonyms, generalise_antibiotic_name) + AB_lookup$generalised_abbreviations <- lapply(AB_lookup$abbreviations, generalise_antibiotic_name) + AB_lookup$generalised_loinc <- lapply(AB_lookup$loinc, generalise_antibiotic_name) + AB_lookup$generalised_all <- unname(lapply(as.list(as.data.frame(t(AB_lookup[, + c("ab", "atc", "cid", "name", + colnames(AB_lookup)[colnames(AB_lookup) %like% "generalised"]), + drop = FALSE]), + stringsAsFactors = FALSE)), + function(x) { + x <- generalise_antibiotic_name(unname(unlist(x))) + x[x != ""] + })) + AB_lookup[, colnames(AB_lookup)[colnames(AB_lookup) %like% "^generalised"]] +} +AB_LOOKUP <- create_AB_lookup() # Export to package as internal data ---- usethis::use_data(EUCAST_RULES_DF, @@ -169,6 +199,8 @@ usethis::use_data(EUCAST_RULES_DF, MO_CONS, MO_COPS, MO_STREP_ABCG, + MO_FULLNAME_LOWER, + AB_LOOKUP, AB_AMINOGLYCOSIDES, AB_AMINOPENICILLINS, AB_ANTIFUNGALS, diff --git a/docs/404.html b/docs/404.html index 7bc24820..280769ef 100644 --- a/docs/404.html +++ b/docs/404.html @@ -43,7 +43,7 @@
diff --git a/docs/LICENSE-text.html b/docs/LICENSE-text.html index b9eafa18..d3d3defe 100644 --- a/docs/LICENSE-text.html +++ b/docs/LICENSE-text.html @@ -17,7 +17,7 @@ diff --git a/docs/articles/AMR.html b/docs/articles/AMR.html index bf8916e3..16dc670c 100644 --- a/docs/articles/AMR.html +++ b/docs/articles/AMR.html @@ -44,7 +44,7 @@ @@ -192,7 +192,7 @@vignettes/AMR.Rmd
AMR.Rmd
So only 53.6% is suitable for resistance analysis! We can now filter +
So only 53.1% is suitable for resistance analysis! We can now filter
on it with the filter()
function, also from the
dplyr
package:
So we end up with 10,713 isolates for analysis. Now our data looks +
So we end up with 10,616 isolates for analysis. Now our data looks like:
head(data_1st)
Time for the analysis!
@@ -809,8 +809,8 @@ readable:data_1st %>% freq(genus, species)
Frequency table
Class: character
-Length: 10,713
-Available: 10,713 (100%, NA: 0 = 0%)
+Length: 10,616
+Available: 10,616 (100%, NA: 0 = 0%)
Unique: 4
Shortest: 16
Longest: 24
proportion_SI()
, equa
own:
data_1st %>% resistance(AMX)
-# [1] 0.5424251
Or can be used in conjunction with group_by()
and
summarise()
, both from the dplyr
package:
@@ -1162,19 +1162,19 @@ own:Hospital A -0.5412355 +0.5451684 Hospital B -0.5406417 +0.5455526 Hospital C -0.5450746 +0.5361146 @@ -1197,23 +1197,23 @@ all isolates available for every group (i.e. values S, I or R): Hospital D -0.5452821 +0.5511069 Hospital A -0.5412355 -3189 +0.5451684 +3177 Hospital B -0.5406417 -3740 +0.5455526 +3710 Hospital C -0.5450746 -1675 +0.5361146 +1606 @@ -1236,27 +1236,27 @@ therapies very easily: Hospital D -0.5452821 -2109 +0.5511069 +2123 Escherichia -0.7711053 -0.8696693 -0.9738903 +0.7746630 +0.8728868 +0.9779585 Klebsiella -0.8108108 -0.9037162 -0.9805743 +0.8454936 +0.9081545 +0.9896996 Staphylococcus -0.7907308 -0.8827094 -0.9732620 +0.7874539 +0.8963100 +0.9797048 @@ -1284,23 +1284,23 @@ classes, use a antibiotic class selector such as Streptococcus -0.5324248 +0.5357834 0.0000000 -0.5324248 +0.5357834 Hospital A -54.1% -27.2% +54.5% +26.5% Hospital B -54.1% -27.4% +54.6% +25.9% Hospital C -54.5% -25.0% +53.6% +25.3% @@ -1402,16 +1402,18 @@ classes) Hospital D -54.5% -25.9% +55.1% +26.4% <mic>
and<disk>
:mic_values <- random_mic(size = 100) mic_values # Class <mic> -# [1] 1 128 256 8 64 0.5 4 32 16 0.025 -# [11] 16 0.025 2 1 0.025 64 32 32 8 0.5 -# [21] 0.025 256 1 0.005 0.001 1 16 0.025 1 0.002 -# [31] 0.0625 0.125 0.0625 0.01 0.01 4 64 0.002 0.25 128 -# [41] 64 16 16 0.005 0.125 0.5 0.5 0.5 1 32 -# [51] 0.25 0.125 8 8 0.25 256 2 256 0.125 128 -# [61] 0.001 0.001 32 4 16 256 2 0.01 4 8 -# [71] 0.001 0.125 1 0.01 0.25 8 1 0.005 64 0.025 -# [81] 256 16 1 64 8 32 0.002 0.01 4 0.0625 -# [91] 0.025 0.002 0.005 0.01 256 0.125 16 1 0.5 0.01
# base R:
plot(mic_values)
# base R:
plot(disk_values, mo = "E. coli", ab = "cipro")
What are EUCAST rules? The European Committee on Antimicrobial Susceptibility Testing (EUCAST) states on their website:
+What are EUCAST rules? The European Committee on Antimicrobial +Susceptibility Testing (EUCAST) states on +their website:
--EUCAST expert rules are a tabulated collection of expert knowledge on intrinsic resistances, exceptional resistance phenotypes and interpretive rules that may be applied to antimicrobial susceptibility testing in order to reduce errors and make appropriate recommendations for reporting particular resistances.
+EUCAST expert rules are a tabulated collection of expert +knowledge on intrinsic resistances, exceptional resistance phenotypes +and interpretive rules that may be applied to antimicrobial +susceptibility testing in order to reduce errors and make appropriate +recommendations for reporting particular resistances.
In Europe, a lot of medical microbiological laboratories already apply these rules (Brown et al., 2015). Our package features their latest insights on intrinsic resistance and unusual phenotypes (v3.3, 2021).
-Moreover, the eucast_rules()
function we use for this purpose can also apply additional rules, like forcing
In Europe, a lot of medical microbiological laboratories already +apply these rules (Brown +et al., 2015). Our package features their latest insights +on intrinsic resistance and unusual phenotypes (v3.3, 2021).
+Moreover, the eucast_rules()
function we use for this
+purpose can also apply additional rules, like forcing
+
These rules can be used to discard impossible bug-drug combinations in your data. For example, Klebsiella produces beta-lactamase that prevents ampicillin (or amoxicillin) from working against it. In other words, practically every strain of Klebsiella is resistant to ampicillin.
-Sometimes, laboratory data can still contain such strains with ampicillin being susceptible to ampicillin. This could be because an antibiogram is available before an identification is available, and the antibiogram is then not re-interpreted based on the identification (namely, Klebsiella). EUCAST expert rules solve this, that can be applied using eucast_rules()
:
These rules can be used to discard impossible bug-drug combinations +in your data. For example, Klebsiella produces beta-lactamase +that prevents ampicillin (or amoxicillin) from working against it. In +other words, practically every strain of Klebsiella is +resistant to ampicillin.
+Sometimes, laboratory data can still contain such strains with
+ampicillin being susceptible to ampicillin. This could be because an
+antibiogram is available before an identification is available, and the
+antibiogram is then not re-interpreted based on the identification
+(namely, Klebsiella). EUCAST expert rules solve this, that can
+be applied using eucast_rules()
:
oops <- data.frame(mo = c("Klebsiella",
"Escherichia"),
@@ -226,7 +247,10 @@
# mo ampicillin
# 1 Klebsiella R
# 2 Escherichia S
A more convenient function is mo_is_intrinsic_resistant()
that uses the same guideline, but allows to check for one or more specific microorganisms or antibiotics:
A more convenient function is
+mo_is_intrinsic_resistant()
that uses the same guideline,
+but allows to check for one or more specific microorganisms or
+antibiotics:
mo_is_intrinsic_resistant(c("Klebsiella", "Escherichia"),
"ampicillin")
@@ -235,7 +259,11 @@
mo_is_intrinsic_resistant("Klebsiella",
c("ampicillin", "kanamycin"))
# [1] TRUE FALSE
EUCAST rules can not only be used for correction, they can also be used for filling in known resistance and susceptibility based on results of other antimicrobials drugs. This process is called interpretive reading, is basically a form of imputation, and is part of the eucast_rules()
function as well:
EUCAST rules can not only be used for correction, they can also be
+used for filling in known resistance and susceptibility based on results
+of other antimicrobials drugs. This process is called interpretive
+reading, is basically a form of imputation, and is part of the
+eucast_rules()
function as well:
data <- data.frame(mo = c("Staphylococcus aureus",
"Enterococcus faecalis",
@@ -397,12 +425,14 @@
diff --git a/docs/articles/MDR.html b/docs/articles/MDR.html
index e306389f..d6bd8507 100644
--- a/docs/articles/MDR.html
+++ b/docs/articles/MDR.html
@@ -44,7 +44,7 @@
vignettes/MDR.Rmd
@@ -198,54 +199,87 @@
-With the function mdro()
, you can determine which micro-organisms are multi-drug resistant organisms (MDRO).
With the function mdro()
, you can determine which
+micro-organisms are multi-drug resistant organisms (MDRO).
The mdro()
function takes a data set as input, such as a regular data.frame
. It tries to automatically determine the right columns for info about your isolates, such as the name of the species and all columns with results of antimicrobial agents. See the help page for more info about how to set the right settings for your data with the command ?mdro
.
For WHONET data (and most other data), all settings are automatically set correctly.
+The mdro()
function takes a data set as input, such as a
+regular data.frame
. It tries to automatically determine the
+right columns for info about your isolates, such as the name of the
+species and all columns with results of antimicrobial agents. See the
+help page for more info about how to set the right settings for your
+data with the command ?mdro
.
For WHONET data (and most other data), all settings are automatically +set correctly.
The mdro()
function support multiple guidelines. You can select a guideline with the guideline
parameter. Currently supported guidelines are (case-insensitive):
The mdro()
function support multiple guidelines. You can
+select a guideline with the guideline
parameter. Currently
+supported guidelines are (case-insensitive):
guideline = "CMI2012"
(default)
Magiorakos AP, Srinivasan A et al. “Multidrug-resistant, extensively drug-resistant and pandrug-resistant bacteria: an international expert proposal for interim standard definitions for acquired resistance.” Clinical Microbiology and Infection (2012) (link)
+Magiorakos AP, Srinivasan A et al. “Multidrug-resistant, +extensively drug-resistant and pandrug-resistant bacteria: an +international expert proposal for interim standard definitions for +acquired resistance.” Clinical Microbiology and Infection (2012) (link)
guideline = "EUCAST3.2"
(or simply guideline = "EUCAST"
)
The European international guideline - EUCAST Expert Rules Version 3.2 “Intrinsic Resistance and Unusual Phenotypes” (link)
+guideline = "EUCAST3.2"
(or simply
+guideline = "EUCAST"
)
The European international guideline - EUCAST Expert Rules Version +3.2 “Intrinsic Resistance and Unusual Phenotypes” (link)
guideline = "EUCAST3.1"
The European international guideline - EUCAST Expert Rules Version 3.1 “Intrinsic Resistance and Exceptional Phenotypes Tables” (link)
+The European international guideline - EUCAST Expert Rules Version +3.1 “Intrinsic Resistance and Exceptional Phenotypes Tables” (link)
guideline = "TB"
The international guideline for multi-drug resistant tuberculosis - World Health Organization “Companion handbook to the WHO guidelines for the programmatic management of drug-resistant tuberculosis” (link)
+The international guideline for multi-drug resistant tuberculosis - +World Health Organization “Companion handbook to the WHO guidelines for +the programmatic management of drug-resistant tuberculosis” (link)
guideline = "MRGN"
The German national guideline - Mueller et al. (2015) Antimicrobial Resistance and Infection Control 4:7. DOI: 10.1186/s13756-015-0047-6
+The German national guideline - Mueller et al. (2015) +Antimicrobial Resistance and Infection Control 4:7. DOI: +10.1186/s13756-015-0047-6
guideline = "BRMO"
The Dutch national guideline - Rijksinstituut voor Volksgezondheid en Milieu “WIP-richtlijn BRMO (Bijzonder Resistente Micro-Organismen) (ZKH)” (link)
+The Dutch national guideline - Rijksinstituut voor Volksgezondheid en +Milieu “WIP-richtlijn BRMO (Bijzonder Resistente Micro-Organismen) +(ZKH)” (link)
Please suggest your own (country-specific) guidelines by letting us know: https://github.com/msberends/AMR/issues/new.
+Please suggest your own (country-specific) guidelines by letting us +know: https://github.com/msberends/AMR/issues/new.
You can also use your own custom guideline. Custom guidelines can be set with the custom_mdro_guideline()
function. This is of great importance if you have custom rules to determine MDROs in your hospital, e.g., rules that are dependent on ward, state of contact isolation or other variables in your data.
If you are familiar with case_when()
of the dplyr
package, you will recognise the input method to set your own rules. Rules must be set using what R considers to be the ‘formula notation’:
You can also use your own custom guideline. Custom guidelines can be
+set with the custom_mdro_guideline()
function. This is of
+great importance if you have custom rules to determine MDROs in your
+hospital, e.g., rules that are dependent on ward, state of contact
+isolation or other variables in your data.
If you are familiar with case_when()
of the
+dplyr
package, you will recognise the input method to set
+your own rules. Rules must be set using what R considers to be the
+‘formula notation’:
custom <- custom_mdro_guideline(CIP == "R" & age > 60 ~ "Elderly Type A",
ERY == "R" & age > 60 ~ "Elderly Type B")
If a row/an isolate matches the first rule, the value after the first ~
(in this case ‘Elderly Type A’) will be set as MDRO value. Otherwise, the second rule will be tried and so on. The maximum number of rules is unlimited.
You can print the rules set in the console for an overview. Colours will help reading it if your console supports colours.
+If a row/an isolate matches the first rule, the value after the first
+~
(in this case ‘Elderly Type A’) will be set as
+MDRO value. Otherwise, the second rule will be tried and so on. The
+maximum number of rules is unlimited.
You can print the rules set in the console for an overview. Colours +will help reading it if your console supports colours.
custom
# A set of custom MDRO rules:
@@ -255,7 +289,8 @@
#
# Unmatched rows will return NA.
# Results will be of class <factor>, with ordered levels: Negative < Elderly Type A < Elderly Type B
The outcome of the function can be used for the guideline
argument in the mdro()
function:
The outcome of the function can be used for the
+guideline
argument in the mdro()
function:
x <- mdro(example_isolates, guideline = custom)
# Determining MDROs based on custom rules, resulting in factor levels:
@@ -266,14 +301,25 @@
# x
# Negative Elderly Type A Elderly Type B
# 1070 198 732
The rules set (the custom
object in this case) could be exported to a shared file location using saveRDS()
if you collaborate with multiple users. The custom rules set could then be imported using readRDS()
.
The rules set (the custom
object in this case) could be
+exported to a shared file location using saveRDS()
if you
+collaborate with multiple users. The custom rules set could then be
+imported using readRDS()
.
The mdro()
function always returns an ordered factor
for predefined guidelines. For example, the output of the default guideline by Magiorakos et al. returns a factor
with levels ‘Negative’, ‘MDR’, ‘XDR’ or ‘PDR’ in that order.
The next example uses the example_isolates
data set. This is a data set included with this package and contains full antibiograms of 2,000 microbial isolates. It reflects reality and can be used to practise AMR data analysis. If we test the MDR/XDR/PDR guideline on this data set, we get:
The mdro()
function always returns an ordered
+factor
for predefined guidelines. For example, the output
+of the default guideline by Magiorakos et al. returns a
+factor
with levels ‘Negative’, ‘MDR’, ‘XDR’ or ‘PDR’ in
+that order.
The next example uses the example_isolates
data set.
+This is a data set included with this package and contains full
+antibiograms of 2,000 microbial isolates. It reflects reality and can be
+used to practise AMR data analysis. If we test the MDR/XDR/PDR guideline
+on this data set, we get:
Only results with ‘R’ are considered as resistance. Use combine_SI = FALSE
to also consider ‘I’ as resistance.
Determining multidrug-resistant organisms (MDRO), according to: Guideline: Multidrug-resistant, extensively drug-resistant and pandrug-resistant bacteria: an international expert proposal for interim standard definitions for acquired resistance. Author(s): Magiorakos AP, Srinivasan A, Carey RB, …, Vatopoulos A, Weber JT, Monnet DL Source: Clinical Microbiology and Infection 18:3, 2012; doi: 10.1111/j.1469-0691.2011.03570.x
+# Warning: in `mdro()`: NA introduced for isolates where the available percentage of +# antimicrobial classes was below 50% (set with `pct_required_classes`)Only results with ‘R’ are considered as resistance. Use
+combine_SI = FALSE
to also consider ‘I’ as resistance.
Determining multidrug-resistant organisms (MDRO), according to: +Guideline: Multidrug-resistant, extensively drug-resistant and +pandrug-resistant bacteria: an international expert proposal for interim +standard definitions for acquired resistance. Author(s): Magiorakos AP, +Srinivasan A, Carey RB, …, Vatopoulos A, Weber JT, Monnet DL Source: +Clinical Microbiology and Infection 18:3, 2012; doi: +10.1111/j.1469-0691.2011.03570.x
(16 isolates had no test results)
Frequency table
Class: factor > ordered (numeric)
Length: 2,000
-Levels: 4: Negative < Multi-drug-resistant (MDR) < Extensively drug-resistant …
+Levels: 4: Negative < Multi-drug-resistant (MDR) < Extensively
+drug-resistant …
Available: 1,729 (86.45%, NA: 271 = 13.55%)
Unique: 2
Item | @@ -320,21 +382,22 @@ Unique: 21 | Negative | 1601 | -92.60% | +92.6% | 1601 | -92.60% | +92.6% | |
---|---|---|---|---|---|---|---|---|---|
2 | Multi-drug-resistant (MDR) | 128 | -7.40% | +7.4% | 1729 | -100.00% | +100.0% |
For another example, I will create a data set to determine multi-drug resistant TB:
+For another example, I will create a data set to determine multi-drug +resistant TB:
# random_rsi() is a helper function to generate
# a random vector with values S, I and R
@@ -345,7 +408,8 @@ Unique: 2
pyrazinamide = random_rsi(5000),
moxifloxacin = random_rsi(5000),
kanamycin = random_rsi(5000))
Because all column names are automatically verified for valid drug names or codes, this would have worked exactly the same way:
+Because all column names are automatically verified for valid drug +names or codes, this would have worked exactly the same way:
my_TB_data <- data.frame(RIF = random_rsi(5000),
INH = random_rsi(5000),
@@ -358,20 +422,21 @@ Unique: 2
head(my_TB_data)
# rifampicin isoniazid gatifloxacin ethambutol pyrazinamide moxifloxacin
-# 1 I R I S R S
-# 2 I S R R S R
-# 3 R I S I R S
-# 4 S S I R I S
-# 5 S R S S S I
-# 6 S R R S R I
+# 1 R S S I S I
+# 2 R S S S R I
+# 3 S S I I S S
+# 4 I I S S S S
+# 5 I R R I R R
+# 6 I R S I S S
# kanamycin
-# 1 S
-# 2 I
+# 1 I
+# 2 R
# 3 R
-# 4 R
+# 4 S
# 5 I
-# 6 R
-We can now add the interpretation of MDR-TB to our data set. You can use:
+# 6 I
We can now add the interpretation of MDR-TB to our data set. You can +use:
mdro(my_TB_data, guideline = "TB")
or its shortcut mdr_tb()
:
Frequency table
Class: factor > ordered (numeric)
Length: 5,000
-Levels: 5: Negative < Mono-resistant < Poly-resistant < Multi-drug-resistant <…
-Available: 5,000 (100.0%, NA: 0 = 0.0%)
+Levels: 5: Negative < Mono-resistant < Poly-resistant <
+Multi-drug-resistant <…
+Available: 5,000 (100%, NA: 0 = 0%)
Unique: 5
Item | @@ -413,40 +487,40 @@ Unique: 5|||||||||
---|---|---|---|---|---|---|---|---|---|
1 | Mono-resistant | -3250 | -65.00% | -3250 | -65.00% | +3175 | +63.50% | +3175 | +63.50% |
2 | Negative | -975 | -19.50% | -4225 | -84.50% | +1057 | +21.14% | +4232 | +84.64% |
3 | Multi-drug-resistant | -474 | -9.48% | -4699 | -93.98% | +431 | +8.62% | +4663 | +93.26% |
4 | Poly-resistant | -203 | -4.06% | -4902 | -98.04% | +236 | +4.72% | +4899 | +97.98% |
5 | Extensively drug-resistant | -98 | -1.96% | +101 | +2.02% | 5000 | 100.00% |
Item | @@ -334,7 +361,7 @@ Longest: 40
---|
(omitted 27 entries, n = 56 [11.20%])
+(omitted 27 entries, n = 56 [11.2%])
# our transformed antibiotic columns
# amoxicillin/clavulanic acid (J01CR02) as an example
@@ -388,7 +415,8 @@ Drug group: Beta-lactams/penicillins
A first glimpse at results
-An easy ggplot
will already give a lot of information, using the included ggplot_rsi()
function:
+An easy ggplot
will already give a lot of information,
+using the included ggplot_rsi()
function:
data %>%
group_by(Country) %>%
@@ -408,12 +436,14 @@ Drug group: Beta-lactams/penicillins
diff --git a/docs/articles/WHONET_files/figure-html/unnamed-chunk-7-1.png b/docs/articles/WHONET_files/figure-html/unnamed-chunk-7-1.png
index 78144edc..0ce239d4 100644
Binary files a/docs/articles/WHONET_files/figure-html/unnamed-chunk-7-1.png and b/docs/articles/WHONET_files/figure-html/unnamed-chunk-7-1.png differ
diff --git a/docs/articles/benchmarks.html b/docs/articles/benchmarks.html
index 0e2362a8..7ca1bb22 100644
--- a/docs/articles/benchmarks.html
+++ b/docs/articles/benchmarks.html
@@ -44,7 +44,7 @@
@@ -198,14 +198,30 @@
-One of the most important features of this package is the complete microbial taxonomic database, supplied by the Catalogue of Life (CoL) and the List of Prokaryotic names with Standing in Nomenclature (LPSN). We created a function as.mo()
that transforms any user input value to a valid microbial ID by using intelligent rules combined with the microbial taxonomy.
-Using the microbenchmark
package, we can review the calculation performance of this function. Its function microbenchmark()
runs different input expressions independently of each other and measures their time-to-result.
+One of the most important features of this package is the complete
+microbial taxonomic database, supplied by the Catalogue of Life (CoL) and
+the List of Prokaryotic names with
+Standing in Nomenclature (LPSN). We created a function
+as.mo()
that transforms any user input value to a valid
+microbial ID by using intelligent rules combined with the microbial
+taxonomy.
+Using the microbenchmark
package, we can review the
+calculation performance of this function. Its function
+microbenchmark()
runs different input expressions
+independently of each other and measures their time-to-result.
-In the next test, we try to ‘coerce’ different input values into the microbial code of Staphylococcus aureus. Coercion is a computational process of forcing output based on an input. For microorganism names, coercing user input to taxonomically valid microorganism names is crucial to ensure correct interpretation and to enable grouping based on taxonomic properties.
-The actual result is the same every time: it returns its microorganism code B_STPHY_AURS
(B stands for Bacteria, its taxonomic kingdom).
+In the next test, we try to ‘coerce’ different input values into the
+microbial code of Staphylococcus aureus. Coercion is a
+computational process of forcing output based on an input. For
+microorganism names, coercing user input to taxonomically valid
+microorganism names is crucial to ensure correct interpretation and to
+enable grouping based on taxonomic properties.
+The actual result is the same every time: it returns its
+microorganism code B_STPHY_AURS
(B stands for
+Bacteria, its taxonomic kingdom).
But the calculation time differs a lot:
S.aureus <- microbenchmark(
@@ -224,27 +240,40 @@
times = 25)
print(S.aureus, unit = "ms", signif = 2)
# Unit: milliseconds
-# expr min lq mean median uq max neval
-# as.mo("sau") 10.0 12.0 20.0 12.0 15.0 53 25
-# as.mo("stau") 49.0 54.0 72.0 58.0 91.0 97 25
-# as.mo("STAU") 50.0 54.0 71.0 57.0 90.0 110 25
-# as.mo("staaur") 10.0 12.0 17.0 12.0 14.0 51 25
-# as.mo("STAAUR") 10.0 12.0 17.0 12.0 14.0 54 25
-# as.mo("S. aureus") 26.0 27.0 40.0 31.0 56.0 74 25
-# as.mo("S aureus") 26.0 27.0 39.0 29.0 58.0 68 25
-# as.mo("Staphylococcus aureus") 3.5 3.9 6.6 4.1 4.8 38 25
-# as.mo("Staphylococcus aureus (MRSA)") 230.0 240.0 250.0 240.0 250.0 280 25
-# as.mo("Sthafilokkockus aaureuz") 180.0 190.0 200.0 190.0 200.0 290 25
-# as.mo("MRSA") 11.0 12.0 19.0 13.0 14.0 50 25
-# as.mo("VISA") 21.0 22.0 32.0 25.0 50.0 60 25
+# expr min lq mean median uq max neval
+# as.mo("sau") 12.0 13 18.0 14.0 15.0 48 25
+# as.mo("stau") 54.0 59 80.0 91.0 96.0 99 25
+# as.mo("STAU") 53.0 61 77.0 66.0 94.0 100 25
+# as.mo("staaur") 12.0 13 19.0 14.0 16.0 62 25
+# as.mo("STAAUR") 12.0 13 16.0 14.0 15.0 48 25
+# as.mo("S. aureus") 28.0 30 38.0 33.0 35.0 69 25
+# as.mo("S aureus") 27.0 31 46.0 34.0 65.0 73 25
+# as.mo("Staphylococcus aureus") 3.7 4 6.7 4.3 4.5 36 25
+# as.mo("Staphylococcus aureus (MRSA)") 260.0 270 290.0 280.0 290.0 360 25
+# as.mo("Sthafilokkockus aaureuz") 190.0 210 220.0 210.0 220.0 330 25
+# as.mo("MRSA") 12.0 13 20.0 14.0 16.0 68 25
+# as.mo("VISA") 22.0 23 32.0 25.0 27.0 63 25
-In the table above, all measurements are shown in milliseconds (thousands of seconds). A value of 5 milliseconds means it can determine 200 input values per second. It case of 200 milliseconds, this is only 5 input values per second. It is clear that accepted taxonomic names are extremely fast, but some variations are up to 47 times slower to determine.
-To improve performance, we implemented two important algorithms to save unnecessary calculations: repetitive results and already precalculated results.
+In the table above, all measurements are shown in milliseconds
+(thousands of seconds). A value of 5 milliseconds means it can determine
+200 input values per second. It case of 200 milliseconds, this is only 5
+input values per second. It is clear that accepted taxonomic names are
+extremely fast, but some variations are up to 67 times slower to
+determine.
+To improve performance, we implemented two important algorithms to
+save unnecessary calculations: repetitive results and
+already precalculated results.
Repetitive results
-Repetitive results are values that are present more than once in a vector. Unique values will only be calculated once by as.mo()
. So running as.mo(c("E. coli", "E. coli"))
will check the value "E. coli"
only once.
-To prove this, we will use mo_name()
for testing - a helper function that returns the full microbial name (genus, species and possibly subspecies) which uses as.mo()
internally.
+Repetitive results are values that are present more than once in a
+vector. Unique values will only be calculated once by
+as.mo()
. So running
+as.mo(c("E. coli", "E. coli"))
will check the value
+"E. coli"
only once.
+To prove this, we will use mo_name()
for testing - a
+helper function that returns the full microbial name (genus, species and
+possibly subspecies) which uses as.mo()
internally.
# start with the example_isolates data set
x <- example_isolates %>%
@@ -258,8 +287,8 @@
# what do these values look like? They are of class <mo>:
head(x)
# Class <mo>
-# [1] B_STPHY_AURS B_STRPT_EQNS B_KLBSL_PNMN B_STPHY_EPDR B_STPHY_AURS
-# [6] B_CRYNB_STRT
+# [1] B_ESCHR_COLI B_STRPT_MITS B_STRPT_ANGN B_STPHY_CONS B_ESCHR_COLI
+# [6] B_ESCHR_COLI
# as the example_isolates data set has 2,000 rows, we should have 2 million items
length(x)
@@ -275,13 +304,20 @@
print(run_it, unit = "ms", signif = 3)
# Unit: milliseconds
# expr min lq mean median uq max neval
-# mo_name(x) 196 209 274 223 364 388 10
-So getting official taxonomic names of 2,000,000 (!!) items consisting of 90 unique values only takes 0.223 seconds. That is 112 nanoseconds on average. You only lose time on your unique input values.
+# mo_name(x) 207 225 288 233 370 414 10
+So getting official taxonomic names of 2,000,000 (!!) items
+consisting of 90 unique values only takes 0.233 seconds. That is 117
+nanoseconds on average. You only lose time on your unique input
+values.
What about precalculated results? If the input is an already precalculated result of a helper function such as mo_name()
, it almost doesn’t take any time at all. In other words, if you run mo_name()
on a valid taxonomic name, it will return the results immediately (see ‘C’ below):
What about precalculated results? If the input is an already
+precalculated result of a helper function such as
+mo_name()
, it almost doesn’t take any time at all. In other
+words, if you run mo_name()
on a valid taxonomic name, it
+will return the results immediately (see ‘C’ below):
run_it <- microbenchmark(A = mo_name("STAAUR"),
B = mo_name("S. aureus"),
@@ -289,11 +325,14 @@
times = 10)
print(run_it, unit = "ms", signif = 3)
# Unit: milliseconds
-# expr min lq mean median uq max neval
-# A 8.00 9.16 9.19 9.28 9.46 9.73 10
-# B 23.40 27.20 32.60 27.90 28.10 80.20 10
-# C 1.85 2.25 2.40 2.47 2.62 2.90 10
So going from mo_name("Staphylococcus aureus")
to "Staphylococcus aureus"
takes 0.0025 seconds - it doesn’t even start calculating if the result would be the same as the expected resulting value. That goes for all helper functions:
So going from mo_name("Staphylococcus aureus")
to
+"Staphylococcus aureus"
takes 0.0028 seconds - it doesn’t
+even start calculating if the result would be the same as the
+expected resulting value. That goes for all helper functions:
run_it <- microbenchmark(A = mo_species("aureus"),
B = mo_genus("Staphylococcus"),
@@ -307,20 +346,28 @@
print(run_it, unit = "ms", signif = 3)
# Unit: milliseconds
# expr min lq mean median uq max neval
-# A 1.76 1.80 2.07 1.95 2.26 2.90 10
-# B 1.69 1.73 1.90 1.81 2.03 2.48 10
-# C 1.71 1.77 1.92 1.91 2.05 2.17 10
-# D 1.68 1.71 1.76 1.76 1.82 1.88 10
-# E 1.68 1.70 1.89 1.89 2.04 2.26 10
-# F 1.67 1.75 1.93 1.89 2.11 2.35 10
-# G 1.70 1.76 1.97 1.88 2.12 2.43 10
-# H 1.67 1.71 1.83 1.75 1.98 2.14 10
Of course, when running mo_phylum("Firmicutes")
the function has zero knowledge about the actual microorganism, namely S. aureus. But since the result would be "Firmicutes"
anyway, there is no point in calculating the result. And because this package contains all phyla of all known bacteria, it can just return the initial value immediately.
Of course, when running mo_phylum("Firmicutes")
the
+function has zero knowledge about the actual microorganism, namely
+S. aureus. But since the result would be
+"Firmicutes"
anyway, there is no point in calculating the
+result. And because this package contains all phyla of all known
+bacteria, it can just return the initial value immediately.
When the system language is non-English and supported by this AMR
package, some functions will have a translated result. This almost does’t take extra time (compare “en” from the table below with the other languages):
When the system language is non-English and supported by this
+AMR
package, some functions will have a translated result.
+This almost does’t take extra time (compare “en” from the table below
+with the other languages):
CoNS <- as.mo("CoNS")
CoNS
@@ -349,18 +396,19 @@
times = 100)
print(run_it, unit = "ms", signif = 4)
# Unit: milliseconds
-# expr min lq mean median uq max neval
-# da 1.9470 2.0220 2.190 2.0720 2.358 3.234 100
-# de 1.9560 2.0330 3.649 2.1610 2.401 50.670 100
-# en 0.8937 0.9124 1.022 0.9776 1.120 1.748 100
-# es 1.9710 2.0290 2.216 2.1000 2.391 3.109 100
-# fr 1.8280 1.8960 3.214 1.9420 2.237 71.550 100
-# it 1.9370 1.9970 2.163 2.0610 2.339 3.210 100
-# nl 1.9710 2.0280 2.698 2.1110 2.421 49.340 100
-# pt 1.8920 1.9600 2.119 2.0200 2.261 3.265 100
-# ru 1.8630 1.9420 2.779 2.0270 2.335 66.660 100
-# sv 1.8680 1.9190 4.062 1.9890 2.263 78.870 100
Currently supported languages are Danish, Dutch, English, French, German, Italian, Portuguese, Russian, Spanish and Swedish.
+# expr min lq mean median uq max neval +# da 2.1730 2.476 3.956 2.609 2.873 45.180 100 +# de 2.2170 2.497 3.161 2.646 2.855 48.260 100 +# en 0.9509 1.122 1.640 1.183 1.321 38.430 100 +# es 2.1870 2.546 2.763 2.659 2.872 5.676 100 +# fr 1.9880 2.339 2.609 2.456 2.636 5.197 100 +# it 2.2580 2.475 4.081 2.619 2.867 47.080 100 +# nl 2.3120 2.535 2.792 2.664 2.822 8.113 100 +# pt 2.1930 2.417 3.329 2.528 2.783 48.600 100 +# ru 2.0470 2.360 2.596 2.481 2.683 6.030 100 +# sv 2.2030 2.443 3.077 2.545 2.703 43.350 100Currently supported languages are Danish, Dutch, English, French, +German, Italian, Portuguese, Russian, Spanish and Swedish.
vignettes/datasets.Rmd
datasets.Rmd
As with many uses in R, we need some additional packages for AMR data analysis. Our package works closely together with the tidyverse packages dplyr
and ggplot2
by Dr Hadley Wickham. The tidyverse tremendously improves the way we conduct data science - it allows for a very natural way of writing syntaxes and creating beautiful plots in R.
Our AMR
package depends on these packages and even extends their use and functions.
As with many uses in R, we need some additional packages for AMR data
+analysis. Our package works closely together with the tidyverse packages dplyr
and ggplot2
by Dr
+Hadley Wickham. The tidyverse tremendously improves the way we conduct
+data science - it allows for a very natural way of writing syntaxes and
+creating beautiful plots in R.
Our AMR
package depends on these packages and even
+extends their use and functions.
library(dplyr)
library(ggplot2)
-library(AMR)
+library(AMR)
# (if not yet installed, install with:)
# install.packages(c("tidyverse", "AMR"))
Our package contains a function resistance_predict()
, which takes the same input as functions for other AMR data analysis. Based on a date column, it calculates cases per year and uses a regression model to predict antimicrobial resistance.
Our package contains a function resistance_predict()
,
+which takes the same input as functions for other
+AMR data analysis. Based on a date column, it calculates cases per
+year and uses a regression model to predict antimicrobial
+resistance.
It is basically as easy as:
# resistance prediction of piperacillin/tazobactam (TZP):
resistance_predict(tbl = example_isolates, col_date = "date", col_ab = "TZP", model = "binomial")
@@ -228,10 +237,16 @@
<- example_isolates %>%
predict_TZP resistance_predict(col_ab = "TZP",
model = "binomial")
The function will look for a date column itself if col_date
is not set.
When running any of these commands, a summary of the regression model will be printed unless using resistance_predict(..., info = FALSE)
.
The function will look for a date column itself if
+col_date
is not set.
When running any of these commands, a summary of the regression model
+will be printed unless using
+resistance_predict(..., info = FALSE)
.
# ℹ Using column 'date' as input for `col_date`.
-This text is only a printed summary - the actual result (output) of the function is a data.frame
containing for each year: the number of observations, the actual observed resistance, the estimated resistance and the standard error below and above the estimation:
This text is only a printed summary - the actual result (output) of
+the function is a data.frame
containing for each year: the
+number of observations, the actual observed resistance, the estimated
+resistance and the standard error below and above the estimation:
predict_TZP
# year value se_min se_max observations observed estimated
@@ -264,13 +279,20 @@
# 27 2028 0.43730688 0.3418075 0.5328063 NA NA 0.43730688
# 28 2029 0.46175755 0.3597639 0.5637512 NA NA 0.46175755
# 29 2030 0.48639359 0.3782932 0.5944939 NA NA 0.48639359
-# 30 2031 0.51109592 0.3973697 0.6248221 NA NA 0.51109592
The function plot
is available in base R, and can be extended by other packages to depend the output based on the type of input. We extended its function to cope with resistance predictions:
The function plot
is available in base R, and can be
+extended by other packages to depend the output based on the type of
+input. We extended its function to cope with resistance predictions:
plot(predict_TZP)
This is the fastest way to plot the result. It automatically adds the right axes, error bars, titles, number of available observations and type of model.
-We also support the ggplot2
package with our custom function ggplot_rsi_predict()
to create more appealing plots:
This is the fastest way to plot the result. It automatically adds the +right axes, error bars, titles, number of available observations and +type of model.
+We also support the ggplot2
package with our custom
+function ggplot_rsi_predict()
to create more appealing
+plots:
ggplot_rsi_predict(predict_TZP)
Resistance is not easily predicted; if we look at vancomycin resistance in Gram-positive bacteria, the spread (i.e. standard error) is enormous:
+Resistance is not easily predicted; if we look at vancomycin +resistance in Gram-positive bacteria, the spread (i.e. standard error) +is enormous:
example_isolates %>%
filter(mo_gramstain(mo, language = NULL) == "Gram-positive") %>%
@@ -290,8 +314,13 @@
ggplot_rsi_predict()
# ℹ Using column 'date' as input for `col_date`.
Vancomycin resistance could be 100% in ten years, but might also stay around 0%.
-You can define the model with the model
parameter. The model chosen above is a generalised linear regression model using a binomial distribution, assuming that a period of zero resistance was followed by a period of increasing resistance leading slowly to more and more resistance.
Vancomycin resistance could be 100% in ten years, but might also stay +around 0%.
+You can define the model with the model
parameter. The
+model chosen above is a generalised linear regression model using a
+binomial distribution, assuming that a period of zero resistance was
+followed by a period of increasing resistance leading slowly to more and
+more resistance.
Valid values are:
-"binomial" or "binom" or "logit"
+"binomial" or "binom" or
+"logit"
|
glm(..., family = binomial) |
Generalised linear model with binomial distribution | @@ -328,7 +358,9 @@
For the vancomycin resistance in Gram-positive bacteria, a linear model might be more appropriate since no binomial distribution is to be expected based on the observed years:
+For the vancomycin resistance in Gram-positive bacteria, a linear +model might be more appropriate since no binomial distribution is to be +expected based on the observed years:
example_isolates %>%
filter(mo_gramstain(mo, language = NULL) == "Gram-positive") %>%
@@ -337,7 +369,8 @@
# ℹ Using column 'date' as input for `col_date`.
This seems more likely, doesn’t it?
-The model itself is also available from the object, as an attribute
:
The model itself is also available from the object, as an
+attribute
:
model <- attributes(predict_TZP)$model
@@ -366,12 +399,14 @@
diff --git a/docs/articles/resistance_predict_files/figure-html/unnamed-chunk-4-1.png b/docs/articles/resistance_predict_files/figure-html/unnamed-chunk-4-1.png
index 19d48509..fda3270b 100644
Binary files a/docs/articles/resistance_predict_files/figure-html/unnamed-chunk-4-1.png and b/docs/articles/resistance_predict_files/figure-html/unnamed-chunk-4-1.png differ
diff --git a/docs/articles/resistance_predict_files/figure-html/unnamed-chunk-5-1.png b/docs/articles/resistance_predict_files/figure-html/unnamed-chunk-5-1.png
index e61ce2c0..f13b7a97 100644
Binary files a/docs/articles/resistance_predict_files/figure-html/unnamed-chunk-5-1.png and b/docs/articles/resistance_predict_files/figure-html/unnamed-chunk-5-1.png differ
diff --git a/docs/articles/resistance_predict_files/figure-html/unnamed-chunk-5-2.png b/docs/articles/resistance_predict_files/figure-html/unnamed-chunk-5-2.png
index 46a24c42..9097b80c 100644
Binary files a/docs/articles/resistance_predict_files/figure-html/unnamed-chunk-5-2.png and b/docs/articles/resistance_predict_files/figure-html/unnamed-chunk-5-2.png differ
diff --git a/docs/articles/resistance_predict_files/figure-html/unnamed-chunk-6-1.png b/docs/articles/resistance_predict_files/figure-html/unnamed-chunk-6-1.png
index fd9ead20..b88c19ad 100644
Binary files a/docs/articles/resistance_predict_files/figure-html/unnamed-chunk-6-1.png and b/docs/articles/resistance_predict_files/figure-html/unnamed-chunk-6-1.png differ
diff --git a/docs/articles/resistance_predict_files/figure-html/unnamed-chunk-7-1.png b/docs/articles/resistance_predict_files/figure-html/unnamed-chunk-7-1.png
index 29df232e..3477a162 100644
Binary files a/docs/articles/resistance_predict_files/figure-html/unnamed-chunk-7-1.png and b/docs/articles/resistance_predict_files/figure-html/unnamed-chunk-7-1.png differ
diff --git a/docs/articles/welcome_to_AMR.html b/docs/articles/welcome_to_AMR.html
index 5539d3ba..9a1ac845 100644
--- a/docs/articles/welcome_to_AMR.html
+++ b/docs/articles/welcome_to_AMR.html
@@ -44,7 +44,7 @@
Note: to keep the package size as small as possible, we only included this vignette on CRAN. You can read more vignettes on our website about how to conduct AMR data analysis, determine MDRO’s, find explanation of EUCAST rules, and much more: https://msberends.github.io/AMR/articles/.
+Note: to keep the package size as small as possible, we only included +this vignette on CRAN. You can read more vignettes on our website about +how to conduct AMR data analysis, determine MDRO’s, find explanation of +EUCAST rules, and much more: https://msberends.github.io/AMR/articles/.
AMR
is a free, open-source and independent R package (see Copyright) to simplify the analysis and prediction of Antimicrobial Resistance (AMR) and to work with microbial and antimicrobial data and properties, by using evidence-based methods. Our aim is to provide a standard for clean and reproducible antimicrobial resistance data analysis, that can therefore empower epidemiological analyses to continuously enable surveillance and treatment evaluation in any setting.
After installing this package, R knows ~71,000 distinct microbial species and all ~570 antibiotic, antimycotic and antiviral drugs by name and code (including ATC, EARS-Net, PubChem, LOINC and SNOMED CT), and knows all about valid R/SI and MIC values. It supports any data format, including WHONET/EARS-Net data.
-The AMR
package is available in Danish, Dutch, English, French, German, Italian, Portuguese, Russian, Spanish and Swedish. Antimicrobial drug (group) names and colloquial microorganism names are provided in these languages.
This package is fully independent of any other R package and works on Windows, macOS and Linux with all versions of R since R-3.0 (April 2013). It was designed to work in any setting, including those with very limited resources. Since its first public release in early 2018, this package has been downloaded from more than 175 countries.
+AMR
is a free, open-source and independent R package
+(see Copyright)
+to simplify the analysis and prediction of Antimicrobial Resistance
+(AMR) and to work with microbial and antimicrobial data and properties,
+by using evidence-based methods. Our aim is to provide a
+standard for clean and reproducible antimicrobial resistance
+data analysis, that can therefore empower epidemiological analyses to
+continuously enable surveillance and treatment evaluation in any
+setting.
After installing this package, R knows ~71,000 distinct microbial +species and all ~570 antibiotic, antimycotic and antiviral drugs by name +and code (including ATC, EARS-Net, PubChem, LOINC and SNOMED CT), and +knows all about valid R/SI and MIC values. It supports any data format, +including WHONET/EARS-Net data.
+The AMR
package is available in Danish, Dutch, English,
+French, German, Italian, Portuguese, Russian, Spanish and Swedish.
+Antimicrobial drug (group) names and colloquial microorganism names are
+provided in these languages.
This package is fully independent of any other R package and works on +Windows, macOS and Linux with all versions of R since R-3.0 (April +2013). It was designed to work in any setting, including those +with very limited resources. Since its first public release in +early 2018, this package has been downloaded from more than 175 +countries.
This package can be used for:
All reference data sets (about microorganisms, antibiotics, R/SI interpretation, EUCAST rules, etc.) in this AMR
package are publicly and freely available. We continually export our data sets to formats for use in R, SPSS, SAS, Stata and Excel. We also supply flat files that are machine-readable and suitable for input in any software program, such as laboratory information systems. Please find all download links on our website, which is automatically updated with every code change.
This R package was created for both routine data analysis and academic research at the Faculty of Medical Sciences of the University of Groningen, in collaboration with non-profit organisations Certe Medical Diagnostics and Advice Foundation and University Medical Center Groningen. This R package formed the basis of two PhD theses (DOI 10.33612/diss.177417131 and DOI 10.33612/diss.192486375) but is actively and durably maintained (see changelog)) by two public healthcare organisations in the Netherlands.
+All reference data sets (about microorganisms, antibiotics, R/SI
+interpretation, EUCAST rules, etc.) in this AMR
package are
+publicly and freely available. We continually export our data sets to
+formats for use in R, SPSS, SAS, Stata and Excel. We also supply flat
+files that are machine-readable and suitable for input in any software
+program, such as laboratory information systems. Please find all
+download links on our website, which is automatically updated with
+every code change.
This R package was created for both routine data analysis and +academic research at the Faculty of Medical Sciences of the University of Groningen, in collaboration +with non-profit organisations Certe +Medical Diagnostics and Advice Foundation and University Medical Center Groningen. This +R package formed the basis of two PhD theses (DOI +10.33612/diss.177417131 and DOI +10.33612/diss.192486375) but is actively and durably maintained (see +changelog)) +by two public healthcare organisations in the Netherlands.
AMR
1.8.0.9004All functions in this package are considered to be stable. Updates to the AMR interpretation rules (such as by EUCAST and CLSI), the microbial taxonomy, and the antibiotic dosages will all be updated every 6 to 12 months.
+AMR
1.8.1All functions in this package are considered to be stable. Updates to +the AMR interpretation rules (such as by EUCAST and CLSI), the microbial +taxonomy, and the antibiotic dosages will all be updated every 6 to 12 +months.
Support for antibiotic interpretations of the MIPS laboratory system: "U"
for S (‘susceptible urine’), "D"
for I (‘susceptible dose-dependent’)
Fix for using as.rsi()
on values containing capped
+values (such as >=
), sometimes leading to
+NA
Support for antibiotic interpretations of the MIPS laboratory
+system: "U"
for S (‘susceptible urine’), "D"
+for I (‘susceptible dose-dependent’)
Improved algorithm of as.mo()
, especially for ignoring non-taxonomic text, such as:
Improved algorithm of as.mo()
, especially for
+ignoring non-taxonomic text, such as:
mo_name("methicillin-resistant S. aureus (MRSA)")
@@ -177,113 +184,220 @@
Updated MIC printing in tibbles
AMR
1.8.02022-01-07p_symbol()
and all filter_*()
functions (except for filter_first_isolate()
), which were all deprecated in a previous package versionkey_antibiotics()
and key_antibiotics_equal()
functions, which were deprecated and superseded by key_antimicrobials()
and antimicrobials_equal()
+p_symbol()
and all filter_*()
+functions (except for filter_first_isolate()
), which were
+all deprecated in a previous package versionkey_antibiotics()
and
+key_antibiotics_equal()
functions, which were deprecated
+and superseded by key_antimicrobials()
and
+antimicrobials_equal()
ggplot2::ggplot()
generics for classes <mic>
, <disk>
, <rsi>
and <resistance_predict>
as they did not follow the ggplot2
logic. They were replaced with ggplot2::autoplot()
generics.get_locale()
to get_AMR_locale()
to prevent conflicts with other packagesggplot2::ggplot()
+generics for classes <mic>
,
+<disk>
, <rsi>
and
+<resistance_predict>
as they did not follow the
+ggplot2
logic. They were replaced with
+ggplot2::autoplot()
generics.get_locale()
to
+get_AMR_locale()
to prevent conflicts with other
+packagesSupport for the CLSI 2021 guideline for interpreting MIC/disk diffusion values, which are incorporated in the rsi_translation
data set. This data set now more strictly follows the WHONET software as well.
Support for EUCAST Intrinsic Resistance and Unusual Phenotypes v3.3 (October 2021). This is now the default EUCAST guideline in the package (all older guidelines are still available) for eucast_rules()
, mo_is_intrinsic_resistant()
and mdro()
. The intrinsic_resistant
data set was also updated accordingly.
Support for all antimicrobial drug (group) names and colloquial microorganism names in Danish, Dutch, English, French, German, Italian, Portuguese, Russian, Spanish and Swedish
Support for the CLSI 2021 guideline for interpreting MIC/disk
+diffusion values, which are incorporated in the
+rsi_translation
data set. This data set now more strictly
+follows the WHONET software as well.
Support for EUCAST Intrinsic Resistance and Unusual Phenotypes
+v3.3 (October 2021). This is now the default EUCAST guideline in the
+package (all older guidelines are still available) for
+eucast_rules()
, mo_is_intrinsic_resistant()
+and mdro()
. The intrinsic_resistant
data set
+was also updated accordingly.
Support for all antimicrobial drug (group) names and colloquial +microorganism names in Danish, Dutch, English, French, German, Italian, +Portuguese, Russian, Spanish and Swedish
Function set_ab_names()
to rename data set columns that resemble antimicrobial drugs. This allows for quickly renaming columns to official names, ATC codes, etc. Its second argument can be a tidyverse way of selecting:
Function set_ab_names()
to rename data set columns
+that resemble antimicrobial drugs. This allows for quickly renaming
+columns to official names, ATC codes, etc. Its second argument can be a
+tidyverse way of selecting:
example_isolates %>% set_ab_names(where(is.rsi))
example_isolates %>% set_ab_names(AMC:GEN, property = "atc")
Function ab_ddd_units()
to get units of DDDs (daily defined doses), deprecating the use of ab_ddd(..., units = TRUE)
to be more consistent in data types of function output
Function ab_ddd_units()
to get units of DDDs (daily
+defined doses), deprecating the use of
+ab_ddd(..., units = TRUE)
to be more consistent in data
+types of function output
antibiotics
data set now contains all ATC codes that are available through the WHOCC website, regardless of drugs being present in more than one ATC group. This means that:
-antibiotics
data set now contains all ATC
+codes that are available through the WHOCC website, regardless of drugs being
+present in more than one ATC group. This means that:
+antibiotics$atc
is now a list
containing character
vectors, and this atc
column was moved to the 5th position of the antibiotics
data setantibiotics$atc
is now a list
containing
+character
vectors, and this atc
column was
+moved to the 5th position of the antibiotics
data setab_atc()
does not always return a character vector of length 1, and returns a list
if the input is larger than length 1ab_atc()
does not always return a character vector of
+length 1, and returns a list
if the input is larger than
+length 1ab_info()
has a slightly different outputThey now also work in R-3.0 and R-3.1, supporting every version of R since 2013 like the rest of the package
Added more selectors for antibiotic classes: aminopenicillins()
, antifungals()
, antimycobacterials()
, lincosamides()
, lipoglycopeptides()
, polymyxins()
, quinolones()
, streptogramins()
, trimethoprims()
and ureidopenicillins()
They now also work in R-3.0 and R-3.1, supporting every version +of R since 2013 like the rest of the package
Added more selectors for antibiotic classes:
+aminopenicillins()
, antifungals()
,
+antimycobacterials()
, lincosamides()
,
+lipoglycopeptides()
, polymyxins()
,
+quinolones()
, streptogramins()
,
+trimethoprims()
and
+ureidopenicillins()
Added specific selectors for certain types for treatment: administrable_per_os()
and administrable_iv()
, which are based on available Defined Daily Doses (DDDs), as defined by the WHOCC. These are ideal for e.g. analysing pathogens in primary care where IV treatment is not an option. They can be combined with other AB selectors, e.g. to select penicillins that are only administrable per os (i.e., orally):
Added specific selectors for certain types for treatment:
+administrable_per_os()
and administrable_iv()
,
+which are based on available Defined Daily Doses (DDDs), as defined by
+the WHOCC. These are ideal for e.g. analysing pathogens in primary care
+where IV treatment is not an option. They can be combined with other AB
+selectors, e.g. to select penicillins that are only administrable per os
+(i.e., orally):
example_isolates[, penicillins() & administrable_per_os()] # base R
example_isolates %>% select(penicillins() & administrable_per_os()) # dplyr
Added the selector ab_selector()
, which accepts a filter to be used internally on the antibiotics
data set, yielding great flexibility on drug properties, such as selecting antibiotic columns with an oral DDD of at least 1 gram:
Added the selector ab_selector()
, which accepts a
+filter to be used internally on the antibiotics
data set,
+yielding great flexibility on drug properties, such as selecting
+antibiotic columns with an oral DDD of at least 1 gram:
example_isolates[, ab_selector(oral_ddd > 1 & oral_units == "g")] # base R
example_isolates %>% select(ab_selector(oral_ddd > 1 & oral_units == "g")) # dplyr
Added the selector not_intrinsic_resistant()
, which only keeps antibiotic columns that are not intrinsic resistant for all microorganisms in a data set, based on the latest EUCAST guideline on intrinsic resistance. For example, if a data set contains only microorganism codes or names of E. coli and K. pneumoniae and contains a column “vancomycin”, this column will be removed (or rather, unselected) using this function.
Added argument only_treatable
, which defaults to TRUE
and will exclude drugs that are only for laboratory tests and not for treating patients (such as imipenem/EDTA and gentamicin-high)
Fix for using selectors multiple times in one call (e.g., using them in dplyr::filter()
and immediately after in dplyr::select()
)
Fix for using having multiple columns that are coerced to the same antibiotic agent
Fixed for using all()
or any()
on antibiotic selectors in an R Markdown file
Added the selector not_intrinsic_resistant()
, which
+only keeps antibiotic columns that are not intrinsic resistant for all
+microorganisms in a data set, based on the latest EUCAST guideline on
+intrinsic resistance. For example, if a data set contains only
+microorganism codes or names of E. coli and K.
+pneumoniae and contains a column “vancomycin”, this column will be
+removed (or rather, unselected) using this function.
Added argument only_treatable
, which defaults to
+TRUE
and will exclude drugs that are only for laboratory
+tests and not for treating patients (such as imipenem/EDTA and
+gentamicin-high)
Fix for using selectors multiple times in one call (e.g., using
+them in dplyr::filter()
and immediately after in
+dplyr::select()
)
Fix for using having multiple columns that are coerced to the +same antibiotic agent
Fixed for using all()
or any()
on
+antibiotic selectors in an R Markdown file
mo_gramstain()
) determination of the taxonomic class Negativicutes within the phylum of Firmicutes - they were considered Gram-positives because of their phylum but are actually Gram-negative. This impacts 137 taxonomic species, genera and families, such as Negativicoccus and Veillonella.mo_gramstain()
) determination of
+the taxonomic class Negativicutes within the phylum of Firmicutes - they
+were considered Gram-positives because of their phylum but are actually
+Gram-negative. This impacts 137 taxonomic species, genera and families,
+such as Negativicoccus and Veillonella.first_isolate()
NA
s for old MO codes when running as.mo()
on themproportion_*()
and count_*()
functions failas.mo()
+NA
s for old MO codes when
+running as.mo()
on themproportion_*()
and count_*()
functions
+failas.mo()
col_*
arguments are left blank, e.g. in first_isolate()
+col_*
arguments
+are left blank, e.g. in first_isolate()
random_mic()
, random_disk()
and random_rsi()
are now enforcedrandom_mic()
,
+random_disk()
and random_rsi()
are now
+enforcedas.rsi()
has an improved algorithm and can now also correct for textual input (such as “Susceptible”, “Resistant”) in all supported languagesas.rsi()
has an improved algorithm and can now also
+correct for textual input (such as “Susceptible”, “Resistant”) in all
+supported languages
as.mic()
has an improved algorithmcount_*()
, proportion_*()
function (or resistant()
or susceptible()
), the dplyr
group will be shown, if availablescale_rsi_colours()
when using ggplot2
v3.3.4 or higher (this is ggplot2 bug 4511, soon to be fixed)count_*()
, proportion_*()
function (or
+resistant()
or susceptible()
), the
+dplyr
group will be shown, if availablescale_rsi_colours()
when
+using ggplot2
v3.3.4 or higher (this is ggplot2 bug 4511,
+soon to be fixed)as.mo()
random_mic()
+random_mic()
as.ab()
and all ab_*()
functionsfortify()
extensions for plotting methodsas.ab()
and all ab_*()
+functionsfortify()
extensions for plotting methodsNA
values of the classes <mic>
, <disk>
and <rsi>
are now exported objects of this package, e.g. NA_mic_
is an NA
of class mic
(just like the base R NA_character_
is an NA
of class character
)proportion_df()
, count_df()
and rsi_df()
functions now return with the additional S3 class ‘rsi_df’ so they can be extended by other packagesmdro()
function now returns NA
for all rows that have no test resultsspecies_id
column in the microorganisms
data set now only contains LPSN record numbers. For this reason, this column is now numeric instead of a character, and mo_url()
has been updated to reflect this change.get_episode()
and is_new_episode()
+NA
values of the classes <mic>
,
+<disk>
and <rsi>
are now exported
+objects of this package, e.g. NA_mic_
is an NA
+of class mic
(just like the base R
+NA_character_
is an NA
of class
+character
)proportion_df()
, count_df()
and
+rsi_df()
functions now return with the additional S3 class
+‘rsi_df’ so they can be extended by other packagesmdro()
function now returns NA
for all
+rows that have no test resultsspecies_id
column in the
+microorganisms
data set now only contains LPSN record
+numbers. For this reason, this column is now numeric instead of a
+character, and mo_url()
has been updated to reflect this
+change.get_episode()
and
+is_new_episode()
get_episode()
and is_new_episode()
can now cope with NA
sget_episode()
and is_new_episode()
can now
+cope with NA
s
All antibiotic class selectors (such as carbapenems()
, aminoglycosides()
) can now be used for filtering as well, making all their accompanying filter_*()
functions redundant (such as filter_carbapenems()
, filter_aminoglycosides()
). These functions are now deprecated and will be removed in a next release. Examples of how the selectors can be used for filtering:
All antibiotic class selectors (such as
+carbapenems()
, aminoglycosides()
) can now be
+used for filtering as well, making all their accompanying
+filter_*()
functions redundant (such as
+filter_carbapenems()
,
+filter_aminoglycosides()
). These functions are now
+deprecated and will be removed in a next release. Examples of how the
+selectors can be used for filtering:
# select columns with results for carbapenems
@@ -312,71 +433,144 @@
as.rsi()
)custom_eucast_rules()
that brings support for custom AMR rules in eucast_rules()
+as.rsi()
)custom_eucast_rules()
that brings support for
+custom AMR rules in eucast_rules()
italicise_taxonomy()
to make taxonomic names within a string italic, with support for markdown and ANSIfirst_isolate()
function gained the argument method
that has to be “phenotype-based”, “episode-based”, “patient-based”, or “isolate-based”. The old behaviour is equal to “episode-based”. The new default is “phenotype-based” if antimicrobial test results are available, and “episode-based” otherwise. This new default will yield slightly more isolates for selection (which is a good thing).key_antibiotics()
and key_antibiotics_equal()
are now deprecated in favour of the key_antimicrobials()
and antimicrobials_equal()
functions. Also, the new all_antimicrobials()
function works like the old key_antibiotics()
function, but includes any column with antimicrobial test results. Using key_antimicrobials()
still only selects six preferred antibiotics for Gram-negatives, six for Gram-positives, and six universal antibiotics. It has a new antifungal
argument to set antifungal agents (antimycotics).type == "points"
in the first_isolate()
function for phenotype-based selection will now consider all antimicrobial drugs in the data set, using the new all_antimicrobials()
+italicise_taxonomy()
to make taxonomic names
+within a string italic, with support for markdown and ANSIfirst_isolate()
function gained the argument
+method
that has to be “phenotype-based”, “episode-based”,
+“patient-based”, or “isolate-based”. The old behaviour is equal to
+“episode-based”. The new default is “phenotype-based” if antimicrobial
+test results are available, and “episode-based” otherwise. This new
+default will yield slightly more isolates for selection (which is a good
+thing).key_antibiotics()
and key_antibiotics_equal()
+are now deprecated in favour of the key_antimicrobials()
+and antimicrobials_equal()
functions. Also, the new
+all_antimicrobials()
function works like the old
+key_antibiotics()
function, but includes any column with
+antimicrobial test results. Using key_antimicrobials()
+still only selects six preferred antibiotics for Gram-negatives, six for
+Gram-positives, and six universal antibiotics. It has a new
+antifungal
argument to set antifungal agents
+(antimycotics).type == "points"
in the
+first_isolate()
function for phenotype-based selection will
+now consider all antimicrobial drugs in the data set, using the new
+all_antimicrobials()
first_isolate()
function can now take a vector of values for col_keyantibiotics
and can have an episode length of Inf
+first_isolate()
function can now take a vector of
+values for col_keyantibiotics
and can have an episode
+length of Inf
filter_first_isolate()
renders the filter_first_weighted_isolate()
function redundant. For this reason, filter_first_weighted_isolate()
is now deprecated.first_isolate()
and key_antimicrobials()
functions has been completely rewritten.filter_first_isolate()
renders the
+filter_first_weighted_isolate()
function redundant. For
+this reason, filter_first_weighted_isolate()
is now
+deprecated.first_isolate()
and
+key_antimicrobials()
functions has been completely
+rewritten.betalactams()
as additional antbiotic column selector and function filter_betalactams()
as additional antbiotic column filter. The group of betalactams consists of all carbapenems, cephalosporins and penicillins.ggplot()
method for resistance_predict()
+betalactams()
as additional antbiotic column
+selector and function filter_betalactams()
as additional
+antbiotic column filter. The group of betalactams consists of all
+carbapenems, cephalosporins and penicillins.ggplot()
method for
+resistance_predict()
bug_drug_combinations()
now supports grouping using the dplyr
packagemdro()
, custom_mdro_guideline()
):
-c()
+bug_drug_combinations()
now supports grouping using the
+dplyr
packagemdro()
,
+custom_mdro_guideline()
):
+c()
age_groups()
for persons aged zeroexample_isolates
data set now contains some (fictitious) zero-year old patientsexample_isolates
data set now contains some
+(fictitious) zero-year old patientsdata.frame
or tibble
now gives a warning if the data contains old microbial codes (from a previous AMR package version)data.frame
or
+tibble
now gives a warning if the data contains old
+microbial codes (from a previous AMR package version)like()
functions:
-Now checks if pattern
is a valid regular expression
Now checks if pattern
is a valid regular
+expression
Added %unlike%
and %unlike_case%
(as negations of the existing %like%
and %like_case%
). This greatly improves readability:
Added %unlike%
and %unlike_case%
(as
+negations of the existing %like%
and
+%like_case%
). This greatly improves readability:
Altered the RStudio addin, so it now iterates over %like%
-> %unlike%
-> %like_case%
-> %unlike_case%
if you keep pressing your keyboard shortcut
Altered the RStudio addin, so it now iterates over
+%like%
-> %unlike%
->
+%like_case%
-> %unlike_case%
if you keep
+pressing your keyboard shortcut
info
argument to as.mo()
to turn on/off the progress barcol_mo
in some functions (esp. eucast_rules()
and mdro()
) could not be a column name of the microorganisms
data set as it would throw an erroras.rsi()
) when the vctrs
package is loaded (i.e., when using tidyverse)info
argument to as.mo()
to turn
+on/off the progress barcol_mo
in some functions
+(esp. eucast_rules()
and mdro()
) could not be
+a column name of the microorganisms
data set as it would
+throw an erroras.rsi()
)
+when the vctrs
package is loaded (i.e., when using
+tidyverse)barplot()
on an RSI classmicroorganisms.codes
data setantibiotics
data setskimr::skim()
on classes mo
, mic
and disk
when using the just released dplyr
v1.0.6skimr::skim()
usage for MIC values to also include 25th and 75th percentilesmicroorganisms.codes
data setantibiotics
data setskimr::skim()
on classes mo
,
+mic
and disk
when using the just released
+dplyr
v1.0.6skimr::skim()
usage for MIC values to also
+include 25th and 75th percentilesdplyr
join functions if the dplyr
package is installed - now also preserving grouped variablescephalosporins()
) now maintain the column order from the original datadplyr
join
+functions if the dplyr
package is installed - now also
+preserving grouped variablescephalosporins()
)
+now maintain the column order from the original datafluoroquinolones()
age()
now vectorises over both x
and reference
+age()
now vectorises over both x
and
+reference
tinytest
package, instead of the testthat
package. The testthat
package unfortunately requires tons of dependencies that are also heavy and only usable for recent R versions, disallowing developers to test a package under any R 3.* version. On the contrary, the tinytest
package is very lightweight and dependency-free.tinytest
+package, instead of the testthat
package. The
+testthat
package unfortunately requires tons of
+dependencies that are also heavy and only usable for recent R versions,
+disallowing developers to test a package under any R 3.* version. On the
+contrary, the tinytest
package is very lightweight and
+dependency-free.Support for EUCAST Clinical Breakpoints v11.0 (2021), effective in the eucast_rules()
function and in as.rsi()
to interpret MIC and disk diffusion values. This is now the default guideline in this package.
eucast_dosage()
to get a data.frame
with advised dosages of a certain bug-drug combination, which is based on the new dosage
data setdosage
to fuel the new eucast_dosage()
function and to make this data available in a structured wayexample_isolates
now reflects the latest EUCAST rulesSupport for EUCAST Clinical Breakpoints v11.0 (2021), effective
+in the eucast_rules()
function and in as.rsi()
+to interpret MIC and disk diffusion values. This is now the default
+guideline in this package.
eucast_dosage()
to get a
+data.frame
with advised dosages of a certain bug-drug
+combination, which is based on the new dosage
data setdosage
to fuel the new
+eucast_dosage()
function and to make this data available in
+a structured wayexample_isolates
now reflects the
+latest EUCAST rulesAdded argument only_rsi_columns
for some functions, which defaults to FALSE
, to indicate if the functions must only be applied to columns that are of class <rsi>
(i.e., transformed with as.rsi()
). This increases speed since automatic determination of antibiotic columns is not needed anymore. Affected functions are:
ab_class()
and its wrappers, such as aminoglycosides()
, carbapenems()
, penicillins()
)filter_ab_class()
and its wrappers, such as filter_aminoglycosides()
, filter_carbapenems()
, filter_penicillins()
)Added argument only_rsi_columns
for some functions,
+which defaults to FALSE
, to indicate if the functions must
+only be applied to columns that are of class <rsi>
+(i.e., transformed with as.rsi()
). This increases speed
+since automatic determination of antibiotic columns is not needed
+anymore. Affected functions are:
ab_class()
and its
+wrappers, such as aminoglycosides()
,
+carbapenems()
, penicillins()
)filter_ab_class()
and
+its wrappers, such as filter_aminoglycosides()
,
+filter_carbapenems()
,
+filter_penicillins()
)eucast_rules()
mdro()
(including wrappers such as brmo()
, mrgn()
and eucast_exceptional_phenotypes()
)mdro()
(including wrappers such as brmo()
,
+mrgn()
and
+eucast_exceptional_phenotypes()
)guess_ab_col()
Functions oxazolidinones()
(an antibiotic selector function) and filter_oxazolidinones()
(an antibiotic filter function) to select/filter on e.g. linezolid and tedizolid
Functions oxazolidinones()
(an antibiotic selector
+function) and filter_oxazolidinones()
(an antibiotic filter
+function) to select/filter on e.g. linezolid and tedizolid
Support for custom MDRO guidelines, using the new custom_mdro_guideline()
function, please see mdro()
for additional info
ggplot()
generics for classes <mic>
and <disk>
Support for custom MDRO guidelines, using the new
+custom_mdro_guideline()
function, please see
+mdro()
for additional info
ggplot()
generics for classes
+<mic>
and <disk>
Function mo_is_yeast()
, which determines whether a microorganism is a member of the taxonomic class Saccharomycetes or the taxonomic order Saccharomycetales:
Function mo_is_yeast()
, which determines whether a
+microorganism is a member of the taxonomic class Saccharomycetes or the
+taxonomic order Saccharomycetales:
mo_kingdom(c("Aspergillus", "Candida"))
@@ -424,7 +645,8 @@
# usage for filtering data:
example_isolates[which(mo_is_yeast()), ] # base R
example_isolates %>% filter(mo_is_yeast()) # dplyr
The mo_type()
function has also been updated to reflect this change:
The mo_type()
function has also been updated to reflect
+this change:
Added Pretomanid (PMD, J04AK08) to the antibiotics
data set
Added Pretomanid (PMD, J04AK08) to the antibiotics
+data set
MIC values (see as.mic()
) can now be used in any mathematical processing, such as usage inside functions min()
, max()
, range()
, and with binary operators (+
, -
, etc.). This allows for easy distribution analysis and fast filtering on MIC values:
MIC values (see as.mic()
) can now be used in any
+mathematical processing, such as usage inside functions
+min()
, max()
, range()
, and with
+binary operators (+
, -
, etc.). This allows for
+easy distribution analysis and fast filtering on MIC values:
x <- random_mic(10)
@@ -453,49 +680,107 @@
Changed
- Updated the bacterial taxonomy to 3 March 2021 (using LPSN)
-
- Added 3,372 new species and 1,523 existing species became synomyms
-- The URL of a bacterial species (
mo_url()
) will now lead to https://lpsn.dsmz.de
+- Added 3,372 new species and 1,523 existing species became
+synomyms
+- The URL of a bacterial species (
mo_url()
) will now lead
+to https://lpsn.dsmz.de
-- Big update for plotting classes
rsi
, <mic>
, and <disk>
:
-- Plotting of MIC and disk diffusion values now support interpretation colouring if you supply the microorganism and antimicrobial agent
-- All colours were updated to colour-blind friendly versions for values R, S and I for all plot methods (also applies to tibble printing)
-- Interpretation of MIC and disk diffusion values to R/SI will now be translated if the system language is German, Dutch or Spanish (see
translate
)
-- Plotting is now possible with base R using
plot()
and with ggplot2 using ggplot()
on any vector of MIC and disk diffusion values
+- Big update for plotting classes
rsi
,
+<mic>
, and <disk>
:
+- Plotting of MIC and disk diffusion values now support interpretation
+colouring if you supply the microorganism and antimicrobial agent
+- All colours were updated to colour-blind friendly versions for
+values R, S and I for all plot methods (also applies to tibble
+printing)
+- Interpretation of MIC and disk diffusion values to R/SI will now be
+translated if the system language is German, Dutch or Spanish (see
+
translate
)
+- Plotting is now possible with base R using
plot()
and
+with ggplot2 using ggplot()
on any vector of MIC and disk
+diffusion values
-- Updated SNOMED codes to US Edition of SNOMED CT from 1 September 2020 and added the source to the help page of the
microorganisms
data set
+- Updated SNOMED codes to US Edition of SNOMED CT from 1 September
+2020 and added the source to the help page of the
+
microorganisms
data set
-
-
is.rsi()
and is.rsi.eligible()
now return a vector of TRUE
/FALSE
when the input is a data set, by iterating over all columns
-- Using functions without setting a data set (e.g.,
mo_is_gram_negative()
, mo_is_gram_positive()
, mo_is_intrinsic_resistant()
, first_isolate()
, mdro()
) now work with dplyr
s group_by()
again
+is.rsi()
and is.rsi.eligible()
now return
+a vector of TRUE
/FALSE
when the input is a
+data set, by iterating over all columns
+- Using functions without setting a data set (e.g.,
+
mo_is_gram_negative()
, mo_is_gram_positive()
,
+mo_is_intrinsic_resistant()
, first_isolate()
,
+mdro()
) now work with dplyr
s
+group_by()
again
-
-
first_isolate()
can be used with group_by()
(also when using a dot .
as input for the data) and now returns the names of the groups
-- Updated the data set
microorganisms.codes
(which contains popular LIS and WHONET codes for microorganisms) for some species of Mycobacterium that previously incorrectly returned M. africanum
+first_isolate()
can be used with
+group_by()
(also when using a dot .
as input
+for the data) and now returns the names of the groups
+- Updated the data set
microorganisms.codes
(which
+contains popular LIS and WHONET codes for microorganisms) for some
+species of Mycobacterium that previously incorrectly returned
+M. africanum
-- WHONET code
"PNV"
will now correctly be interpreted as PHN
, the antibiotic code for phenoxymethylpenicillin (‘peni V’)
-- Fix for verbose output of
mdro(..., verbose = TRUE)
for German guideline (3MGRN and 4MGRN) and Dutch guideline (BRMO, only P. aeruginosa)
+- WHONET code
"PNV"
will now correctly be interpreted as
+PHN
, the antibiotic code for phenoxymethylpenicillin (‘peni
+V’)
+- Fix for verbose output of
mdro(..., verbose = TRUE)
for
+German guideline (3MGRN and 4MGRN) and Dutch guideline (BRMO, only
+P. aeruginosa)
-
-
is.rsi.eligible()
now detects if the column name resembles an antibiotic name or code and now returns TRUE
immediately if the input contains any of the values “R”, “S” or “I”. This drastically improves speed, also for a lot of other functions that rely on automatic determination of antibiotic columns.
-- Functions
get_episode()
and is_new_episode()
now support less than a day as value for argument episode_days
(e.g., to include one patient/test per hour)
-- Argument
ampc_cephalosporin_resistance
in eucast_rules()
now also applies to value “I” (not only “S”)
-- Functions
print()
and summary()
on a Principal Components Analysis object (pca()
) now print additional group info if the original data was grouped using dplyr::group_by()
+is.rsi.eligible()
now detects if the column name
+resembles an antibiotic name or code and now returns TRUE
+immediately if the input contains any of the values “R”, “S” or “I”.
+This drastically improves speed, also for a lot of other functions that
+rely on automatic determination of antibiotic columns.
+- Functions
get_episode()
and
+is_new_episode()
now support less than a day as value for
+argument episode_days
(e.g., to include one patient/test
+per hour)
+- Argument
ampc_cephalosporin_resistance
in
+eucast_rules()
now also applies to value “I” (not only
+“S”)
+- Functions
print()
and summary()
on a
+Principal Components Analysis object (pca()
) now print
+additional group info if the original data was grouped using
+dplyr::group_by()
-- Improved speed and reliability of
guess_ab_col()
. As this also internally improves the reliability of first_isolate()
and mdro()
, this might have a slight impact on the results of those functions.
-- Fix for
mo_name()
when used in other languages than English
-- The
like()
function (and its fast alias %like%
) now always use Perl compatibility, improving speed for many functions in this package (e.g., as.mo()
is now up to 4 times faster)
+- Improved speed and reliability of
guess_ab_col()
. As
+this also internally improves the reliability of
+first_isolate()
and mdro()
, this might have a
+slight impact on the results of those functions.
+- Fix for
mo_name()
when used in other languages than
+English
+- The
like()
function (and its fast alias
+%like%
) now always use Perl compatibility, improving speed
+for many functions in this package (e.g., as.mo()
is now up
+to 4 times faster)
-
-Staphylococcus cornubiensis is now correctly categorised as coagulase-positive
+Staphylococcus cornubiensis is now correctly categorised as
+coagulase-positive
-
-
random_disk()
and random_mic()
now have an expanded range in their randomisation
-- Support for GISA (glycopeptide-intermediate S. aureus), so e.g.
mo_genus("GISA")
will return "Staphylococcus"
+random_disk()
and random_mic()
now have an
+expanded range in their randomisation
+- Support for GISA (glycopeptide-intermediate S. aureus), so
+e.g.
mo_genus("GISA")
will return
+"Staphylococcus"
-- Added translations of German and Spanish for more than 200 antimicrobial drugs
-- Speed improvement for
as.ab()
when the input is an official name or ATC code
-- Added argument
include_untested_rsi
to the first_isolate()
functions (defaults to TRUE
to keep existing behaviour), to be able to exclude rows where all R/SI values (class <rsi>
, see as.rsi()
) are empty
+- Added translations of German and Spanish for more than 200
+antimicrobial drugs
+- Speed improvement for
as.ab()
when the input is an
+official name or ATC code
+- Added argument
include_untested_rsi
to the
+first_isolate()
functions (defaults to TRUE
to
+keep existing behaviour), to be able to exclude rows where all R/SI
+values (class <rsi>
, see as.rsi()
) are
+empty
Other
- Big documentation updates
-- Loading the package (i.e.,
library(AMR)
) now is ~50 times faster than before, in costs of package size (which increased by ~3 MB)
+- Loading the package (i.e.,
library(AMR)
) now is ~50
+times faster than before, in costs of package size (which increased by
+~3 MB)
Functions get_episode()
and is_new_episode()
to determine (patient) episodes which are not necessarily based on microorganisms. The get_episode()
function returns the index number of the episode per group, while the is_new_episode()
function returns values TRUE
/FALSE
to indicate whether an item in a vector is the start of a new episode. They also support dplyr
s grouping (i.e. using group_by()
):
Functions get_episode()
and
+is_new_episode()
to determine (patient) episodes which are
+not necessarily based on microorganisms. The get_episode()
+function returns the index number of the episode per group, while the
+is_new_episode()
function returns values
+TRUE
/FALSE
to indicate whether an item in a
+vector is the start of a new episode. They also support
+dplyr
s grouping (i.e. using group_by()
):
Functions mo_is_gram_negative()
and mo_is_gram_positive()
as wrappers around mo_gramstain()
. They always return TRUE
or FALSE
(except when the input is NA
or the MO code is UNKNOWN
), thus always return FALSE
for species outside the taxonomic kingdom of Bacteria.
Function mo_is_intrinsic_resistant()
to test for intrinsic resistance, based on EUCAST Intrinsic Resistance and Unusual Phenotypes v3.2 from 2020.
Functions random_mic()
, random_disk()
and random_rsi()
for random value generation. The functions random_mic()
and random_disk()
take microorganism names and antibiotic names as input to make generation more realistic.
Functions mo_is_gram_negative()
and
+mo_is_gram_positive()
as wrappers around
+mo_gramstain()
. They always return TRUE
or
+FALSE
(except when the input is NA
or the MO
+code is UNKNOWN
), thus always return FALSE
for
+species outside the taxonomic kingdom of Bacteria.
Function mo_is_intrinsic_resistant()
to test for
+intrinsic resistance, based on EUCAST
+Intrinsic Resistance and Unusual Phenotypes v3.2 from 2020.
Functions random_mic()
, random_disk()
+and random_rsi()
for random value generation. The functions
+random_mic()
and random_disk()
take
+microorganism names and antibiotic names as input to make generation
+more realistic.
New argument ampc_cephalosporin_resistance
in eucast_rules()
to correct for AmpC de-repressed cephalosporin-resistant mutants
New argument ampc_cephalosporin_resistance
in
+eucast_rules()
to correct for AmpC de-repressed
+cephalosporin-resistant mutants
Interpretation of antimicrobial resistance - as.rsi()
:
as.rsi()
can now be set by the user, using the reference_data
argument. This allows for using own interpretation guidelines. The user-set data must have the same structure as rsi_translation
.as.rsi()
on a data.frameas.rsi()
on a data.frame in older R versionsInterpretation of antimicrobial resistance -
+as.rsi()
:
as.rsi()
can now be set by the
+user, using the reference_data
argument. This allows for
+using own interpretation guidelines. The user-set data must have the
+same structure as rsi_translation
.as.rsi()
on a data.frameas.rsi()
on a data.frame in older R
+versionsas.rsi()
on a data.frame will not print a message anymore if the values are already clean R/SI valuesas.rsi()
on MICs or disk diffusion while there is intrinsic antimicrobial resistance, a warning will be thrown to remind about thisas.rsi()
on a data.frame
that only contains one column for antibiotic interpretationsas.rsi()
on a data.frame will not print a message
+anymore if the values are already clean R/SI valuesas.rsi()
on MICs or disk diffusion while there
+is intrinsic antimicrobial resistance, a warning will be thrown to
+remind about thisas.rsi()
on a data.frame
+that only contains one column for antibiotic interpretationsSome functions are now context-aware when used inside dplyr
verbs, such as filter()
, mutate()
and summarise()
. This means that then the data argument does not need to be set anymore. This is the case for the new functions:
Some functions are now context-aware when used inside
+dplyr
verbs, such as filter()
,
+mutate()
and summarise()
. This means that then
+the data argument does not need to be set anymore. This is the case for
+the new functions:
mo_is_gram_negative()
mo_is_gram_positive()
mo_is_intrinsic_resistant()
For antibiotic selection functions (such as cephalosporins()
, aminoglycosides()
) to select columns based on a certain antibiotic group, the dependency on the tidyselect
package was removed, meaning that they can now also be used without the need to have this package installed and now also work in base R function calls (they rely on R 3.2 or later):
For antibiotic selection functions (such as
+cephalosporins()
, aminoglycosides()
) to select
+columns based on a certain antibiotic group, the dependency on the
+tidyselect
package was removed, meaning that they can now
+also be used without the need to have this package installed and now
+also work in base R function calls (they rely on R 3.2 or later):
# above example in base R:
example_isolates[which(first_isolate() & mo_is_gram_negative()),
c("mo", cephalosporins(), aminoglycosides())]
For all function arguments in the code, it is now defined what the exact type of user input should be (inspired by the typed
package). If the user input for a certain function does not meet the requirements for a specific argument (such as the class or length), an informative error will be thrown. This makes the package more robust and the use of it more reproducible and reliable. In total, more than 420 arguments were defined.
Fix for set_mo_source()
, that previously would not remember the file location of the original file
Deprecated function p_symbol()
that not really fits the scope of this package. It will be removed in a future version. See here for the source code to preserve it.
Updated coagulase-negative staphylococci determination with Becker et al. 2020 (PMID 32056452), meaning that the species S. argensis, S. caeli, S. debuckii, S. edaphicus and S. pseudoxylosus are now all considered CoNS
Fix for using argument reference_df
in as.mo()
and mo_*()
functions that contain old microbial codes (from previous package versions)
Fixed a bug where mo_uncertainties()
would not return the results based on the MO matching score
Fixed a bug where as.mo()
would not return results for known laboratory codes for microorganisms
Fixed a bug where as.ab()
would sometimes fail
For all function arguments in the code, it is now defined what
+the exact type of user input should be (inspired by the typed
+package). If the user input for a certain function does not meet the
+requirements for a specific argument (such as the class or length), an
+informative error will be thrown. This makes the package more robust and
+the use of it more reproducible and reliable. In total, more than 420
+arguments were defined.
Fix for set_mo_source()
, that previously would not
+remember the file location of the original file
Deprecated function p_symbol()
that not really fits
+the scope of this package. It will be removed in a future version. See
+here
+for the source code to preserve it.
Updated coagulase-negative staphylococci determination with +Becker et al. 2020 (PMID 32056452), meaning that the species +S. argensis, S. caeli, S. debuckii, S. +edaphicus and S. pseudoxylosus are now all considered +CoNS
Fix for using argument reference_df
in
+as.mo()
and mo_*()
functions that contain old
+microbial codes (from previous package versions)
Fixed a bug where mo_uncertainties()
would not
+return the results based on the MO matching score
Fixed a bug where as.mo()
would not return results
+for known laboratory codes for microorganisms
Fixed a bug where as.ab()
would sometimes
+fail
Better tibble printing for MIC values
Fix for plotting MIC values with plot()
Added plot()
generic to class <disk>
LA-MRSA and CA-MRSA are now recognised as an abbreviation for Staphylococcus aureus, meaning that e.g. mo_genus("LA-MRSA")
will return "Staphylococcus"
and mo_is_gram_positive("LA-MRSA")
will return TRUE
.
Fix for printing class NA
Fix for mo_shortname()
when the input contains NA
If as.mo()
takes more than 30 seconds, some suggestions will be done to improve speed
Added plot()
generic to class
+<disk>
LA-MRSA and CA-MRSA are now recognised as an abbreviation for
+Staphylococcus aureus, meaning that
+e.g. mo_genus("LA-MRSA")
will return
+"Staphylococcus"
and
+mo_is_gram_positive("LA-MRSA")
will return
+TRUE
.
Fix for printing class NA
Fix for mo_shortname()
when the input contains
+NA
If as.mo()
takes more than 30 seconds, some
+suggestions will be done to improve speed
options()
were all removed in favour of a new internal environment pkg_env
+options()
were all removed in favour
+of a new internal environment pkg_env
sapply()
calls with vapply()
)sapply()
calls with vapply()
)Support for ‘EUCAST Expert Rules’ / ‘EUCAST Intrinsic Resistance and Unusual Phenotypes’ version 3.2 of May 2020. With this addition to the previously implemented version 3.1 of 2016, the eucast_rules()
function can now correct for more than 180 different antibiotics and the mdro()
function can determine multidrug resistance based on more than 150 different antibiotics. All previously implemented versions of the EUCAST rules are now maintained and kept available in this package. The eucast_rules()
function consequently gained the arguments version_breakpoints
(at the moment defaults to v10.0, 2020) and version_expertrules
(at the moment defaults to v3.2, 2020). The example_isolates
data set now also reflects the change from v3.1 to v3.2. The mdro()
function now accepts guideline == "EUCAST3.1"
and guideline == "EUCAST3.2"
.
A new vignette and website page with info about all our public and freely available data sets, that can be downloaded as flat files or in formats for use in R, SPSS, SAS, Stata and Excel: https://msberends.github.io/AMR/articles/datasets.html
Support for ‘EUCAST Expert Rules’ / ‘EUCAST Intrinsic Resistance
+and Unusual Phenotypes’ version 3.2 of May 2020. With this addition to
+the previously implemented version 3.1 of 2016, the
+eucast_rules()
function can now correct for more than 180
+different antibiotics and the mdro()
function can determine
+multidrug resistance based on more than 150 different antibiotics. All
+previously implemented versions of the EUCAST rules are now maintained
+and kept available in this package. The eucast_rules()
+function consequently gained the arguments
+version_breakpoints
(at the moment defaults to v10.0, 2020)
+and version_expertrules
(at the moment defaults to v3.2,
+2020). The example_isolates
data set now also reflects the
+change from v3.1 to v3.2. The mdro()
function now accepts
+guideline == "EUCAST3.1"
and
+guideline == "EUCAST3.2"
.
A new vignette and website page with info about all our public +and freely available data sets, that can be downloaded as flat files or +in formats for use in R, SPSS, SAS, Stata and Excel: https://msberends.github.io/AMR/articles/datasets.html
Data set intrinsic_resistant
. This data set contains all bug-drug combinations where the ‘bug’ is intrinsic resistant to the ‘drug’ according to the latest EUCAST insights. It contains just two columns: microorganism
and antibiotic
.
Curious about which enterococci are actually intrinsic resistant to vancomycin?
+Data set intrinsic_resistant
. This data set contains
+all bug-drug combinations where the ‘bug’ is intrinsic resistant to the
+‘drug’ according to the latest EUCAST insights. It contains just two
+columns: microorganism
and antibiotic
.
Curious about which enterococci are actually intrinsic resistant to +vancomycin?
Support for veterinary ATC codes
Support for skimming classes <rsi>
, <mic>
, <disk>
and <mo>
with the skimr
package
Support for skimming classes <rsi>
,
+<mic>
, <disk>
and
+<mo>
with the skimr
package
Although advertised that this package should work under R 3.0.0, we still had a dependency on R 3.6.0. This is fixed, meaning that our package should now work under R 3.0.0.
Although advertised that this package should work under R 3.0.0, +we still had a dependency on R 3.6.0. This is fixed, meaning that our +package should now work under R 3.0.0.
Improvements for as.rsi()
:
Support for using dplyr
’s across()
to interpret MIC values or disk zone diameters, which also automatically determines the column with microorganism names or codes.
Support for using dplyr
’s across()
to
+interpret MIC values or disk zone diameters, which also automatically
+determines the column with microorganism names or codes.
Cleaning columns in a data.frame now allows you to specify those columns with tidy selection, e.g. as.rsi(df, col1:col9)
Big speed improvement for interpreting MIC values and disk zone diameters. When interpreting 5,000 MIC values of two antibiotics (10,000 values in total), our benchmarks showed a total run time going from 80.7-85.1 seconds to 1.8-2.0 seconds.
Added argument ‘add_intrinsic_resistance’ (defaults to FALSE
), that considers intrinsic resistance according to EUCAST
Fixed a bug where in EUCAST rules the breakpoint for R would be interpreted as “>=” while this should have been “<”
Cleaning columns in a data.frame now allows you to specify those
+columns with tidy selection,
+e.g. as.rsi(df, col1:col9)
Big speed improvement for interpreting MIC values and disk zone +diameters. When interpreting 5,000 MIC values of two antibiotics (10,000 +values in total), our benchmarks showed a total run time going from +80.7-85.1 seconds to 1.8-2.0 seconds.
Added argument ‘add_intrinsic_resistance’ (defaults to
+FALSE
), that considers intrinsic resistance according to
+EUCAST
Fixed a bug where in EUCAST rules the breakpoint for R would be +interpreted as “>=” while this should have been “<”
Added intelligent data cleaning to as.disk()
, so numbers can also be extracted from text and decimal numbers will always be rounded up:
Added intelligent data cleaning to as.disk()
, so
+numbers can also be extracted from text and decimal numbers will always
+be rounded up:
as.disk(c("disk zone: 23.4 mm", 23.4))
@@ -648,47 +1039,102 @@
-
Improvements for as.mo()
:
-- A completely new matching score for ambiguous user input, using
mo_matching_score()
. Any user input value that could mean more than one taxonomic entry is now considered ‘uncertain’. Instead of a warning, a message will be thrown and the accompanying mo_uncertainties()
has been changed completely; it now prints all possible candidates with their matching score.
-- Big speed improvement for already valid microorganism ID. This also means an significant speed improvement for using
mo_*
functions like mo_name()
on microoganism IDs.
-- Added argument
ignore_pattern
to as.mo()
which can also be given to mo_*
functions like mo_name()
, to exclude known non-relevant input from analysing. This can also be set with the option AMR_ignore_pattern
.
+- A completely new matching score for ambiguous user input, using
+
mo_matching_score()
. Any user input value that could mean
+more than one taxonomic entry is now considered ‘uncertain’. Instead of
+a warning, a message will be thrown and the accompanying
+mo_uncertainties()
has been changed completely; it now
+prints all possible candidates with their matching score.
+- Big speed improvement for already valid microorganism ID. This also
+means an significant speed improvement for using
mo_*
+functions like mo_name()
on microoganism IDs.
+- Added argument
ignore_pattern
to as.mo()
+which can also be given to mo_*
functions like
+mo_name()
, to exclude known non-relevant input from
+analysing. This can also be set with the option
+AMR_ignore_pattern
.
-get_locale()
now uses at default Sys.getenv("LANG")
or, if LANG
is not set, Sys.getlocale()
. This can be overwritten by setting the option AMR_locale
.
+get_locale()
now uses at default
+Sys.getenv("LANG")
or, if LANG
is not set,
+Sys.getlocale()
. This can be overwritten by setting the
+option AMR_locale
.
Big speed improvement for eucast_rules()
Overall speed improvement by tweaking joining functions
-Function mo_shortname()
now returns the genus for input where the species is unknown
-BORSA is now recognised as an abbreviation for Staphylococcus aureus, meaning that e.g. mo_genus("BORSA")
will return “Staphylococcus”
-Added a feature from AMR 1.1.0 and earlier again, but now without other package dependencies: tibble
printing support for classes <rsi>
, <mic>
, <disk>
, <ab>
and <mo>
. When using tibble
s containing antimicrobial columns (class <rsi>
), “S” will print in green, “I” will print in yellow and “R” will print in red. Microbial IDs (class <mo>
) will emphasise on the genus and species, not on the kingdom.
-Names of antiviral agents in data set antivirals
now have a starting capital letter, like it is the case in the antibiotics
data set
-Updated the documentation of the WHONET
data set to clarify that all patient names are fictitious
+Function mo_shortname()
now returns the genus for
+input where the species is unknown
+BORSA is now recognised as an abbreviation for Staphylococcus
+aureus, meaning that e.g. mo_genus("BORSA")
will
+return “Staphylococcus”
+Added a feature from AMR 1.1.0 and earlier again, but now without
+other package dependencies: tibble
printing support for
+classes <rsi>
, <mic>
,
+<disk>
, <ab>
and
+<mo>
. When using tibble
s containing
+antimicrobial columns (class <rsi>
), “S” will print
+in green, “I” will print in yellow and “R” will print in red. Microbial
+IDs (class <mo>
) will emphasise on the genus and
+species, not on the kingdom.
+Names of antiviral agents in data set antivirals
now
+have a starting capital letter, like it is the case in the
+antibiotics
data set
+Updated the documentation of the WHONET
data set to
+clarify that all patient names are fictitious
Small as.ab()
algorithm improvements
-Fix for combining MIC values with raw numbers, i.e. c(as.mic(2), 2)
previously failed but now returns a valid MIC class
-ggplot_rsi()
and geom_rsi()
gained arguments minimum
and language
, to influence the internal use of rsi_df()
+Fix for combining MIC values with raw numbers,
+i.e. c(as.mic(2), 2)
previously failed but now returns a
+valid MIC class
+ggplot_rsi()
and geom_rsi()
gained
+arguments minimum
and language
, to influence
+the internal use of rsi_df()
-
Changes in the antibiotics
data set:
- Updated oral and parental DDDs from the WHOCC
- Added abbreviation “piptazo” to ‘Piperacillin/tazobactam’ (TZP)
-- ‘Penicillin G’ (for intravenous use) is now named ‘Benzylpenicillin’ (code
PEN
)
-- ‘Penicillin V’ (for oral use, code
PNV
) was removed, since its actual entry ‘Phenoxymethylpenicillin’ (code PHN
) already existed
-- The group name (
antibiotics$group
) of ‘Linezolid’ (LNZ
), ‘Cycloserine’ (CYC
), ‘Tedizolid’ (TZD
) and ‘Thiacetazone’ (THA
) is now “Oxazolidinones” instead of “Other antibacterials”
+- ‘Penicillin G’ (for intravenous use) is now named ‘Benzylpenicillin’
+(code
PEN
)
+- ‘Penicillin V’ (for oral use, code
PNV
) was removed,
+since its actual entry ‘Phenoxymethylpenicillin’ (code PHN
)
+already existed
+- The group name (
antibiotics$group
) of ‘Linezolid’
+(LNZ
), ‘Cycloserine’ (CYC
), ‘Tedizolid’
+(TZD
) and ‘Thiacetazone’ (THA
) is now
+“Oxazolidinones” instead of “Other antibacterials”
-Added support for using unique()
on classes <rsi>
, <mic>
, <disk>
, <ab>
and <mo>
-Added argument excess
to the kurtosis()
function (defaults to FALSE
), to return the excess kurtosis, defined as the kurtosis minus three.
+Added support for using unique()
on classes
+<rsi>
, <mic>
,
+<disk>
, <ab>
and
+<mo>
+Added argument excess
to the kurtosis()
+function (defaults to FALSE
), to return the excess
+kurtosis, defined as the kurtosis minus three.
portion_R()
, portion_S()
and portion_I()
that were deprecated since version 0.9.0 (November 2019) and were replaced with proportion_R()
, proportion_S()
and proportion_I()
+portion_R()
, portion_S()
+and portion_I()
that were deprecated since version 0.9.0
+(November 2019) and were replaced with proportion_R()
,
+proportion_S()
and proportion_I()
base
packageSuggests
field of the DESCRIPTION
fileSuggests
field of the DESCRIPTION
fileFunction ab_from_text()
to retrieve antimicrobial drug names, doses and forms of administration from clinical texts in e.g. health care records, which also corrects for misspelling since it uses as.ab()
internally
Function ab_from_text()
to retrieve antimicrobial
+drug names, doses and forms of administration from clinical texts in
+e.g. health care records, which also corrects for misspelling since it
+uses as.ab()
internally
Tidyverse selection helpers for antibiotic classes, that help to select the columns of antibiotics that are of a specific antibiotic class, without the need to define the columns or antibiotic abbreviations. They can be used in any function that allows selection helpers, like dplyr::select()
and tidyr::pivot_longer()
:
Tidyverse
+selection helpers for antibiotic classes, that help to select the
+columns of antibiotics that are of a specific antibiotic class, without
+the need to define the columns or antibiotic abbreviations. They can be
+used in any function that allows selection helpers, like
+dplyr::select()
and tidyr::pivot_longer()
:
library(dplyr)
@@ -698,54 +1144,105 @@
select(carbapenems())
#> Selecting carbapenems: `IPM` (imipenem), `MEM` (meropenem)
Added mo_domain()
as an alias to mo_kingdom()
Added function filter_penicillins()
to filter isolates on a specific result in any column with a name in the antimicrobial ‘penicillins’ class (more specific: ATC subgroup Beta-lactam antibacterials, penicillins)
Added official antimicrobial names to all filter_ab_class()
functions, such as filter_aminoglycosides()
Added antibiotics code “FOX1” for cefoxitin screening (abbreviation “cfsc”) to the antibiotics
data set
Added mo_domain()
as an alias to
+mo_kingdom()
Added function filter_penicillins()
to filter
+isolates on a specific result in any column with a name in the
+antimicrobial ‘penicillins’ class (more specific: ATC subgroup
+Beta-lactam antibacterials, penicillins)
Added official antimicrobial names to all
+filter_ab_class()
functions, such as
+filter_aminoglycosides()
Added antibiotics code “FOX1” for cefoxitin screening
+(abbreviation “cfsc”) to the antibiotics
data set
Added Monuril as trade name for fosfomycin
Added argument conserve_capped_values
to as.rsi()
for interpreting MIC values - it makes sure that values starting with “<” (but not “<=”) will always return “S” and values starting with “>” (but not “>=”) will always return “R”. The default behaviour of as.rsi()
has not changed, so you need to specifically do as.rsi(..., conserve_capped_values = TRUE)
.
Added argument conserve_capped_values
to
+as.rsi()
for interpreting MIC values - it makes sure that
+values starting with “<” (but not “<=”) will always return “S” and
+values starting with “>” (but not “>=”) will always return “R”.
+The default behaviour of as.rsi()
has not changed, so you
+need to specifically do
+as.rsi(..., conserve_capped_values = TRUE)
.
Big speed improvement for using any function on microorganism codes from earlier package versions (prior to AMR
v1.2.0), such as as.mo()
, mo_name()
, first_isolate()
, eucast_rules()
, mdro()
, etc.
As a consequence, very old microbial codes (from AMR
v0.5.0 and lower) are not supported anymore. Use as.mo()
on your microorganism names or codes to transform them to current abbreviations used in this package.
Big speed improvement for using any function on microorganism
+codes from earlier package versions (prior to AMR
v1.2.0),
+such as as.mo()
, mo_name()
,
+first_isolate()
, eucast_rules()
,
+mdro()
, etc.
As a consequence, very old microbial codes (from AMR
+v0.5.0 and lower) are not supported anymore. Use
+as.mo()
on your microorganism names or codes to transform
+them to current abbreviations used in this package.
Improvements for susceptibility()
and resistance()
and all count_*()
, proportion_*()
functions:
dplyr::all_of()
) now works againImprovements for susceptibility()
and
+resistance()
and all count_*()
,
+proportion_*()
functions:
dplyr::all_of()
) now works againImprovements for as.ab()
:
as.ab()
, making many more input errors translatable, such as digitalised health care records, using too few or too many vowels or consonants and many moreas.ab()
,
+making many more input errors translatable, such as digitalised health
+care records, using too few or too many vowels or consonants and many
+moreas.ab()
would return an error on invalid input valuesas.ab()
function will now throw a note if more than 1 antimicrobial drug could be retrieved from a single input value.as.ab()
would return an error on
+invalid input valuesas.ab()
function will now throw a note if more than
+1 antimicrobial drug could be retrieved from a single input value.Fixed a bug where eucast_rules()
would not work on a tibble when the tibble
or dplyr
package was loaded
Fixed a bug for CLSI 2019 guidelines (using as.rsi()
), that also included results for animals. It now only contains interpretation guidelines for humans.
All *_join_microorganisms()
functions and bug_drug_combinations()
now return the original data class (e.g. tibble
s and data.table
s)
Fixed a bug where eucast_rules()
would not work on a
+tibble when the tibble
or dplyr
package was
+loaded
Fixed a bug for CLSI 2019 guidelines (using
+as.rsi()
), that also included results for animals. It now
+only contains interpretation guidelines for humans.
All *_join_microorganisms()
functions and
+bug_drug_combinations()
now return the original data class
+(e.g. tibble
s and data.table
s)
For functions rsi_df()
, proportion_df()
and count_df()
:
For functions rsi_df()
, proportion_df()
+and count_df()
:
count_df()
) when all antibiotics in the data set have only NA
scount_df()
)
+when all antibiotics in the data set have only NA
sImproved auto-determination for columns of types <mo>
and <Date>
Fixed a bug in bug_drug_combinations()
for when only one antibiotic was in the input data
Changed the summary for class <rsi>
, to highlight the %SI vs. %R
Improved error handling, giving more useful info when functions return an error
Any progress bar will now only show in interactive mode (i.e. not in R Markdown)
Speed improvement for mdro()
and filter_ab_class()
New option arrows_textangled
for ggplot_pca()
to indicate whether the text at the end of the arrows should be angled (defaults to TRUE
, as it was in previous versions)
Improved auto-determination for columns of types
+<mo>
and <Date>
Fixed a bug in bug_drug_combinations()
for when only
+one antibiotic was in the input data
Changed the summary for class <rsi>
, to
+highlight the %SI vs. %R
Improved error handling, giving more useful info when functions +return an error
Any progress bar will now only show in interactive mode (i.e. not +in R Markdown)
Speed improvement for mdro()
and
+filter_ab_class()
New option arrows_textangled
for
+ggplot_pca()
to indicate whether the text at the end of the
+arrows should be angled (defaults to TRUE
, as it was in
+previous versions)
Added parenteral DDD to benzylpenicillin
Fixed a bug where as.mic()
could not handle dots without a leading zero (like "<=.25
)
Fixed a bug where as.mic()
could not handle dots
+without a leading zero (like "<=.25
)
Removed code dependency on all other R packages, making this package fully independent of the development process of others. This is a major code change, but will probably not be noticeable by most users.
-Making this package independent of especially the tidyverse (e.g. packages dplyr
and tidyr
) tremendously increases sustainability on the long term, since tidyverse functions change quite often. Good for users, but hard for package maintainers. Most of our functions are replaced with versions that only rely on base R, which keeps this package fully functional for many years to come, without requiring a lot of maintenance to keep up with other packages anymore. Another upside it that this package can now be used with all versions of R since R-3.0.0 (April 2013). Our package is being used in settings where the resources are very limited. Fewer dependencies on newer software is helpful for such settings.
Removed code dependency on all other R packages, making this +package fully independent of the development process of others. This is +a major code change, but will probably not be noticeable by most +users.
+Making this package independent of especially the tidyverse
+(e.g. packages dplyr
and tidyr
) tremendously
+increases sustainability on the long term, since tidyverse functions
+change quite often. Good for users, but hard for package maintainers.
+Most of our functions are replaced with versions that only rely on base
+R, which keeps this package fully functional for many years to come,
+without requiring a lot of maintenance to keep up with other packages
+anymore. Another upside it that this package can now be used with all
+versions of R since R-3.0.0 (April 2013). Our package is being used in
+settings where the resources are very limited. Fewer dependencies on
+newer software is helpful for such settings.
Negative effects of this change are:
-freq()
that was borrowed from the cleaner
package was removed. Use cleaner::freq()
, or run library("cleaner")
before you use freq()
.mo
or rsi
in a tibble will no longer be in colour and printing rsi
in a tibble will show the class <ord>
, not <rsi>
anymore. This is purely a visual effect.mo_*
family (like mo_name()
and mo_gramstain()
) are noticeably slower when running on hundreds of thousands of rows.mo
and ab
now both also inherit class character
, to support any data transformation. This change invalidates code that checks for class length == 1.freq()
that was borrowed from the
+cleaner
package was removed. Use
+cleaner::freq()
, or run library("cleaner")
+before you use freq()
.mo
or rsi
in
+a tibble will no longer be in colour and printing rsi
in a
+tibble will show the class <ord>
, not
+<rsi>
anymore. This is purely a visual
+effect.mo_*
family (like
+mo_name()
and mo_gramstain()
) are noticeably
+slower when running on hundreds of thousands of rows.mo
and ab
now both
+also inherit class character
, to support any data
+transformation. This change invalidates code that checks for class
+length == 1.first_isolate()
), since some bacterial names might be renamed to other genera or other (sub)species. This is expected behaviour.first_isolate()
), since some bacterial names might
+be renamed to other genera or other (sub)species. This is expected
+behaviour.eucast_rules()
function no longer applies “other” rules at default that are made available by this package (like setting ampicillin = R when ampicillin + enzyme inhibitor = R). The default input value for rules
is now c("breakpoints", "expert")
instead of "all"
, but this can be changed by the user. To return to the old behaviour, set options(AMR.eucast_rules = "all")
.antibiotics
data set these two rules:
-eucast_rules()
function no longer applies “other”
+rules at default that are made available by this package (like setting
+ampicillin = R when ampicillin + enzyme inhibitor = R). The default
+input value for rules
is now
+c("breakpoints", "expert")
instead of "all"
,
+but this can be changed by the user. To return to the old behaviour, set
+options(AMR.eucast_rules = "all")
.antibiotics
data set these two rules:
+eucast_rules()
+This works for all drug combinations, such as ampicillin/sulbactam,
+ceftazidime/avibactam, trimethoprim/sulfamethoxazole, etc.eucast_rules()
ab_url()
to return the direct URL of an antimicrobial agent from the official WHO websiteas.ab()
, so that e.g. as.ab("ampi sul")
and ab_name("ampi sul")
workab_atc()
and ab_group()
now return NA
if no antimicrobial agent could be foundset_mo_source()
to make sure that column mo
will always be the second columnab_url()
to return the direct URL of an
+antimicrobial agent from the official WHO websiteas.ab()
, so that
+e.g. as.ab("ampi sul")
and ab_name("ampi sul")
+workab_atc()
and ab_group()
now
+return NA
if no antimicrobial agent could be foundset_mo_source()
to make sure that column
+mo
will always be the second columnp.symbol()
- it was replaced with p_symbol()
+p.symbol()
- it
+was replaced with p_symbol()
read.4d()
, that was only useful for reading data from an old test database.read.4d()
, that was only useful for
+reading data from an old test database.pca()
functionggplot_pca()
functionpca()
functionggplot_pca()
functionas.mo()
(and consequently all mo_*
functions, that use as.mo()
internally):
-SPE
for species, like "ESCSPE"
for Escherichia coli
+as.mo()
(and
+consequently all mo_*
functions, that use
+as.mo()
internally):
+SPE
for species, like
+"ESCSPE"
for Escherichia coli
antibiotics
data setas.rsi()
for years 2010-2019 (thanks to Anthony Underwood)antibiotics
data
+setas.rsi()
for years 2010-2019 (thanks to Anthony
+Underwood)Fixed important floating point error for some MIC comparisons in EUCAST 2020 guideline
Fixed important floating point error for some MIC comparisons in +EUCAST 2020 guideline
Interpretation from MIC values (and disk zones) to R/SI can now be used with mutate_at()
of the dplyr
package:
Interpretation from MIC values (and disk zones) to R/SI can now
+be used with mutate_at()
of the dplyr
+package:
Added antibiotic abbreviations for a laboratory manufacturer (GLIMS) for cefuroxime, cefotaxime, ceftazidime, cefepime, cefoxitin and trimethoprim/sulfamethoxazole
Added uti
(as abbreviation of urinary tract infections) as argument to as.rsi()
, so interpretation of MIC values and disk zones can be made dependent on isolates specifically from UTIs
Info printing in functions eucast_rules()
, first_isolate()
, mdro()
and resistance_predict()
will now at default only print when R is in an interactive mode (i.e. not in RMarkdown)
Added antibiotic abbreviations for a laboratory manufacturer +(GLIMS) for cefuroxime, cefotaxime, ceftazidime, cefepime, cefoxitin and +trimethoprim/sulfamethoxazole
Added uti
(as abbreviation of urinary tract
+infections) as argument to as.rsi()
, so interpretation of
+MIC values and disk zones can be made dependent on isolates specifically
+from UTIs
Info printing in functions eucast_rules()
,
+first_isolate()
, mdro()
and
+resistance_predict()
will now at default only print when R
+is in an interactive mode (i.e. not in RMarkdown)
This software is now out of beta and considered stable. Nonetheless, this package will be developed continually.
+This software is now out of beta and considered stable. Nonetheless, +this package will be developed continually.
as.rsi()
and inferred resistance and susceptibility using eucast_rules()
.as.rsi()
and
+inferred resistance and susceptibility using
+eucast_rules()
.Support for LOINC codes in the antibiotics
data set. Use ab_loinc()
to retrieve LOINC codes, or use a LOINC code for input in any ab_*
function:
Support for LOINC codes in the antibiotics
data set.
+Use ab_loinc()
to retrieve LOINC codes, or use a LOINC code
+for input in any ab_*
function:
ab_loinc("ampicillin")
@@ -863,7 +1456,9 @@ This works for all drug combinations, such as ampicillin/sulbactam, ceftazidime/
#> [1] "J01CA01"
Support for SNOMED CT codes in the microorganisms
data set. Use mo_snomed()
to retrieve SNOMED codes, or use a SNOMED code for input in any mo_*
function:
Support for SNOMED CT codes in the microorganisms
+data set. Use mo_snomed()
to retrieve SNOMED codes, or use
+a SNOMED code for input in any mo_*
function:
mo_snomed("S. aureus")
@@ -877,25 +1472,47 @@ This works for all drug combinations, such as ampicillin/sulbactam, ceftazidime/
as.mo()
function previously wrote to the package folder to improve calculation speed for previously calculated results. This is no longer the case, to comply with CRAN policies. Consequently, the function clear_mo_history()
was removed.as.rsi()
+as.mo()
function previously wrote to the package
+folder to improve calculation speed for previously calculated results.
+This is no longer the case, to comply with CRAN policies. Consequently,
+the function clear_mo_history()
was removed.as.rsi()
as.mo()
(and consequently all mo_*
functions, that use as.mo()
internally):
-as.mo("Methicillin-resistant S.aureus")
+as.mo()
(and
+consequently all mo_*
functions, that use
+as.mo()
internally):
+as.mo("Methicillin-resistant S.aureus")
as.disk()
limited to a maximum of 50 millimeterstidyverse
+as.disk()
limited to a maximum of 50
+millimeterstidyverse
as.ab()
: support for drugs starting with “co-” like co-amoxiclav, co-trimoxazole, co-trimazine and co-trimazole (thanks to Peter Dutey)antibiotics
data set (thanks to Peter Dutey):
-RIF
) to rifampicin/isoniazid (RFI
). Please note that the combination rifampicin/isoniazid has no DDDs defined, so e.g. ab_ddd("Rimactazid")
will now return NA
.SMX
) to trimethoprim/sulfamethoxazole (SXT
)as.ab()
: support for drugs starting with “co-”
+like co-amoxiclav, co-trimoxazole, co-trimazine and co-trimazole (thanks
+to Peter Dutey)antibiotics
data set (thanks to Peter
+Dutey):
+RIF
) to rifampicin/isoniazid (RFI
). Please
+note that the
+combination rifampicin/isoniazid has no DDDs defined, so
+e.g. ab_ddd("Rimactazid")
will now return
+NA
.SMX
) to trimethoprim/sulfamethoxazole
+(SXT
)microorganisms
data set, which means that the new order Enterobacterales now consists of a part of the existing family Enterobacteriaceae, but that this family has been split into other families as well (like Morganellaceae and Yersiniaceae). Although published in 2016, this information is not yet in the Catalogue of Life version of 2019. All MDRO determinations with mdro()
will now use the Enterobacterales order for all guidelines before 2016 that were dependent on the Enterobacteriaceae family.
+microorganisms
data set, which means that the new order
+Enterobacterales now consists of a part of the existing family
+Enterobacteriaceae, but that this family has been split into other
+families as well (like Morganellaceae and
+Yersiniaceae). Although published in 2016, this information is
+not yet in the Catalogue of Life version of 2019. All MDRO
+determinations with mdro()
will now use the
+Enterobacterales order for all guidelines before 2016 that were
+dependent on the Enterobacteriaceae family.
If you were dependent on the old Enterobacteriaceae family e.g. by using in your code:
+If you were dependent on the old Enterobacteriaceae family +e.g. by using in your code:
if (mo_family(somebugs) == "Enterobacteriaceae") ...
Functions susceptibility()
and resistance()
as aliases of proportion_SI()
and proportion_R()
, respectively. These functions were added to make it more clear that “I” should be considered susceptible and not resistant.
Functions susceptibility()
and
+resistance()
as aliases of proportion_SI()
and
+proportion_R()
, respectively. These functions were added to
+make it more clear that “I” should be considered susceptible and not
+resistant.
Support for a new MDRO guideline: Magiorakos AP, Srinivasan A et al. “Multidrug-resistant, extensively drug-resistant and pandrug-resistant bacteria: an international expert proposal for interim standard definitions for acquired resistance.” Clinical Microbiology and Infection (2012).
-mdro()
functionmdro(...., verbose = TRUE)
) returns an informative data set where the reason for MDRO determination is given for every isolate, and an list of the resistant antimicrobial agentsSupport for a new MDRO guideline: Magiorakos AP, Srinivasan A +et al. “Multidrug-resistant, extensively drug-resistant and +pandrug-resistant bacteria: an international expert proposal for interim +standard definitions for acquired resistance.” Clinical Microbiology and +Infection (2012).
+mdro()
+functionmdro(...., verbose = TRUE)
)
+returns an informative data set where the reason for MDRO determination
+is given for every isolate, and an list of the resistant antimicrobial
+agentsData set antivirals
, containing all entries from the ATC J05 group with their DDDs for oral and parenteral treatment
Data set antivirals
, containing all entries from the
+ATC J05 group with their DDDs for oral and parenteral treatment
as.mo()
:
-Now allows “ou” where “au” should have been used and vice versa
More intelligent way of coping with some consonants like “l” and “r”
Now allows “ou” where “au” should have been used and vice +versa
More intelligent way of coping with some consonants like “l” and +“r”
Added a score (a certainty percentage) to mo_uncertainties()
, that is calculated using the Levenshtein distance:
Added a score (a certainty percentage) to
+mo_uncertainties()
, that is calculated using the Levenshtein
+distance:
as.atc()
- this function was replaced by ab_atc()
+as.atc()
- this
+function was replaced by ab_atc()
portion_*
functions to proportion_*
. All portion_*
functions are still available as deprecated functions, and will return a warning when used.as.rsi()
over a data set, it will now print the guideline that will be used if it is not specified by the userportion_*
functions to
+proportion_*
. All portion_*
functions are
+still available as deprecated functions, and will return a warning when
+used.as.rsi()
over a data set, it will now
+print the guideline that will be used if it is not specified by the
+usereucast_rules()
:
-eucast_rules()
are now applied first and not as last anymore. This is to improve the dependency on certain antibiotics for the official EUCAST rules. Please see ?eucast_rules
.eucast_rules()
are now applied
+first and not as last anymore. This is to improve the dependency on
+certain antibiotics for the official EUCAST rules. Please see
+?eucast_rules
.as.rsi()
where the input is NA
+as.rsi()
where the
+input is NA
mdro()
and eucast_rules()
+mdro()
and eucast_rules()
antibiotics
data setantibiotics
data setexample_isolates
data set to better reflect realityexample_isolates
data set to
+better reflect realitymo_info()
clean
to cleaner
, as this package was renamed accordingly upon CRAN requestclean
to cleaner
, as
+this package was renamed accordingly upon CRAN requestDetermination of first isolates now excludes all ‘unknown’ microorganisms at default, i.e. microbial code "UNKNOWN"
. They can be included with the new argument include_unknown
:
Determination of first isolates now excludes all
+‘unknown’ microorganisms at default, i.e. microbial code
+"UNKNOWN"
. They can be included with the new argument
+include_unknown
:
first_isolate(..., include_unknown = TRUE)
For WHONET users, this means that all records/isolates with organism code "con"
(contamination) will be excluded at default, since as.mo("con") = "UNKNOWN"
. The function always shows a note with the number of ‘unknown’ microorganisms that were included or excluded.
For WHONET users, this means that all records/isolates with organism
+code "con"
(contamination) will be excluded at
+default, since as.mo("con") = "UNKNOWN"
. The function
+always shows a note with the number of ‘unknown’ microorganisms that
+were included or excluded.
For code consistency, classes ab
and mo
will now be preserved in any subsetting or assignment. For the sake of data integrity, this means that invalid assignments will now result in NA
:
For code consistency, classes ab
and mo
+will now be preserved in any subsetting or assignment. For the sake of
+data integrity, this means that invalid assignments will now result in
+NA
:
# how it works in base R:
@@ -1017,15 +1694,26 @@ This works for all drug combinations, such as ampicillin/sulbactam, ceftazidime/
x[1] <- "testvalue"
#> Warning message:
#> invalid microorganism code, NA generated
This is important, because a value like "testvalue"
could never be understood by e.g. mo_name()
, although the class would suggest a valid microbial code.
This is important, because a value like "testvalue"
+could never be understood by e.g. mo_name()
, although the
+class would suggest a valid microbial code.
Function freq()
has moved to a new package, clean
(CRAN link), since creating frequency tables actually does not fit the scope of this package. The freq()
function still works, since it is re-exported from the clean
package (which will be installed automatically upon updating this AMR
package).
Renamed data set septic_patients
to example_isolates
Function freq()
has moved to a new package, clean
(CRAN link), since
+creating frequency tables actually does not fit the scope of this
+package. The freq()
function still works, since it is
+re-exported from the clean
package (which will be installed
+automatically upon updating this AMR
package).
Renamed data set septic_patients
to
+example_isolates
Function bug_drug_combinations()
to quickly get a data.frame
with the results of all bug-drug combinations in a data set. The column containing microorganism codes is guessed automatically and its input is transformed with mo_shortname()
at default:
Function bug_drug_combinations()
to quickly get a
+data.frame
with the results of all bug-drug combinations in
+a data set. The column containing microorganism codes is guessed
+automatically and its input is transformed with
+mo_shortname()
at default:
x <- bug_drug_combinations(example_isolates)
@@ -1048,13 +1736,25 @@ This works for all drug combinations, such as ampicillin/sulbactam, ceftazidime/
#> 3 Gram-negative AMP 227 0 405 632
#> 4 Gram-negative AMX 227 0 405 632
#> NOTE: Use 'format()' on this result to get a publicable/printable format.
You can format this to a printable format, ready for reporting or exporting to e.g. Excel with the base R format()
function:
You can format this to a printable format, ready for reporting or
+exporting to e.g. Excel with the base R format()
+function:
format(x, combine_IR = FALSE)
Additional way to calculate co-resistance, i.e. when using multiple antimicrobials as input for portion_*
functions or count_*
functions. This can be used to determine the empiric susceptibility of a combination therapy. A new argument only_all_tested
(which defaults to FALSE
) replaces the old also_single_tested
and can be used to select one of the two methods to count isolates and calculate portions. The difference can be seen in this example table (which is also on the portion
and count
help pages), where the %SI is being determined:
Additional way to calculate co-resistance, i.e. when using
+multiple antimicrobials as input for portion_*
functions or
+count_*
functions. This can be used to determine the
+empiric susceptibility of a combination therapy. A new argument
+only_all_tested
(which defaults to
+FALSE
) replaces the old
+also_single_tested
and can be used to select one of the two
+methods to count isolates and calculate portions. The difference can be
+seen in this example table (which is also on the portion
+and count
help pages), where the %SI is being
+determined:
# --------------------------------------------------------------------
@@ -1073,10 +1773,18 @@ This works for all drug combinations, such as ampicillin/sulbactam, ceftazidime/
# R <NA> - - - -
# <NA> <NA> - - - -
# --------------------------------------------------------------------
Since this is a major change, usage of the old also_single_tested
will throw an informative error that it has been replaced by only_all_tested
.
Since this is a major change, usage of the old
+also_single_tested
will throw an informative error that it
+has been replaced by only_all_tested
.
tibble
printing support for classes rsi
, mic
, disk
, ab
mo
. When using tibble
s containing antimicrobial columns, values S
will print in green, values I
will print in yellow and values R
will print in red. Microbial IDs (class mo
) will emphasise on the genus and species, not on the kingdom.
tibble
printing support for classes
+rsi
, mic
, disk
, ab
+mo
. When using tibble
s containing
+antimicrobial columns, values S
will print in green, values
+I
will print in yellow and values R
will print
+in red. Microbial IDs (class mo
) will emphasise on the
+genus and species, not on the kingdom.
# (run this on your own console, as this page does not support colour printing)
@@ -1088,44 +1796,93 @@ This works for all drug combinations, such as ampicillin/sulbactam, ceftazidime/
as.mo()
(of which some led to additions to the microorganisms
data set). Many thanks to all contributors that helped improving the algorithms.
-as.mo()
(of which some
+led to additions to the microorganisms
data set). Many
+thanks to all contributors that helped improving the algorithms.
+B_ENTRC_FAE
could have been both E. faecalis and E. faecium. Its new code is B_ENTRC_FCLS
and E. faecium has become B_ENTRC_FACM
. Also, the Latin character ae is now preserved at the start of each genus and species abbreviation. For example, the old code for Aerococcus urinae was B_ARCCC_NAE
. This is now B_AERCC_URIN
. IMPORTANT: Old microorganism IDs are still supported, but support will be dropped in a future version. Use as.mo()
on your old codes to transform them to the new format. Using functions from the mo_*
family (like mo_name()
and mo_gramstain()
) on old codes, will throw a warning.B_ENTRC_FAE
could have been both E.
+faecalis and E. faecium. Its new code is
+B_ENTRC_FCLS
and E. faecium has become
+B_ENTRC_FACM
. Also, the Latin character ae is now preserved
+at the start of each genus and species abbreviation. For example, the
+old code for Aerococcus urinae was B_ARCCC_NAE
.
+This is now B_AERCC_URIN
. IMPORTANT: Old
+microorganism IDs are still supported, but support will be dropped in a
+future version. Use as.mo()
on your old codes to transform
+them to the new format. Using functions from the mo_*
+family (like mo_name()
and mo_gramstain()
) on
+old codes, will throw a warning.as.ab()
, including bidirectional language supportmdro()
function, to determine multi-drug resistant organismsas.ab()
, including
+bidirectional language supportmdro()
function, to determine multi-drug resistant
+organismseucast_rules()
:
eucast_rules(..., verbose = TRUE)
) returns more informative and readable outputeucast_rules(..., verbose = TRUE)
) returns more
+informative and readable outputAMR:::get_column_abx()
)atc
- using as.atc()
is now deprecated in favour of ab_atc()
and this will return a character, not the atc
class anymoreabname()
, ab_official()
, atc_name()
, atc_official()
, atc_property()
, atc_tradenames()
, atc_trivial_nl()
+AMR:::get_column_abx()
)atc
- using as.atc()
is now
+deprecated in favour of ab_atc()
and this will return a
+character, not the atc
class anymoreabname()
,
+ab_official()
, atc_name()
,
+atc_official()
, atc_property()
,
+atc_tradenames()
, atc_trivial_nl()
mo_shortname()
mo_*
functions where the coercion uncertainties and failures would not be available through mo_uncertainties()
and mo_failures()
anymorecountry
argument of mdro()
in favour of the already existing guideline
argument to support multiple guidelines within one countryname
of RIF
is now Rifampicin instead of Rifampinantibiotics
data set is now sorted by name and all cephalosporins now have their generation between bracketsguess_ab_col()
which is now 30 times faster for antibiotic abbreviationsfilter_ab_class()
to be more reliable and to support 5th generation cephalosporinsavailability()
now uses portion_R()
instead of portion_IR()
, to comply with EUCAST insightsage()
and age_groups()
now have a na.rm
argument to remove empty valuesp.symbol()
to p_symbol()
(the former is now deprecated and will be removed in a future version)x
in age_groups()
will now introduce NA
s and not return an error anymoremo_*
functions where the coercion
+uncertainties and failures would not be available through
+mo_uncertainties()
and mo_failures()
+anymorecountry
argument of mdro()
+in favour of the already existing guideline
argument to
+support multiple guidelines within one countryname
of RIF
is now Rifampicin instead
+of Rifampinantibiotics
data set is now sorted by name and all
+cephalosporins now have their generation between bracketsguess_ab_col()
which is now 30
+times faster for antibiotic abbreviationsfilter_ab_class()
to be more reliable and to
+support 5th generation cephalosporinsavailability()
now uses
+portion_R()
instead of portion_IR()
, to comply
+with EUCAST insightsage()
and age_groups()
now have
+a na.rm
argument to remove empty valuesp.symbol()
to p_symbol()
+(the former is now deprecated and will be removed in a future
+version)x
in
+age_groups()
will now introduce NA
s and not
+return an error anymorekey_antibiotics()
on foreign systemsas.mic()
)lintr
packagelintr
packageFunction rsi_df()
to transform a data.frame
to a data set containing only the microbial interpretation (S, I, R), the antibiotic, the percentage of S/I/R and the number of available isolates. This is a convenient combination of the existing functions count_df()
and portion_df()
to immediately show resistance percentages and number of available isolates:
Function rsi_df()
to transform a
+data.frame
to a data set containing only the microbial
+interpretation (S, I, R), the antibiotic, the percentage of S/I/R and
+the number of available isolates. This is a convenient combination of
+the existing functions count_df()
and
+portion_df()
to immediately show resistance percentages and
+number of available isolates:
septic_patients %>%
@@ -1157,7 +1923,8 @@ This works for all drug combinations, such as ampicillin/sulbactam, ceftazidime/
# 4 Ciprofloxacin R 0.1618169 228
Support for all scientifically published pathotypes of E. coli to date (that we could find). Supported are:
+Support for all scientifically published pathotypes of E. +coli to date (that we could find). Supported are:
Function mo_info()
as an analogy to ab_info()
. The mo_info()
prints a list with the full taxonomy, authors, and the URL to the online database of a microorganism
Function mo_synonyms()
to get all previously accepted taxonomic names of a microorganism
Function mo_info()
as an analogy to
+ab_info()
. The mo_info()
prints a list with
+the full taxonomy, authors, and the URL to the online database of a
+microorganism
Function mo_synonyms()
to get all previously
+accepted taxonomic names of a microorganism
count_df()
and portion_df()
are now lowercasecount_df()
and
+portion_df()
are now lowercaseas.ab()
and as.mo()
to understand even more severely misspelled inputas.ab()
now allows spaces for coercing antibiotics namesggplot2
methods for automatically determining the scale type of classes mo
and ab
+as.ab()
and
+as.mo()
to understand even more severely misspelled
+inputas.ab()
now allows spaces for coercing
+antibiotics namesggplot2
methods for automatically determining the
+scale type of classes mo
and ab
"bacteria"
from getting coerced by as.ab()
because Bacterial is a brand name of trimethoprim (TMP)eucast_rules()
and mdro()
+"bacteria"
from getting coerced by
+as.ab()
because Bacterial is a brand name of trimethoprim
+(TMP)eucast_rules()
and mdro()
latest_annual_release
from the catalogue_of_life_version()
functionPVM1
from the antibiotics
data set as this was a duplicate of PME
+latest_annual_release
from the
+catalogue_of_life_version()
functionPVM1
from the
+antibiotics
data set as this was a duplicate of
+PME
as.mo()
+as.mo()
plot()
and barplot()
for MIC and RSI classesas.mo()
+plot()
and barplot()
+for MIC and RSI classesas.mo()
as.rsi()
on an MIC value (created with as.mic()
), a disk diffusion value (created with the new as.disk()
) or on a complete date set containing columns with MIC or disk diffusion values.mo_name()
as alias of mo_fullname()
+as.rsi()
+on an MIC value (created with as.mic()
), a disk diffusion
+value (created with the new as.disk()
) or on a complete
+date set containing columns with MIC or disk diffusion values.mo_name()
as alias of
+mo_fullname()
mdr_tb()
) and added a new vignette about MDR. Read this tutorial here on our website.mdr_tb()
) and added a new vignette about MDR. Read
+this tutorial here on our
+website.first_isolate()
where missing species would lead to incorrect FALSEs. This bug was not present in AMR v0.5.0, but was in v0.6.0 and v0.6.1.eucast_rules()
where antibiotics from WHONET software would not be recognisedfirst_isolate()
where missing
+species would lead to incorrect FALSEs. This bug was not present in AMR
+v0.5.0, but was in v0.6.0 and v0.6.1.eucast_rules()
where antibiotics from
+WHONET software would not be recognisedantibiotics
data set:
ab
contains a human readable EARS-Net code, used by ECDC and WHO/WHONET - this is the primary identifier used in this packageatc
contains the ATC code, used by WHO/WHOCCcid
contains the CID code (Compound ID), used by PubChemab
contains a human readable EARS-Net code, used
+by ECDC and WHO/WHONET - this is the primary identifier used in this
+packageatc
contains the ATC code, used by
+WHO/WHOCCcid
contains the CID code (Compound ID), used by
+PubChemAMX
for amoxicillinatc_certe
, ab_umcg
and atc_trivial_nl
have been removedatc_*
functions are superseded by ab_*
functionsAMX
for amoxicillinatc_certe
, ab_umcg
and
+atc_trivial_nl
have been removedatc_*
functions are superseded by ab_*
+functionsggplot_rsi()
:
colours
to set the bar colourstitle
, subtitle
, caption
, x.title
and y.title
to set titles and axis descriptionstitle
, subtitle
,
+caption
, x.title
and y.title
to
+set titles and axis descriptionsguess_ab_col()
+guess_ab_col()
microorganisms.old
data set, which leads to better results finding when using the as.mo()
functionportion_df()
and count_df()
this means that their new argument combine_SI
is TRUE at default. Our plotting function ggplot_rsi()
also reflects this change since it uses count_df()
internally.age()
function gained a new argument exact
to determine ages with decimalsguess_mo()
, guess_atc()
, EUCAST_rules()
, interpretive_reading()
, rsi()
+microorganisms.old
data set, which leads to better results
+finding when using the as.mo()
functionportion_df()
and count_df()
this means that
+their new argument combine_SI
is TRUE at default. Our
+plotting function ggplot_rsi()
also reflects this change
+since it uses count_df()
internally.age()
function gained a new argument
+exact
to determine ages with decimalsguess_mo()
,
+guess_atc()
, EUCAST_rules()
,
+interpretive_reading()
, rsi()
freq()
):
+freq()
):
speed improvement for microbial IDs
fixed factor level names for R Markdown
when all values are unique it now shows a message instead of a warning
when all values are unique it now shows a message instead of a +warning
support for boxplots:
age_groups()
, to let groups of fives and tens end with 100+ instead of 120+freq()
for when all values are NA
+age_groups()
, to let
+groups of fives and tens end with 100+ instead of 120+freq()
for when all values are
+NA
first_isolate()
for when dates are missingguess_ab_col()
as.mo()
now gently interprets any number of whitespace characters (like tabs) as one spaceas.mo()
now returns UNKNOWN
for "con"
(WHONET ID of ‘contamination’) and returns NA
for "xxx"
(WHONET ID of ‘no growth’)as.mo()
now gently interprets any number of
+whitespace characters (like tabs) as one spaceas.mo()
now returns UNKNOWN
for
+"con"
(WHONET ID of ‘contamination’) and returns
+NA
for "xxx"
(WHONET ID of ‘no growth’)as.mo()
microorganisms.codes
and cleaned it upmo_shortname()
where species would not be determined correctlymicroorganisms.codes
and
+cleaned it upmo_shortname()
where species would not be
+determined correctlyeucast_rules()
with verbose = TRUE
+eucast_rules()
with
+verbose = TRUE
New website!
-We’ve got a new website: https://msberends.gitlab.io/AMR (built with the great pkgdown
)
We’ve got a new website: https://msberends.gitlab.io/AMR
+(built with the great pkgdown
)
BREAKING: removed deprecated functions, arguments and references to ‘bactid’. Use as.mo()
to identify an MO code.
BREAKING: removed deprecated functions,
+arguments and references to ‘bactid’. Use as.mo()
to
+identify an MO code.
Catalogue of Life as a new taxonomic source for data about microorganisms, which also contains all ITIS data we used previously. The microorganisms
data set now contains:
All ~55,000 (sub)species from the kingdoms of Archaea, Bacteria and Protozoa
All ~3,000 (sub)species from these orders of the kingdom of Fungi: Eurotiales, Onygenales, Pneumocystales, Saccharomycetales and Schizosaccharomycetales (covering at least like all species of Aspergillus, Candida, Pneumocystis, Saccharomyces and Trichophyton)
All ~2,000 (sub)species from ~100 other relevant genera, from the kingdoms of Animalia and Plantae (like Strongyloides and Taenia)
All ~15,000 previously accepted names of included (sub)species that have been taxonomically renamed
Catalogue of Life as a new taxonomic source for data about
+microorganisms, which also contains all ITIS data we used previously.
+The microorganisms
data set now contains:
All ~55,000 (sub)species from the kingdoms of Archaea, Bacteria +and Protozoa
All ~3,000 (sub)species from these orders of the kingdom of +Fungi: Eurotiales, Onygenales, Pneumocystales, Saccharomycetales and +Schizosaccharomycetales (covering at least like all species of +Aspergillus, Candida, Pneumocystis, +Saccharomyces and Trichophyton)
All ~2,000 (sub)species from ~100 other relevant genera, from the +kingdoms of Animalia and Plantae (like Strongyloides and +Taenia)
All ~15,000 previously accepted names of included (sub)species +that have been taxonomically renamed
The responsible author(s) and year of scientific publication
-This data is updated annually - check the included version with the new function catalogue_of_life_version()
.
This data is updated annually - check the included version with the
+new function catalogue_of_life_version()
.
Due to this change, some mo
codes changed (e.g. Streptococcus changed from B_STRPTC
to B_STRPT
). A translation table is used internally to support older microorganism IDs, so users will not notice this difference.
New function mo_rank()
for the taxonomic rank (genus, species, infraspecies, etc.)
New function mo_url()
to get the direct URL of a species from the Catalogue of Life
Due to this change, some mo
codes changed
+(e.g. Streptococcus changed from B_STRPTC
to
+B_STRPT
). A translation table is used internally to support
+older microorganism IDs, so users will not notice this
+difference.
New function mo_rank()
for the taxonomic rank
+(genus, species, infraspecies, etc.)
New function mo_url()
to get the direct URL of a
+species from the Catalogue of Life
Support for data from WHONET and EARS-Net (European Antimicrobial Resistance Surveillance Network):
-first_isolate()
and eucast_rules()
, all arguments will be filled in automatically.antibiotics
data set now contains a column ears_net
.as.mo()
now knows all WHONET species abbreviations too, because almost 2,000 microbial abbreviations were added to the microorganisms.codes
data set.Support for data from WHONET +and EARS-Net +(European Antimicrobial Resistance Surveillance Network):
+first_isolate()
and
+eucast_rules()
, all arguments will be filled in
+automatically.antibiotics
+data set now contains a column ears_net
.as.mo()
now knows all WHONET species
+abbreviations too, because almost 2,000 microbial abbreviations were
+added to the microorganisms.codes
data set.New filters for antimicrobial classes. Use these functions to filter isolates on results in one of more antibiotics from a specific class:
+New filters for antimicrobial classes. Use these functions to +filter isolates on results in one of more antibiotics from a specific +class:
filter_aminoglycosides()
@@ -1342,7 +2212,10 @@ This works for all drug combinations, such as ampicillin/sulbactam, ceftazidime/
filter_glycopeptides()
filter_macrolides()
filter_tetracyclines()
The antibiotics
data set will be searched, after which the input data will be checked for column names with a value in any abbreviations, codes or official names found in the antibiotics
data set. For example:
The antibiotics
data set will be searched, after which
+the input data will be checked for column names with a value in any
+abbreviations, codes or official names found in the
+antibiotics
data set. For example:
septic_patients %>% filter_glycopeptides(result = "R")
@@ -1351,7 +2224,8 @@ This works for all drug combinations, such as ampicillin/sulbactam, ceftazidime/
# Filtering on glycopeptide antibacterials: all of `vanc` and `teic` is R
All ab_*
functions are deprecated and replaced by atc_*
functions:
All ab_*
functions are deprecated and replaced by
+atc_*
functions:
ab_property -> atc_property()
@@ -1361,18 +2235,42 @@ This works for all drug combinations, such as ampicillin/sulbactam, ceftazidime/
ab_certe -> atc_certe()
ab_umcg -> atc_umcg()
ab_tradenames -> atc_tradenames()
These functions use as.atc()
internally. The old atc_property
has been renamed atc_online_property()
. This is done for two reasons: firstly, not all ATC codes are of antibiotics (ab) but can also be of antivirals or antifungals. Secondly, the input must have class atc
or must be coerable to this class. Properties of these classes should start with the same class name, analogous to as.mo()
and e.g. mo_genus
.
These functions use as.atc()
internally. The old
+atc_property
has been renamed
+atc_online_property()
. This is done for two reasons:
+firstly, not all ATC codes are of antibiotics (ab) but can also be of
+antivirals or antifungals. Secondly, the input must have class
+atc
or must be coerable to this class. Properties of these
+classes should start with the same class name, analogous to
+as.mo()
and e.g. mo_genus
.
New functions set_mo_source()
and get_mo_source()
to use your own predefined MO codes as input for as.mo()
and consequently all mo_*
functions
Support for the upcoming dplyr
version 0.8.0
New function guess_ab_col()
to find an antibiotic column in a table
New function mo_failures()
to review values that could not be coerced to a valid MO code, using as.mo()
. This latter function will now only show a maximum of 10 uncoerced values and will refer to mo_failures()
.
New function mo_uncertainties()
to review values that could be coerced to a valid MO code using as.mo()
, but with uncertainty.
New function mo_renamed()
to get a list of all returned values from as.mo()
that have had taxonomic renaming
New function age()
to calculate the (patients) age in years
New function age_groups()
to split ages into custom or predefined groups (like children or elderly). This allows for easier demographic AMR data analysis per age group.
New functions set_mo_source()
and
+get_mo_source()
to use your own predefined MO codes as
+input for as.mo()
and consequently all mo_*
+functions
Support for the upcoming dplyr
version
+0.8.0
New function guess_ab_col()
to find an antibiotic
+column in a table
New function mo_failures()
to review values that
+could not be coerced to a valid MO code, using as.mo()
.
+This latter function will now only show a maximum of 10 uncoerced values
+and will refer to mo_failures()
.
New function mo_uncertainties()
to review values
+that could be coerced to a valid MO code using as.mo()
, but
+with uncertainty.
New function mo_renamed()
to get a list of all
+returned values from as.mo()
that have had taxonomic
+renaming
New function age()
to calculate the (patients) age
+in years
New function age_groups()
to split ages into custom
+or predefined groups (like children or elderly). This allows for easier
+demographic AMR data analysis per age group.
New function ggplot_rsi_predict()
as well as the base R plot()
function can now be used for resistance prediction calculated with resistance_predict()
:
New function ggplot_rsi_predict()
as well as the
+base R plot()
function can now be used for resistance
+prediction calculated with resistance_predict()
:
x <- resistance_predict(septic_patients, col_ab = "amox")
@@ -1380,7 +2278,9 @@ This works for all drug combinations, such as ampicillin/sulbactam, ceftazidime/
ggplot_rsi_predict(x)
Functions filter_first_isolate()
and filter_first_weighted_isolate()
to shorten and fasten filtering on data sets with antimicrobial results, e.g.:
Functions filter_first_isolate()
and
+filter_first_weighted_isolate()
to shorten and fasten
+filtering on data sets with antimicrobial results, e.g.:
septic_patients %>% filter_first_isolate(...)
@@ -1394,26 +2294,50 @@ This works for all drug combinations, such as ampicillin/sulbactam, ceftazidime/
filter(only_firsts == TRUE) %>%
select(-only_firsts)
New function availability()
to check the number of available (non-empty) results in a data.frame
New vignettes about how to conduct AMR analysis, predict antimicrobial resistance, use the G-test and more. These are also available (and even easier readable) on our website: https://msberends.gitlab.io/AMR.
New function availability()
to check the number of
+available (non-empty) results in a data.frame
New vignettes about how to conduct AMR analysis, predict +antimicrobial resistance, use the G-test and more. These are +also available (and even easier readable) on our website: https://msberends.gitlab.io/AMR.
eucast_rules()
:
-septic_patients
now reflects these changeseucast_rules(..., verbose = TRUE)
to get a data set with all changed per bug and drug combination.septic_patients
now reflects
+these changeseucast_rules(..., verbose = TRUE)
to get a data set with
+all changed per bug and drug combination.microorganisms.oldDT
, microorganisms.prevDT
, microorganisms.unprevDT
and microorganismsDT
since they were no longer needed and only contained info already available in the microorganisms
data setantibiotics
data set, from the Pharmaceuticals Community Register of the European Commissionatc_group1_nl
and atc_group2_nl
from the antibiotics
data setatc_ddd()
and atc_groups()
have been renamed atc_online_ddd()
and atc_online_groups()
. The old functions are deprecated and will be removed in a future version.guess_mo()
is now deprecated in favour of as.mo()
and will be removed in future versionsguess_atc()
is now deprecated in favour of as.atc()
and will be removed in future versionsmicroorganisms.oldDT
,
+microorganisms.prevDT
, microorganisms.unprevDT
+and microorganismsDT
since they were no longer needed and
+only contained info already available in the microorganisms
+data setantibiotics
data set, from
+the Pharmaceuticals
+Community Register of the European Commissionatc_group1_nl
and
+atc_group2_nl
from the antibiotics
data
+setatc_ddd()
and atc_groups()
have
+been renamed atc_online_ddd()
and
+atc_online_groups()
. The old functions are deprecated and
+will be removed in a future version.guess_mo()
is now deprecated in favour of
+as.mo()
and will be removed in future versionsguess_atc()
is now deprecated in favour of
+as.atc()
and will be removed in future versionsas.mo()
:
Now handles incorrect spelling, like i
instead of y
and f
instead of ph
:
Now handles incorrect spelling, like i
instead of
+y
and f
instead of ph
:
# mo_fullname() uses as.mo() internally
@@ -1425,7 +2349,10 @@ This works for all drug combinations, such as ampicillin/sulbactam, ceftazidime/
#> [1] "Staphylococcus kloosii"
Uncertainty of the algorithm is now divided into four levels, 0 to 3, where the default allow_uncertain = TRUE
is equal to uncertainty level 2. Run ?as.mo
for more info about these levels.
Uncertainty of the algorithm is now divided into four levels, 0
+to 3, where the default allow_uncertain = TRUE
is equal to
+uncertainty level 2. Run ?as.mo
for more info about these
+levels.
# equal:
@@ -1435,84 +2362,135 @@ This works for all drug combinations, such as ampicillin/sulbactam, ceftazidime/
# also equal:
as.mo(..., allow_uncertain = FALSE)
as.mo(..., allow_uncertain = 0)
Using as.mo(..., allow_uncertain = 3)
could lead to very unreliable results.
Using as.mo(..., allow_uncertain = 3)
could lead to very
+unreliable results.
Implemented the latest publication of Becker et al. (2019), for categorising coagulase-negative Staphylococci
All microbial IDs that found are now saved to a local file ~/.Rhistory_mo
. Use the new function clean_mo_history()
to delete this file, which resets the algorithms.
Incoercible results will now be considered ‘unknown’, MO code UNKNOWN
. On foreign systems, properties of these will be translated to all languages already previously supported: German, Dutch, French, Italian, Spanish and Portuguese.
Implemented the latest publication of Becker et al. +(2019), for categorising coagulase-negative +Staphylococci
All microbial IDs that found are now saved to a local file
+~/.Rhistory_mo
. Use the new function
+clean_mo_history()
to delete this file, which resets the
+algorithms.
Incoercible results will now be considered ‘unknown’, MO code
+UNKNOWN
. On foreign systems, properties of these will be
+translated to all languages already previously supported: German, Dutch,
+French, Italian, Spanish and Portuguese.
Fix for vector containing only empty values
Finds better results when input is in other languages
Better handling for subspecies
Better handling for Salmonellae, especially the ‘city like’ serovars like Salmonella London
Understanding of highly virulent E. coli strains like EIEC, EPEC and STEC
There will be looked for uncertain results at default - these results will be returned with an informative warning
Manual (help page) now contains more info about the algorithms
Progress bar will be shown when it takes more than 3 seconds to get results
Better handling for Salmonellae, especially the ‘city +like’ serovars like Salmonella London
Understanding of highly virulent E. coli strains like +EIEC, EPEC and STEC
There will be looked for uncertain results at default - these +results will be returned with an informative warning
Manual (help page) now contains more info about the +algorithms
Progress bar will be shown when it takes more than 3 seconds to +get results
Support for formatted console text
Console will return the percentage of uncoercable input
first_isolate()
:
-septic_patients
data set this yielded a difference of 0.15% more isolatescol_patientid
), when this argument was left blankcol_keyantibiotics()
), when this argument was left blankoutput_logical
, the function will now always return a logical valuefilter_specimen
to specimen_group
, although using filter_specimen
will still workseptic_patients
data set this yielded a
+difference of 0.15% more isolatescol_patientid
), when this argument was left
+blankcol_keyantibiotics()
),
+when this argument was left blankoutput_logical
, the function will now
+always return a logical valuefilter_specimen
to
+specimen_group
, although using filter_specimen
+will still workportion
functions, that low counts can influence the outcome and that the portion
functions may camouflage this, since they only return the portion (albeit being dependent on the minimum
argument)microorganisms.certe
and microorganisms.umcg
into microorganisms.codes
+portion
functions,
+that low counts can influence the outcome and that the
+portion
functions may camouflage this, since they only
+return the portion (albeit being dependent on the minimum
+argument)microorganisms.certe
and
+microorganisms.umcg
into
+microorganisms.codes
mo_taxonomy()
now contains the kingdom toois.rsi.eligible()
using the new threshold
argumentmo_taxonomy()
now contains the kingdom
+toois.rsi.eligible()
using the
+new threshold
argumentscale_rsi_colours()
mo
will now return the top 3 and the unique count, e.g. using summary(mo)
+mo
will now return the top 3 and the
+unique count, e.g. using summary(mo)
rsi
and mic
+rsi
and
+mic
as.rsi()
:
"HIGH S"
will return S
+"HIGH S"
will
+return S
freq()
function):
+freq()
function):
Support for tidyverse quasiquotation! Now you can create frequency tables of function outcomes:
+Support for tidyverse quasiquotation! Now you can create +frequency tables of function outcomes:
# Determine genus of microorganisms (mo) in `septic_patients` data set:
# OLD WAY
septic_patients %>%
mutate(genus = mo_genus(mo)) %>%
- freq(genus)
+ freq(genus)
# NEW WAY
septic_patients %>%
- freq(mo_genus(mo))
+ freq(mo_genus(mo))
# Even supports grouping variables:
septic_patients %>%
group_by(gender) %>%
- freq(mo_genus(mo))
Header info is now available as a list, with the header
function
The argument header
is now set to TRUE
at default, even for markdown
Added header info for class mo
to show unique count of families, genera and species
Now honours the decimal.mark
setting, which just like format
defaults to getOption("OutDec")
The new big.mark
argument will at default be ","
when decimal.mark = "."
and "."
otherwise
Fix for header text where all observations are NA
New argument droplevels
to exclude empty factor levels when input is a factor
Factor levels will be in header when present in input data (maximum of 5)
Header info is now available as a list, with the
+header
function
The argument header
is now set to TRUE
+at default, even for markdown
Added header info for class mo
to show unique count
+of families, genera and species
Now honours the decimal.mark
setting, which just
+like format
defaults to
+getOption("OutDec")
The new big.mark
argument will at default be
+","
when decimal.mark = "."
and
+"."
otherwise
Fix for header text where all observations are
+NA
New argument droplevels
to exclude empty factor
+levels when input is a factor
Factor levels will be in header when present in input data +(maximum of 5)
Fix for using select()
on frequency tables
scale_y_percent()
now contains the limits
argumentmdro()
, key_antibiotics()
and eucast_rules()
+scale_y_percent()
now contains the
+limits
argumentmdro()
,
+key_antibiotics()
and eucast_rules()
resistance_predict()
function)as.mic()
to support more values ending in (several) zeroes%like%
, it will now return the callresistance_predict()
function)as.mic()
to support more values ending in
+(several) zeroes%like%
,
+it will now return the callcount_all
to get all available isolates (that like all portion_*
and count_*
functions also supports summarise
and group_by
), the old n_rsi
is now an alias of count_all
+count_all
to get all available isolates (that
+like all portion_*
and count_*
functions also
+supports summarise
and group_by
), the old
+n_rsi
is now an alias of count_all
get_locale
to determine language for language-dependent output for some mo_*
functions. This is now the default value for their language
argument, by which the system language will be used at default.microorganismsDT
, microorganisms.prevDT
, microorganisms.unprevDT
and microorganisms.oldDT
to improve the speed of as.mo
. They are for reference only, since they are primarily for internal use of as.mo
.read.4D
to read from the 4D database of the MMB department of the UMCGmo_authors
and mo_year
to get specific values about the scientific reference of a taxonomic entryget_locale
to determine language for
+language-dependent output for some mo_*
functions. This is
+now the default value for their language
argument, by which
+the system language will be used at default.microorganismsDT
,
+microorganisms.prevDT
, microorganisms.unprevDT
+and microorganisms.oldDT
to improve the speed of
+as.mo
. They are for reference only, since they are
+primarily for internal use of as.mo
.read.4D
to read from the 4D database of the
+MMB department of the UMCGmo_authors
and mo_year
to get
+specific values about the scientific reference of a taxonomic entryFunctions MDRO
, BRMO
, MRGN
and EUCAST_exceptional_phenotypes
were renamed to mdro
, brmo
, mrgn
and eucast_exceptional_phenotypes
EUCAST_rules
was renamed to eucast_rules
, the old function still exists as a deprecated function
Functions MDRO
, BRMO
, MRGN
+and EUCAST_exceptional_phenotypes
were renamed to
+mdro
, brmo
, mrgn
and
+eucast_exceptional_phenotypes
EUCAST_rules
was renamed to
+eucast_rules
, the old function still exists as a deprecated
+function
Big changes to the eucast_rules
function:
rules
to specify which rules should be applied (expert rules, breakpoints, others or all)verbose
which can be set to TRUE
to get very specific messages about which columns and rows were affectedseptic_patients
now reflects these changespipe
for piperacillin (J01CA12), also to the mdro
functionrules
to specify which rules should be
+applied (expert rules, breakpoints, others or all)verbose
which can be set to
+TRUE
to get very specific messages about which columns and
+rows were affectedseptic_patients
now reflects these
+changespipe
for piperacillin (J01CA12), also to
+the mdro
functionAdded column kingdom
to the microorganisms data set, and function mo_kingdom
to look up values
Tremendous speed improvement for as.mo
(and subsequently all mo_*
functions), as empty values wil be ignored a priori
Fewer than 3 characters as input for as.mo
will return NA
Added column kingdom
to the microorganisms data set,
+and function mo_kingdom
to look up values
Tremendous speed improvement for as.mo
(and
+subsequently all mo_*
functions), as empty values wil be
+ignored a priori
Fewer than 3 characters as input for as.mo
will
+return NA
Function as.mo
(and all mo_*
wrappers) now supports genus abbreviations with “species” attached
Function as.mo
(and all mo_*
wrappers)
+now supports genus abbreviations with “species” attached
as.mo("E. species") # B_ESCHR
@@ -1554,45 +2563,69 @@ This works for all drug combinations, such as ampicillin/sulbactam, ceftazidime/
as.mo("S. spp") # B_STPHY
mo_fullname("S. species") # "Staphylococcus species"
Added argument combine_IR
(TRUE/FALSE) to functions portion_df
and count_df
, to indicate that all values of I and R must be merged into one, so the output only consists of S vs. IR (susceptible vs. non-susceptible)
Fix for portion_*(..., as_percent = TRUE)
when minimal number of isolates would not be met
Added argument also_single_tested
for portion_*
and count_*
functions to also include cases where not all antibiotics were tested but at least one of the tested antibiotics includes the target antimicribial interpretation, see ?portion
Using portion_*
functions now throws a warning when total available isolate is below argument minimum
Functions as.mo
, as.rsi
, as.mic
, as.atc
and freq
will not set package name as attribute anymore
Added argument combine_IR
(TRUE/FALSE) to functions
+portion_df
and count_df
, to indicate that all
+values of I and R must be merged into one, so the output only consists
+of S vs. IR (susceptible vs. non-susceptible)
Fix for portion_*(..., as_percent = TRUE)
when
+minimal number of isolates would not be met
Added argument also_single_tested
for
+portion_*
and count_*
functions to also
+include cases where not all antibiotics were tested but at least one of
+the tested antibiotics includes the target antimicribial interpretation,
+see ?portion
Using portion_*
functions now throws a warning when
+total available isolate is below argument minimum
Functions as.mo
, as.rsi
,
+as.mic
, as.atc
and freq
will not
+set package name as attribute anymore
Frequency tables - freq()
:
Frequency tables - freq()
:
Support for grouping variables, test with:
+ freq(gender)Support for (un)selecting columns:
Check for hms::is.hms
Now prints in markdown at default in non-interactive sessions
No longer adds the factor level column and sorts factors on count again
Now prints in markdown at default in non-interactive +sessions
No longer adds the factor level column and sorts factors on count +again
Support for class difftime
New argument na
, to choose which character to print for empty values
New argument header
to turn the header info off (default when markdown = TRUE
)
New argument title
to manually setbthe title of the frequency table
New argument na
, to choose which character to print
+for empty values
New argument header
to turn the header info off
+(default when markdown = TRUE
)
New argument title
to manually setbthe title of the
+frequency table
first_isolate
now tries to find columns to use as input when arguments are left blank
Improvements for MDRO algorithm (function mdro
)
Data set septic_patients
is now a data.frame
, not a tibble anymore
Removed diacritics from all authors (columns microorganisms$ref
and microorganisms.old$ref
) to comply with CRAN policy to only allow ASCII characters
first_isolate
now tries to find columns to use as
+input when arguments are left blank
Improvements for MDRO algorithm (function
+mdro
)
Data set septic_patients
is now a
+data.frame
, not a tibble anymore
Removed diacritics from all authors (columns
+microorganisms$ref
and microorganisms.old$ref
)
+to comply with CRAN policy to only allow ASCII characters
Fix for mo_property
not working properly
Fix for eucast_rules
where some Streptococci would become ceftazidime R in EUCAST rule 4.5
Support for named vectors of class mo
, useful for top_freq()
ggplot_rsi
and scale_y_percent
have breaks
argument
Fix for eucast_rules
where some Streptococci would
+become ceftazidime R in EUCAST rule 4.5
Support for named vectors of class mo
, useful for
+top_freq()
ggplot_rsi
and scale_y_percent
have
+breaks
argument
AI improvements for as.mo
:
Fix for join
functions
Speed improvement for is.rsi.eligible
, now 15-20 times faster
In g.test
, when sum(x)
is below 1000 or any of the expected values is below 5, Fisher’s Exact Test will be suggested
ab_name
will try to fall back on as.atc
when no results are found
Speed improvement for is.rsi.eligible
, now 15-20
+times faster
In g.test
, when sum(x)
is below 1000 or
+any of the expected values is below 5, Fisher’s Exact Test will be
+suggested
ab_name
will try to fall back on as.atc
+when no results are found
Removed the addin to view data sets
Percentages will now will rounded more logically (e.g. in freq
function)
Percentages will now will rounded more logically (e.g. in
+freq
function)
crayon
, to support formatted text in the consoletidyr
is now mandatory (went to Import
field) since portion_df
and count_df
rely on itcrayon
, to support formatted
+text in the consoletidyr
is now mandatory (went to
+Import
field) since portion_df
and
+count_df
rely on itThe data set microorganisms
now contains all microbial taxonomic data from ITIS (kingdoms Bacteria, Fungi and Protozoa), the Integrated Taxonomy Information System, available via https://itis.gov. The data set now contains more than 18,000 microorganisms with all known bacteria, fungi and protozoa according ITIS with genus, species, subspecies, family, order, class, phylum and subkingdom. The new data set microorganisms.old
contains all previously known taxonomic names from those kingdoms.
The data set microorganisms
now contains all
+microbial taxonomic data from ITIS (kingdoms Bacteria, Fungi
+and Protozoa), the Integrated Taxonomy Information System, available via
+https://itis.gov. The data
+set now contains more than 18,000 microorganisms with all known
+bacteria, fungi and protozoa according ITIS with genus, species,
+subspecies, family, order, class, phylum and subkingdom. The new data
+set microorganisms.old
contains all previously known
+taxonomic names from those kingdoms.
New functions based on the existing function mo_property
:
mo_phylum
, mo_class
, mo_order
, mo_family
, mo_genus
, mo_species
, mo_subspecies
+New functions based on the existing function
+mo_property
:
mo_phylum
, mo_class
,
+mo_order
, mo_family
, mo_genus
,
+mo_species
, mo_subspecies
mo_fullname
, mo_shortname
+mo_fullname
,
+mo_shortname
mo_type
, mo_gramstain
+mo_type
,
+mo_gramstain
mo_ref
They also come with support for German, Dutch, French, Italian, Spanish and Portuguese:
+They also come with support for German, Dutch, French, Italian, +Spanish and Portuguese:
mo_gramstain("E. coli")
@@ -1648,7 +2703,8 @@ This works for all drug combinations, such as ampicillin/sulbactam, ceftazidime/
# [1] "Gram negativo"
mo_fullname("S. group A", language = "pt") # Portuguese
# [1] "Streptococcus grupo A"
Furthermore, former taxonomic names will give a note about the current taxonomic name:
+Furthermore, former taxonomic names will give a note about the +current taxonomic name:
mo_gramstain("Esc blattae")
@@ -1656,12 +2712,24 @@ This works for all drug combinations, such as ampicillin/sulbactam, ceftazidime/
# [1] "Gram negative"
Functions count_R
, count_IR
, count_I
, count_SI
and count_S
to selectively count resistant or susceptible isolates
count_df
(which works like portion_df
) to get all counts of S, I and R of a data set with antibiotic columns, with support for grouped variablesFunctions count_R
, count_IR
,
+count_I
, count_SI
and count_S
to
+selectively count resistant or susceptible isolates
count_df
(which works like
+portion_df
) to get all counts of S, I and R of a data set
+with antibiotic columns, with support for grouped variablesFunction is.rsi.eligible
to check for columns that have valid antimicrobial results, but do not have the rsi
class yet. Transform the columns of your raw data with: data %>% mutate_if(is.rsi.eligible, as.rsi)
Function is.rsi.eligible
to check for columns that
+have valid antimicrobial results, but do not have the rsi
+class yet. Transform the columns of your raw data with:
+data %>% mutate_if(is.rsi.eligible, as.rsi)
Functions as.mo
and is.mo
as replacements for as.bactid
and is.bactid
(since the microoganisms
data set not only contains bacteria). These last two functions are deprecated and will be removed in a future release. The as.mo
function determines microbial IDs using intelligent rules:
Functions as.mo
and is.mo
as
+replacements for as.bactid
and is.bactid
+(since the microoganisms
data set not only contains
+bacteria). These last two functions are deprecated and will be removed
+in a future release. The as.mo
function determines
+microbial IDs using intelligent rules:
as.mo("E. coli")
@@ -1670,7 +2738,8 @@ This works for all drug combinations, such as ampicillin/sulbactam, ceftazidime/
# [1] B_STPHY_AUR
as.mo("S group A")
# [1] B_STRPTC_GRA
And with great speed too - on a quite regular Linux server from 2007 it takes us less than 0.02 seconds to transform 25,000 items:
+And with great speed too - on a quite regular Linux server from 2007 +it takes us less than 0.02 seconds to transform 25,000 items:
thousands_of_E_colis <- rep("E. coli", 25000)
@@ -1679,27 +2748,44 @@ This works for all drug combinations, such as ampicillin/sulbactam, ceftazidime/
# min median max neval
# 0.01817717 0.01843957 0.03878077 100
Added argument reference_df
for as.mo
, so users can supply their own microbial IDs, name or codes as a reference table
Added argument reference_df
for as.mo
,
+so users can supply their own microbial IDs, name or codes as a
+reference table
Renamed all previous references to bactid
to mo
, like:
EUCAST_rules
, first_isolate
and key_antibiotics
+Renamed all previous references to bactid
to
+mo
, like:
EUCAST_rules
,
+first_isolate
and key_antibiotics
microorganisms
and septic_patients
+microorganisms
and
+septic_patients
Function labels_rsi_count
to print datalabels on a RSI ggplot2
model
Functions as.atc
and is.atc
to transform/look up antibiotic ATC codes as defined by the WHO. The existing function guess_atc
is now an alias of as.atc
.
Function ab_property
and its aliases: ab_name
, ab_tradenames
, ab_certe
, ab_umcg
and ab_trivial_nl
Function labels_rsi_count
to print datalabels on a
+RSI ggplot2
model
Functions as.atc
and is.atc
to
+transform/look up antibiotic ATC codes as defined by the WHO. The
+existing function guess_atc
is now an alias of
+as.atc
.
Function ab_property
and its aliases:
+ab_name
, ab_tradenames
, ab_certe
,
+ab_umcg
and ab_trivial_nl
Introduction to AMR as a vignette
Removed clipboard functions as it violated the CRAN policy
Renamed septic_patients$sex
to septic_patients$gender
Removed clipboard functions as it violated the CRAN +policy
Renamed septic_patients$sex
to
+septic_patients$gender
Added three antimicrobial agents to the antibiotics
data set: Terbinafine (D01BA02), Rifaximin (A07AA11) and Isoconazole (D01AC05)
Added three antimicrobial agents to the antibiotics
+data set: Terbinafine (D01BA02), Rifaximin (A07AA11) and Isoconazole
+(D01AC05)
Added 163 trade names to the antibiotics
data set, it now contains 298 different trade names in total, e.g.:
Added 163 trade names to the antibiotics
data set,
+it now contains 298 different trade names in total, e.g.:
For first_isolate
, rows will be ignored when there’s no species available
Function ratio
is now deprecated and will be removed in a future release, as it is not really the scope of this package
Fix for as.mic
for values ending in zeroes after a real number
Small fix where B. fragilis would not be found in the microorganisms.umcg
data set
Added prevalence
column to the microorganisms
data set
Added arguments minimum
and as_percent
to portion_df
For first_isolate
, rows will be ignored when there’s
+no species available
Function ratio
is now deprecated and will be removed
+in a future release, as it is not really the scope of this
+package
Fix for as.mic
for values ending in zeroes after a
+real number
Small fix where B. fragilis would not be found in the
+microorganisms.umcg
data set
Added prevalence
column to the
+microorganisms
data set
Added arguments minimum
and as_percent
+to portion_df
Support for quasiquotation in the functions series count_*
and portions_*
, and n_rsi
. This allows to check for more than 2 vectors or columns.
Support for quasiquotation in the functions series
+count_*
and portions_*
, and
+n_rsi
. This allows to check for more than 2 vectors or
+columns.
Edited ggplot_rsi
and geom_rsi
so they can cope with count_df
. The new fun
argument has value portion_df
at default, but can be set to count_df
.
Fix for ggplot_rsi
when the ggplot2
package was not loaded
Added datalabels function labels_rsi_count
to ggplot_rsi
Added possibility to set any argument to geom_rsi
(and ggplot_rsi
) so you can set your own preferences
Fix for joins, where predefined suffices would not be honoured
Added argument quote
to the freq
function
Added generic function diff
for frequency tables
Added longest en shortest character length in the frequency table (freq
) header of class character
Edited ggplot_rsi
and geom_rsi
so they
+can cope with count_df
. The new fun
argument
+has value portion_df
at default, but can be set to
+count_df
.
Fix for ggplot_rsi
when the ggplot2
+package was not loaded
Added datalabels function labels_rsi_count
to
+ggplot_rsi
Added possibility to set any argument to geom_rsi
+(and ggplot_rsi
) so you can set your own
+preferences
Fix for joins, where predefined suffices would not be +honoured
Added argument quote
to the freq
+function
Added generic function diff
for frequency
+tables
Added longest en shortest character length in the frequency table
+(freq
) header of class character
Support for types (classes) list and matrix for freq
Support for types (classes) list and matrix for
+freq
For lists, subsetting is possible:
my_list = list(age = septic_patients$age, gender = septic_patients$gender)
-my_list %>% freq(age)
-my_list %>% freq(gender)
rsi_df
was removed in favour of new functions portion_R
, portion_IR
, portion_I
, portion_SI
and portion_S
to selectively calculate resistance or susceptibility. These functions are 20 to 30 times faster than the old rsi
function. The old function still works, but is deprecated.
-portion_df
to get all portions of S, I and R of a data set with antibiotic columns, with support for grouped variablesrsi_df
was removed in favour
+of new functions portion_R
, portion_IR
,
+portion_I
, portion_SI
and
+portion_S
to selectively calculate resistance or
+susceptibility. These functions are 20 to 30 times faster than the old
+rsi
function. The old function still works, but is
+deprecated.
+portion_df
to get all portions of S, I and
+R of a data set with antibiotic columns, with support for grouped
+variablesggplot2
-geom_rsi
, facet_rsi
, scale_y_percent
, scale_rsi_colours
and theme_rsi
+geom_rsi
, facet_rsi
,
+scale_y_percent
, scale_rsi_colours
and
+theme_rsi
ggplot_rsi
to apply all above functions on a data set:
+ggplot_rsi
to apply all above
+functions on a data set:
septic_patients %>% select(tobr, gent) %>% ggplot_rsi
will show portions of S, I and R immediately in a pretty plotseptic_patients %>% select(tobr, gent) %>% ggplot_rsi
+will show portions of S, I and R immediately in a pretty plot?ggplot_rsi
as.bactid
and is.bactid
to transform/ look up microbial ID’s.guess_bactid
is now an alias of as.bactid
+as.bactid
and is.bactid
to
+transform/ look up microbial ID’s.guess_bactid
is now an alias of
+as.bactid
kurtosis
and skewness
that are lacking in base R - they are generic functions and have support for vectors, data.frames and matricesg.test
to perform the X2 distributed G-test, which use is the same as chisq.test
+kurtosis
and skewness
that are lacking in base
+R - they are generic functions and have support for vectors, data.frames
+and matricesg.test
to perform the X2
+distributed G-test, which
+use is the same as chisq.test
ratio
to transform a vector of values to a preset ratioratio(c(10, 500, 10), ratio = "1:2:1")
would return 130, 260, 130
ratio
to transform a vector of values to
+a preset ratioratio(c(10, 500, 10), ratio = "1:2:1")
would return
+130, 260, 130
%in%
or %like%
(and give them keyboard shortcuts), or to view the datasets that come with this packagep.symbol
to transform p values to their related symbols: 0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
+%in%
or %like%
(and give them keyboard
+shortcuts), or to view the datasets that come with this packagep.symbol
to transform p values to their
+related symbols:
+0 '***' 0.001 '**' 0.01 '*' 0.05 '.' 0.1 ' ' 1
clipboard_import
and clipboard_export
as helper functions to quickly copy and paste from/to software like Excel and SPSS. These functions use the clipr
package, but are a little altered to also support headless Linux servers (so you can use it in RStudio Server)clipboard_import
and
+clipboard_export
as helper functions to quickly copy and
+paste from/to software like Excel and SPSS. These functions use the
+clipr
package, but are a little altered to also support
+headless Linux servers (so you can use it in RStudio Server)freq
):
rsi
(antimicrobial resistance) to use as inputtable
to use as input: freq(table(x, y))
+rsi
(antimicrobial resistance) to use as
+inputtable
to use as input:
+freq(table(x, y))
hist
and plot
to use a frequency table as input: hist(freq(df$age))
+hist
and
+plot
to use a frequency table as input:
+hist(freq(df$age))
as.vector
, as.data.frame
, as_tibble
and format
+as.vector
, as.data.frame
,
+as_tibble
and format
freq(mydata, mycolumn)
is the same as mydata %>% freq(mycolumn)
+freq(mydata, mycolumn)
is
+the same as mydata %>% freq(mycolumn)
top_freq
function to return the top/below n items as vectoroptions(max.print.freq = n)
where n is your preset valuetop_freq
function to return the top/below
+n items as vectoroptions(max.print.freq = n)
where n is
+your preset valueresistance_predict
and added more examplesresistance_predict
+and added more examplesseptic_patients
data set to better reflect the realitymic
and rsi
classes now returns all values - use freq
to check distributionskey_antibiotics
function are now generic: 6 for broadspectrum ABs, 6 for Gram-positive specific and 6 for Gram-negative specific ABsseptic_patients
data set to
+better reflect the realitymic
and rsi
classes now
+returns all values - use freq
to check distributionskey_antibiotics
function are now
+generic: 6 for broadspectrum ABs, 6 for Gram-positive specific and 6 for
+Gram-negative specific ABsabname
function%like%
now supports multiple patternsdata.frame
s with altered console printing to make it look like a frequency table. Because of this, the argument toConsole
is not longer needed.freq
where the class of an item would be lostseptic_patients
dataset and the column bactid
now has the new class "bactid"
+data.frame
s with
+altered console printing to make it look like a frequency table. Because
+of this, the argument toConsole
is not longer needed.freq
where the class of an item would be
+lostseptic_patients
+dataset and the column bactid
now has the new class
+"bactid"
microorganisms
dataset (especially for Salmonella) and the column bactid
now has the new class "bactid"
+microorganisms
dataset
+(especially for Salmonella) and the column bactid
+now has the new class "bactid"
rsi
and mic
functions:
+rsi
+and mic
functions:
as.rsi("<=0.002; S")
will return S
as.mic("<=0.002; S")
will return <=0.002
+as.mic("<=0.002; S")
will return
+<=0.002
as.mic("<= 0.002")
now worksrsi
and mic
do not add the attribute package.version
anymore"groups"
option for atc_property(..., property)
. It will return a vector of the ATC hierarchy as defined by the WHO. The new function atc_groups
is a convenient wrapper around this.atc_property
as it requires the host set by url
to be responsivefirst_isolate
algorithm to exclude isolates where bacteria ID or genus is unavailable924b62
) from the dplyr
package v0.7.5 and aboveguess_bactid
(now called as.bactid
)
-yourdata %>% select(genus, species) %>% as.bactid()
now also worksas.mic("<= 0.002")
now worksrsi
and mic
do not add the
+attribute package.version
anymore"groups"
option for
+atc_property(..., property)
. It will return a vector of the
+ATC hierarchy as defined by the WHO. The
+new function atc_groups
is a convenient wrapper around
+this.atc_property
as it requires the
+host set by url
to be responsivefirst_isolate
algorithm to exclude isolates
+where bacteria ID or genus is unavailable924b62
)
+from the dplyr
package v0.7.5 and aboveguess_bactid
(now called as.bactid
)
+yourdata %>% select(genus, species) %>% as.bactid()
+now also worksn_rsi
to count cases where antibiotic test results were available, to be used in conjunction with dplyr::summarise
, see ?rsiguess_bactid
to determine the ID of a microorganism based on genus/species or known abbreviations like MRSAguess_atc
to determine the ATC of an antibiotic based on name, trade name, or known abbreviationsfreq
to create frequency tables, with additional info in a headerMDRO
to determine Multi Drug Resistant Organisms (MDRO) with support for country-specific guidelines.
+n_rsi
to count cases where antibiotic test
+results were available, to be used in conjunction with
+dplyr::summarise
, see ?rsiguess_bactid
to determine the
+ID of a microorganism based on genus/species or known
+abbreviations like MRSAguess_atc
to determine the
+ATC of an antibiotic based on name, trade name, or known
+abbreviationsfreq
to create frequency
+tables, with additional info in a headerMDRO
to determine Multi Drug Resistant
+Organisms (MDRO) with support for country-specific guidelines.
BRMO
and MRGN
are wrappers for Dutch and German guidelines, respectivelyBRMO
and MRGN
are wrappers for
+Dutch and German guidelines, respectively"points"
or "keyantibiotics"
, see ?first_isolate
+"points"
or "keyantibiotics"
, see
+?first_isolate
tibble
s and data.table
stibble
s and
+data.table
srsi
class for vectors that contain only invalid antimicrobial interpretationsrsi
class for vectors that contain only invalid
+antimicrobial interpretationsablist
to antibiotics
bactlist
to microorganisms
+bactlist
to
+microorganisms
antibiotics
datasetmicroorganisms
datasetseptic_patients
+antibiotics
datasetmicroorganisms
+datasetseptic_patients
join
functionsjoin
+functions%like%
to make it case insensitivefirst_isolate
and EUCAST_rules
column names are now case-insensitiveas.rsi
and as.mic
now add the package name and version as attributesfirst_isolate
and
+EUCAST_rules
column names are now case-insensitiveas.rsi
and as.mic
now add the
+package name and version as attributesREADME.md
with more examplestestthat
packageEUCAST_rules
applies for amoxicillin even if ampicillin is missingEUCAST_rules
applies for amoxicillin even if ampicillin
+is missing
+rsi
and mic
classesrsi
and mic
+classesWelcome to the AMR
package.
This example data set has the exact same structure as an export file from WHONET. Such files can be used with this package, as this example data set shows. The antibiotic results are from our example_isolates data set. All patient names are created using online surname generators and are only in place for practice purposes.
WHONET
WHONET
as.mo()
to use the data for intel
diff --git a/docs/reference/catalogue_of_life_version.html b/docs/reference/catalogue_of_life_version.html
index 0adbedb7..a06ce87b 100644
--- a/docs/reference/catalogue_of_life_version.html
+++ b/docs/reference/catalogue_of_life_version.html
@@ -17,7 +17,7 @@
@@ -200,11 +200,13 @@ This package contains the complete taxonomic tree of almost all microorganisms (
diff --git a/docs/reference/count.html b/docs/reference/count.html
index d35f444e..9c6a5887 100644
--- a/docs/reference/count.html
+++ b/docs/reference/count.html
@@ -18,7 +18,7 @@ count_resistant() should be used to count resistant isolates, count_susceptible(
diff --git a/docs/reference/custom_eucast_rules.html b/docs/reference/custom_eucast_rules.html
index 8b973fa8..eb4bc8cd 100644
--- a/docs/reference/custom_eucast_rules.html
+++ b/docs/reference/custom_eucast_rules.html
@@ -17,7 +17,7 @@
diff --git a/docs/reference/dosage.html b/docs/reference/dosage.html
index 84972a57..f5a67eff 100644
--- a/docs/reference/dosage.html
+++ b/docs/reference/dosage.html
@@ -17,7 +17,7 @@
@@ -161,7 +161,9 @@
EUCAST breakpoints used in this package are based on the dosages in this data set. They can be retrieved with eucast_dosage()
.
dosage
dosage
A data set containing 2,000 microbial isolates with their full antibiograms. The data set reflects reality and can be used to practice AMR data analysis. For examples, please read the tutorial on our website.
-example_isolates
example_isolates
A data set containing 3,000 microbial isolates that are not cleaned up and consequently not ready for AMR data analysis. This data set can be used for practice.
-example_isolates_unclean
example_isolates_unclean
Data set containing defined intrinsic resistance by EUCAST of all bug-drug combinations.
-intrinsic_resistant
intrinsic_resistant
Data set containing reference data to interpret MIC and disk diffusion to R/SI values, according to international guidelines. Currently implemented guidelines are EUCAST (2011-2021) and CLSI (2010-2021). Use as.rsi()
to transform MICs or disks measurements to R/SI values.
rsi_translation
rsi_translation