mirror of
				https://github.com/msberends/AMR.git
				synced 2025-10-25 07:16:18 +02:00 
			
		
		
		
	documentation
This commit is contained in:
		| @@ -1,6 +1,6 @@ | |||||||
| Package: AMR | Package: AMR | ||||||
| Version: 1.8.2.9086 | Version: 1.8.2.9087 | ||||||
| Date: 2023-01-06 | Date: 2023-01-07 | ||||||
| Title: Antimicrobial Resistance Data Analysis | Title: Antimicrobial Resistance Data Analysis | ||||||
| Description: Functions to simplify and standardise antimicrobial resistance (AMR) | Description: Functions to simplify and standardise antimicrobial resistance (AMR) | ||||||
|   data analysis and to work with microbial and antimicrobial properties by |   data analysis and to work with microbial and antimicrobial properties by | ||||||
|   | |||||||
							
								
								
									
										2
									
								
								NEWS.md
									
									
									
									
									
								
							
							
						
						
									
										2
									
								
								NEWS.md
									
									
									
									
									
								
							| @@ -1,4 +1,4 @@ | |||||||
| # AMR 1.8.2.9086 | # AMR 1.8.2.9087 | ||||||
|  |  | ||||||
| *(this beta version will eventually become v2.0! We're happy to reach a new major milestone soon!)* | *(this beta version will eventually become v2.0! We're happy to reach a new major milestone soon!)* | ||||||
|  |  | ||||||
|   | |||||||
							
								
								
									
										6
									
								
								R/mo.R
									
									
									
									
									
								
							
							
						
						
									
										6
									
								
								R/mo.R
									
									
									
									
									
								
							| @@ -83,7 +83,7 @@ | |||||||
| #' | #' | ||||||
| #' ### Microbial Prevalence of Pathogens in Humans | #' ### Microbial Prevalence of Pathogens in Humans | ||||||
| #' | #' | ||||||
| #' The coercion rules consider the prevalence of microorganisms in humans grouped into three groups, which is available as the `prevalence` columns in the [microorganisms] data set. The grouping into human pathogenic prevalence is explained in the section *Matching Score for Microorganisms* below. | #' The coercion rules consider the prevalence of microorganisms in humans, which is available as the `prevalence` column in the [microorganisms] data set. The grouping into human pathogenic prevalence is explained in the section *Matching Score for Microorganisms* below. | ||||||
| #' @inheritSection mo_matching_score Matching Score for Microorganisms | #' @inheritSection mo_matching_score Matching Score for Microorganisms | ||||||
| #' | #' | ||||||
| #  (source as a section here, so it can be inherited by other man pages) | #  (source as a section here, so it can be inherited by other man pages) | ||||||
| @@ -536,7 +536,7 @@ mo_cleaning_regex <- function() { | |||||||
|     "|", |     "|", | ||||||
|     "([({]|\\[).+([})]|\\])", |     "([({]|\\[).+([})]|\\])", | ||||||
|     "|", |     "|", | ||||||
|     "(^| )(e?spp|e?ssp|e?ss|e?sp|e?subsp|sube?species|biovar|biotype|serovar|serogr.?up|e?species|group|complex)[.]*( |$))" |     "(^| )(e?spp|e?ssp|e?ss|e?sp|e?subsp|sube?species|biovar|biotype|serovar|serogr.?up|e?species)[.]*( |$|(complex|group)$))" | ||||||
|   ) |   ) | ||||||
| } | } | ||||||
|  |  | ||||||
| @@ -786,7 +786,7 @@ print.mo_uncertainties <- function(x, ...) { | |||||||
|     return(invisible(NULL)) |     return(invisible(NULL)) | ||||||
|   } |   } | ||||||
|  |  | ||||||
|   cat(word_wrap("Matching scores are based on the resemblance between the input and the full taxonomic name, and the pathogenicity in humans according to Bartlett ", font_italic("et al."), " (2022). See `?mo_matching_score`.\n\n", add_fn = font_blue)) |   cat(word_wrap("Matching scores are based on the resemblance between the input and the full taxonomic name, and the pathogenicity in humans. See `?mo_matching_score`.\n\n", add_fn = font_blue)) | ||||||
|   if (has_colour()) { |   if (has_colour()) { | ||||||
|     cat(word_wrap("Colour keys: ", |     cat(word_wrap("Colour keys: ", | ||||||
|       font_red_bg(" 0.000-0.499 "), |       font_red_bg(" 0.000-0.499 "), | ||||||
|   | |||||||
| @@ -44,13 +44,14 @@ | |||||||
| #' where: | #' where: | ||||||
| #' | #' | ||||||
| #' * \eqn{x} is the user input; | #' * \eqn{x} is the user input; | ||||||
| #' * \ifelse{html}{\out{<i>n</i> is a taxonomic name (genus, species, and subspecies);}}{\eqn{n} is a taxonomic name (genus, species, and subspecies);} | #' * \eqn{n} is a taxonomic name (genus, species, and subspecies); | ||||||
| #' * \ifelse{html}{\out{<i>l<sub>n</sub></i> is the length of <i>n</i>;}}{l_n is the length of \eqn{n};} | #' * \eqn{l_n} is the length of \eqn{n}; | ||||||
| #' * \ifelse{html}{\out{<i>lev</i> is the <a href="https://en.wikipedia.org/wiki/Levenshtein_distance">Levenshtein distance function</a> (counting any insertion as 1, and any deletion or substitution as 2) that is needed to change <i>x</i> into <i>n</i>;}}{lev is the Levenshtein distance function (counting any insertion as 1, and any deletion or substitution as 2) that is needed to change \eqn{x} into \eqn{n};} | #' * \ifelse{html}{\out{<i>lev</i> is the  | ||||||
| #' * \ifelse{html}{\out{<i>p<sub>n</sub></i> is the human pathogenic prevalence group of <i>n</i>, as described below;}}{p_n is the human pathogenic prevalence group of \eqn{n}, as described below;} | #' * \eqn{lev} is the [Levenshtein distance function](https://en.wikipedia.org/wiki/Levenshtein_distance) (counting any insertion as 1, and any deletion or substitution as 2) that is needed to change \eqn{x} into \eqn{n}; | ||||||
| #' * \ifelse{html}{\out{<i>k<sub>n</sub></i> is the taxonomic kingdom of <i>n</i>, set as Bacteria = 1, Fungi = 2, Protozoa = 3, Archaea = 4, others = 5.}}{l_n is the taxonomic kingdom of \eqn{n}, set as Bacteria = 1, Fungi = 2, Protozoa = 3, Archaea = 4, others = 5.} | #' * \eqn{p_{n}} is the human pathogenic prevalence group of \eqn{n}, as described below; | ||||||
|  | #' * \eqn{k_n} is the taxonomic kingdom of \eqn{n}, set as Bacteria = 1, Fungi = 2, Protozoa = 3, Archaea = 4, others = 5. | ||||||
| #' | #' | ||||||
| #' The grouping into human pathogenic prevalence (\eqn{p}) is based on recent work from Bartlett *et al.* (2022, \doi{10.1099/mic.0.001269}) who extensively studied medical-scientific literature to categorise all bacterial species into these groups: | #' The grouping into human pathogenic prevalence \eqn{p} is based on recent work from Bartlett *et al.* (2022, \doi{10.1099/mic.0.001269}) who extensively studied medical-scientific literature to categorise all bacterial species into these groups: | ||||||
| #'  | #'  | ||||||
| #' - **Established**, if a taxonomic species has infected at least three persons in three or more references. These records have `prevalence = 1.0` in the [microorganisms] data set; | #' - **Established**, if a taxonomic species has infected at least three persons in three or more references. These records have `prevalence = 1.0` in the [microorganisms] data set; | ||||||
| #' - **Putative**, if a taxonomic species has fewer than three known cases. These records have `prevalence = 1.25` in the [microorganisms] data set. | #' - **Putative**, if a taxonomic species has fewer than three known cases. These records have `prevalence = 1.25` in the [microorganisms] data set. | ||||||
| @@ -69,6 +70,8 @@ | |||||||
| #' @export | #' @export | ||||||
| #' @inheritSection AMR Reference Data Publicly Available | #' @inheritSection AMR Reference Data Publicly Available | ||||||
| #' @examples | #' @examples | ||||||
|  | #' mo_reset_session() | ||||||
|  | #'  | ||||||
| #' as.mo("E. coli") | #' as.mo("E. coli") | ||||||
| #' mo_uncertainties() | #' mo_uncertainties() | ||||||
| #' | #' | ||||||
|   | |||||||
| @@ -36,31 +36,31 @@ | |||||||
| #' @param ... other arguments passed on to [as.mo()], such as 'minimum_matching_score', 'ignore_pattern', and 'remove_from_input' | #' @param ... other arguments passed on to [as.mo()], such as 'minimum_matching_score', 'ignore_pattern', and 'remove_from_input' | ||||||
| #' @param ab any (vector of) text that can be coerced to a valid antibiotic drug code with [as.ab()] | #' @param ab any (vector of) text that can be coerced to a valid antibiotic drug code with [as.ab()] | ||||||
| #' @param open browse the URL using [`browseURL()`][utils::browseURL()] | #' @param open browse the URL using [`browseURL()`][utils::browseURL()] | ||||||
| #' @details All functions will, at default, **not** keep old taxonomic properties, as synonyms are automatically replaced with the current taxonomy. Take for example *Escherichia blattae*, which was renamed to *Shimwellia blattae* in 2010: | #' @details All functions will, at default, **not** keep old taxonomic properties, as synonyms are automatically replaced with the current taxonomy. Take for example *Enterobacter aerogenes*, which was initially named in 1960 but renamed to *Klebsiella aerogenes* in 2017: | ||||||
| #' - `mo_genus("Escherichia blattae")` will return `"Shemwellia"` (with a note about the renaming) | #' - `mo_genus("Enterobacter aerogenes")` will return `"Klebsiella"` (with a note about the renaming) | ||||||
| #' - `mo_genus("Escherichia blattae", keep_synonyms = TRUE)` will return `"Escherichia"` (with a warning that the name is outdated) | #' - `mo_genus("Enterobacter aerogenes", keep_synonyms = TRUE)` will return `"Enterobacter"` (with a once-per-session warning that the name is outdated) | ||||||
| #' - `mo_ref("Escherichia blattae")` will return `"Priest et al., 2010"` (with a note) | #' - `mo_ref("Enterobacter aerogenes")` will return `"Tindall et al., 2017"` (with a note) | ||||||
| #' - `mo_ref("Escherichia blattae", keep_synonyms = TRUE)` will return `"Burgess et al., 1973"` (with a warning) | #' - `mo_ref("Enterobacter aerogenes", keep_synonyms = TRUE)` will return `"Hormaeche et al., 1960"` (with a warning) | ||||||
| #' | #' | ||||||
| #' The short name ([mo_shortname()]) returns the first character of the genus and the full species, such as `"E. coli"`, for species and subspecies. Exceptions are abbreviations of staphylococci (such as *"CoNS"*, Coagulase-Negative Staphylococci) and beta-haemolytic streptococci (such as *"GBS"*, Group B Streptococci). Please bear in mind that e.g. *E. coli* could mean *Escherichia coli* (kingdom of Bacteria) as well as *Entamoeba coli* (kingdom of Protozoa). Returning to the full name will be done using [as.mo()] internally, giving priority to bacteria and human pathogens, i.e. `"E. coli"` will be considered *Escherichia coli*. In other words, `mo_fullname(mo_shortname("Entamoeba coli"))` returns `"Escherichia coli"`. | #' The short name ([mo_shortname()]) returns the first character of the genus and the full species, such as `"E. coli"`, for species and subspecies. Exceptions are abbreviations of staphylococci (such as *"CoNS"*, Coagulase-Negative Staphylococci) and beta-haemolytic streptococci (such as *"GBS"*, Group B Streptococci). Please bear in mind that e.g. *E. coli* could mean *Escherichia coli* (kingdom of Bacteria) as well as *Entamoeba coli* (kingdom of Protozoa). Returning to the full name will be done using [as.mo()] internally, giving priority to bacteria and human pathogens, i.e. `"E. coli"` will be considered *Escherichia coli*. As a result, `mo_fullname(mo_shortname("Entamoeba coli"))` returns `"Escherichia coli"`. | ||||||
| #' | #' | ||||||
| #' Since the top-level of the taxonomy is sometimes referred to as 'kingdom' and sometimes as 'domain', the functions [mo_kingdom()] and [mo_domain()] return the exact same results. | #' Since the top-level of the taxonomy is sometimes referred to as 'kingdom' and sometimes as 'domain', the functions [mo_kingdom()] and [mo_domain()] return the exact same results. | ||||||
| #' | #' | ||||||
| #' Determination of human pathogenicity ([mo_pathogenicity()]) is strongly based on Bartlett *et al.* (2022, \doi{10.1099/mic.0.001269}). This function returns a [factor] with the levels *Pathogenic*, *Potentially pathogenic*, *Non-pathogenic*, and *Unknown*. | #' Determination of human pathogenicity ([mo_pathogenicity()]) is strongly based on Bartlett *et al.* (2022, \doi{10.1099/mic.0.001269}). This function returns a [factor] with the levels *Pathogenic*, *Potentially pathogenic*, *Non-pathogenic*, and *Unknown*. | ||||||
| #' | #' | ||||||
| #' Determination of the Gram stain ([mo_gramstain()]) will be based on the taxonomic kingdom and phylum. Originally, Cavalier-Smith defined the so-called subkingdoms Negibacteria and Posibacteria (2002, [PMID 11837318](https://pubmed.ncbi.nlm.nih.gov/11837318/)), and only considered these phyla as Posibacteria: Actinobacteria, Chloroflexi, Firmicutes, and Tenericutes. These phyla were renamed to Actinomycetota, Chloroflexota, Bacillota, and Mycoplasmatota (2021, [PMID 34694987](https://pubmed.ncbi.nlm.nih.gov/34694987/)). Bacteria in these phyla are considered Gram-positive in this `AMR` package, except for members of the class Negativicutes (within phylum Bacillota) which are Gram-negative. All other bacteria are considered Gram-negative. Species outside the kingdom of Bacteria will return a value `NA`. Functions [mo_is_gram_negative()] and [mo_is_gram_positive()] always return `TRUE` or `FALSE` (or `NA` when the input is `NA` or the MO code is `UNKNOWN`), thus always return `FALSE` for species outside the taxonomic kingdom of Bacteria. | #' Determination of the Gram stain ([mo_gramstain()]) will be based on the taxonomic kingdom and phylum. Originally, Cavalier-Smith defined the so-called subkingdoms Negibacteria and Posibacteria (2002, [PMID 11837318](https://pubmed.ncbi.nlm.nih.gov/11837318/)), and only considered these phyla as Posibacteria: Actinobacteria, Chloroflexi, Firmicutes, and Tenericutes. These phyla were later renamed to Actinomycetota, Chloroflexota, Bacillota, and Mycoplasmatota (2021, [PMID 34694987](https://pubmed.ncbi.nlm.nih.gov/34694987/)). Bacteria in these phyla are considered Gram-positive in this `AMR` package, except for members of the class Negativicutes (within phylum Bacillota) which are Gram-negative. All other bacteria are considered Gram-negative. Species outside the kingdom of Bacteria will return a value `NA`. Functions [mo_is_gram_negative()] and [mo_is_gram_positive()] always return `TRUE` or `FALSE` (or `NA` when the input is `NA` or the MO code is `UNKNOWN`), thus always return `FALSE` for species outside the taxonomic kingdom of Bacteria. | ||||||
| #' | #' | ||||||
| #' Determination of yeasts ([mo_is_yeast()]) will be based on the taxonomic kingdom and class. *Budding yeasts* are fungi of the phylum Ascomycota, class Saccharomycetes (also called Hemiascomycetes). *True yeasts* are aggregated into the underlying order Saccharomycetales. Thus, for all microorganisms that are member of the taxonomic class Saccharomycetes, the function will return `TRUE`. It returns `FALSE` otherwise (or `NA` when the input is `NA` or the MO code is `UNKNOWN`). | #' Determination of yeasts ([mo_is_yeast()]) will be based on the taxonomic kingdom and class. *Budding yeasts* are fungi of the phylum Ascomycota, class Saccharomycetes (also called Hemiascomycetes). *True yeasts* are aggregated into the underlying order Saccharomycetales. Thus, for all microorganisms that are member of the taxonomic class Saccharomycetes, the function will return `TRUE`. It returns `FALSE` otherwise (or `NA` when the input is `NA` or the MO code is `UNKNOWN`). | ||||||
| #' | #' | ||||||
| #' Determination of intrinsic resistance ([mo_is_intrinsic_resistant()]) will be based on the [intrinsic_resistant] data set, which is based on `r format_eucast_version_nr(3.3)`. The [mo_is_intrinsic_resistant()] function can be vectorised over both argument `x` (input for microorganisms) and `ab` (input for antibiotics). | #' Determination of intrinsic resistance ([mo_is_intrinsic_resistant()]) will be based on the [intrinsic_resistant] data set, which is based on `r format_eucast_version_nr(3.3)`. The [mo_is_intrinsic_resistant()] function can be vectorised over both argument `x` (input for microorganisms) and `ab` (input for antibiotics). | ||||||
| #' | #' | ||||||
| #' All output [will be translated][translate] where possible. |  | ||||||
| #' |  | ||||||
| #' The function [mo_url()] will return the direct URL to the online database entry, which also shows the scientific reference of the concerned species. | #' The function [mo_url()] will return the direct URL to the online database entry, which also shows the scientific reference of the concerned species. | ||||||
| #' | #' | ||||||
| #' SNOMED codes ([mo_snomed()]) are from the version of `r documentation_date(TAXONOMY_VERSION$SNOMED$accessed_date)`. See *Source* and the [microorganisms] data set for more info. | #' SNOMED codes ([mo_snomed()]) are from the version of `r documentation_date(TAXONOMY_VERSION$SNOMED$accessed_date)`. See *Source* and the [microorganisms] data set for more info. | ||||||
| #' | #' | ||||||
| #' Old taxonomic names (so-called 'synonyms') can be retrieved with [mo_synonyms()], the current taxonomic name can be retrieved with [mo_current()]. Both functions return full names. | #' Old taxonomic names (so-called 'synonyms') can be retrieved with [mo_synonyms()], the current taxonomic name can be retrieved with [mo_current()]. Both functions return full names. | ||||||
|  | #' | ||||||
|  | #' All output [will be translated][translate] where possible. | ||||||
| #' @section Matching Score for Microorganisms: | #' @section Matching Score for Microorganisms: | ||||||
| #' This function uses [as.mo()] internally, which uses an advanced algorithm to translate arbitrary user input to valid taxonomy using a so-called matching score. You can read about this public algorithm on the [MO matching score page][mo_matching_score()]. | #' This function uses [as.mo()] internally, which uses an advanced algorithm to translate arbitrary user input to valid taxonomy using a so-called matching score. You can read about this public algorithm on the [MO matching score page][mo_matching_score()]. | ||||||
| #' @inheritSection as.mo Source | #' @inheritSection as.mo Source | ||||||
| @@ -145,10 +145,10 @@ | |||||||
| #' | #' | ||||||
| #' # Lancefield classification, see ?as.mo ------------------------------------ | #' # Lancefield classification, see ?as.mo ------------------------------------ | ||||||
| #' | #' | ||||||
| #' mo_fullname("S. pyo") | #' mo_fullname("Strep Group B") | ||||||
| #' mo_fullname("S. pyo", Lancefield = TRUE) | #' mo_fullname("Strep Group B", Lancefield = TRUE) | ||||||
| #' mo_shortname("S. pyo") | #' mo_shortname("Strep Group B") | ||||||
| #' mo_shortname("S. pyo", Lancefield = TRUE) | #' mo_shortname("Strep Group B", Lancefield = TRUE) | ||||||
| #' | #' | ||||||
| #' | #' | ||||||
| #' # language support  -------------------------------------------------------- | #' # language support  -------------------------------------------------------- | ||||||
| @@ -159,7 +159,7 @@ | |||||||
| #' mo_gramstain("Klebsiella pneumoniae", language = "el") # Greek | #' mo_gramstain("Klebsiella pneumoniae", language = "el") # Greek | ||||||
| #' mo_gramstain("Klebsiella pneumoniae", language = "uk") # Ukrainian | #' mo_gramstain("Klebsiella pneumoniae", language = "uk") # Ukrainian | ||||||
| #'  | #'  | ||||||
| #' # mo_type is equal to mo_kingdom, but mo_kingdom will remain official | #' # mo_type is equal to mo_kingdom, but mo_kingdom will remain untranslated | ||||||
| #' mo_kingdom("Klebsiella pneumoniae") | #' mo_kingdom("Klebsiella pneumoniae") | ||||||
| #' mo_type("Klebsiella pneumoniae") | #' mo_type("Klebsiella pneumoniae") | ||||||
| #' mo_kingdom("Klebsiella pneumoniae", language = "zh") # Chinese, no effect | #' mo_kingdom("Klebsiella pneumoniae", language = "zh") # Chinese, no effect | ||||||
|   | |||||||
							
								
								
									
										15
									
								
								man/as.mo.Rd
									
									
									
									
									
								
							
							
						
						
									
										15
									
								
								man/as.mo.Rd
									
									
									
									
									
								
							| @@ -108,7 +108,7 @@ There are three helper functions that can be run after using the \code{\link[=as | |||||||
|  |  | ||||||
| \subsection{Microbial Prevalence of Pathogens in Humans}{ | \subsection{Microbial Prevalence of Pathogens in Humans}{ | ||||||
|  |  | ||||||
| The coercion rules consider the prevalence of microorganisms in humans grouped into three groups, which is available as the \code{prevalence} columns in the \link{microorganisms} data set. The grouping into human pathogenic prevalence is explained in the section \emph{Matching Score for Microorganisms} below. | The coercion rules consider the prevalence of microorganisms in humans, which is available as the \code{prevalence} column in the \link{microorganisms} data set. The grouping into human pathogenic prevalence is explained in the section \emph{Matching Score for Microorganisms} below. | ||||||
| } | } | ||||||
| } | } | ||||||
| \section{Source}{ | \section{Source}{ | ||||||
| @@ -136,14 +136,15 @@ With ambiguous user input in \code{\link[=as.mo]{as.mo()}} and all the \code{\li | |||||||
| where: | where: | ||||||
| \itemize{ | \itemize{ | ||||||
| \item \eqn{x} is the user input; | \item \eqn{x} is the user input; | ||||||
| \item \ifelse{html}{\out{<i>n</i> is a taxonomic name (genus, species, and subspecies);}}{\eqn{n} is a taxonomic name (genus, species, and subspecies);} | \item \eqn{n} is a taxonomic name (genus, species, and subspecies); | ||||||
| \item \ifelse{html}{\out{<i>l<sub>n</sub></i> is the length of <i>n</i>;}}{l_n is the length of \eqn{n};} | \item \eqn{l_n} is the length of \eqn{n}; | ||||||
| \item \ifelse{html}{\out{<i>lev</i> is the <a href="https://en.wikipedia.org/wiki/Levenshtein_distance">Levenshtein distance function</a> (counting any insertion as 1, and any deletion or substitution as 2) that is needed to change <i>x</i> into <i>n</i>;}}{lev is the Levenshtein distance function (counting any insertion as 1, and any deletion or substitution as 2) that is needed to change \eqn{x} into \eqn{n};} | \item \ifelse{html}{\out{\if{html}{\out{<i>}}lev\if{html}{\out{</i>}} is the | ||||||
| \item \ifelse{html}{\out{<i>p<sub>n</sub></i> is the human pathogenic prevalence group of <i>n</i>, as described below;}}{p_n is the human pathogenic prevalence group of \eqn{n}, as described below;} | \item \eqn{lev} is the \href{https://en.wikipedia.org/wiki/Levenshtein_distance}{Levenshtein distance function} (counting any insertion as 1, and any deletion or substitution as 2) that is needed to change \eqn{x} into \eqn{n}; | ||||||
| \item \ifelse{html}{\out{<i>k<sub>n</sub></i> is the taxonomic kingdom of <i>n</i>, set as Bacteria = 1, Fungi = 2, Protozoa = 3, Archaea = 4, others = 5.}}{l_n is the taxonomic kingdom of \eqn{n}, set as Bacteria = 1, Fungi = 2, Protozoa = 3, Archaea = 4, others = 5.} | \item \eqn{p_{n}} is the human pathogenic prevalence group of \eqn{n}, as described below; | ||||||
|  | \item \eqn{k_n} is the taxonomic kingdom of \eqn{n}, set as Bacteria = 1, Fungi = 2, Protozoa = 3, Archaea = 4, others = 5. | ||||||
| } | } | ||||||
|  |  | ||||||
| The grouping into human pathogenic prevalence (\eqn{p}) is based on recent work from Bartlett \emph{et al.} (2022, \doi{10.1099/mic.0.001269}) who extensively studied medical-scientific literature to categorise all bacterial species into these groups: | The grouping into human pathogenic prevalence \eqn{p} is based on recent work from Bartlett \emph{et al.} (2022, \doi{10.1099/mic.0.001269}) who extensively studied medical-scientific literature to categorise all bacterial species into these groups: | ||||||
| \itemize{ | \itemize{ | ||||||
| \item \strong{Established}, if a taxonomic species has infected at least three persons in three or more references. These records have \code{prevalence = 1.0} in the \link{microorganisms} data set; | \item \strong{Established}, if a taxonomic species has infected at least three persons in three or more references. These records have \code{prevalence = 1.0} in the \link{microorganisms} data set; | ||||||
| \item \strong{Putative}, if a taxonomic species has fewer than three known cases. These records have \code{prevalence = 1.25} in the \link{microorganisms} data set. | \item \strong{Putative}, if a taxonomic species has fewer than three known cases. These records have \code{prevalence = 1.25} in the \link{microorganisms} data set. | ||||||
|   | |||||||
| @@ -28,14 +28,15 @@ With ambiguous user input in \code{\link[=as.mo]{as.mo()}} and all the \code{\li | |||||||
| where: | where: | ||||||
| \itemize{ | \itemize{ | ||||||
| \item \eqn{x} is the user input; | \item \eqn{x} is the user input; | ||||||
| \item \ifelse{html}{\out{<i>n</i> is a taxonomic name (genus, species, and subspecies);}}{\eqn{n} is a taxonomic name (genus, species, and subspecies);} | \item \eqn{n} is a taxonomic name (genus, species, and subspecies); | ||||||
| \item \ifelse{html}{\out{<i>l<sub>n</sub></i> is the length of <i>n</i>;}}{l_n is the length of \eqn{n};} | \item \eqn{l_n} is the length of \eqn{n}; | ||||||
| \item \ifelse{html}{\out{<i>lev</i> is the <a href="https://en.wikipedia.org/wiki/Levenshtein_distance">Levenshtein distance function</a> (counting any insertion as 1, and any deletion or substitution as 2) that is needed to change <i>x</i> into <i>n</i>;}}{lev is the Levenshtein distance function (counting any insertion as 1, and any deletion or substitution as 2) that is needed to change \eqn{x} into \eqn{n};} | \item \ifelse{html}{\out{\if{html}{\out{<i>}}lev\if{html}{\out{</i>}} is the | ||||||
| \item \ifelse{html}{\out{<i>p<sub>n</sub></i> is the human pathogenic prevalence group of <i>n</i>, as described below;}}{p_n is the human pathogenic prevalence group of \eqn{n}, as described below;} | \item \eqn{lev} is the \href{https://en.wikipedia.org/wiki/Levenshtein_distance}{Levenshtein distance function} (counting any insertion as 1, and any deletion or substitution as 2) that is needed to change \eqn{x} into \eqn{n}; | ||||||
| \item \ifelse{html}{\out{<i>k<sub>n</sub></i> is the taxonomic kingdom of <i>n</i>, set as Bacteria = 1, Fungi = 2, Protozoa = 3, Archaea = 4, others = 5.}}{l_n is the taxonomic kingdom of \eqn{n}, set as Bacteria = 1, Fungi = 2, Protozoa = 3, Archaea = 4, others = 5.} | \item \eqn{p_{n}} is the human pathogenic prevalence group of \eqn{n}, as described below; | ||||||
|  | \item \eqn{k_n} is the taxonomic kingdom of \eqn{n}, set as Bacteria = 1, Fungi = 2, Protozoa = 3, Archaea = 4, others = 5. | ||||||
| } | } | ||||||
|  |  | ||||||
| The grouping into human pathogenic prevalence (\eqn{p}) is based on recent work from Bartlett \emph{et al.} (2022, \doi{10.1099/mic.0.001269}) who extensively studied medical-scientific literature to categorise all bacterial species into these groups: | The grouping into human pathogenic prevalence \eqn{p} is based on recent work from Bartlett \emph{et al.} (2022, \doi{10.1099/mic.0.001269}) who extensively studied medical-scientific literature to categorise all bacterial species into these groups: | ||||||
| \itemize{ | \itemize{ | ||||||
| \item \strong{Established}, if a taxonomic species has infected at least three persons in three or more references. These records have \code{prevalence = 1.0} in the \link{microorganisms} data set; | \item \strong{Established}, if a taxonomic species has infected at least three persons in three or more references. These records have \code{prevalence = 1.0} in the \link{microorganisms} data set; | ||||||
| \item \strong{Putative}, if a taxonomic species has fewer than three known cases. These records have \code{prevalence = 1.25} in the \link{microorganisms} data set. | \item \strong{Putative}, if a taxonomic species has fewer than three known cases. These records have \code{prevalence = 1.25} in the \link{microorganisms} data set. | ||||||
| @@ -61,6 +62,8 @@ All data sets in this \code{AMR} package (about microorganisms, antibiotics, R/S | |||||||
| } | } | ||||||
|  |  | ||||||
| \examples{ | \examples{ | ||||||
|  | mo_reset_session() | ||||||
|  |  | ||||||
| as.mo("E. coli") | as.mo("E. coli") | ||||||
| mo_uncertainties() | mo_uncertainties() | ||||||
|  |  | ||||||
|   | |||||||
| @@ -294,33 +294,33 @@ mo_property( | |||||||
| Use these functions to return a specific property of a microorganism based on the latest accepted taxonomy. All input values will be evaluated internally with \code{\link[=as.mo]{as.mo()}}, which makes it possible to use microbial abbreviations, codes and names as input. See \emph{Examples}. | Use these functions to return a specific property of a microorganism based on the latest accepted taxonomy. All input values will be evaluated internally with \code{\link[=as.mo]{as.mo()}}, which makes it possible to use microbial abbreviations, codes and names as input. See \emph{Examples}. | ||||||
| } | } | ||||||
| \details{ | \details{ | ||||||
| All functions will, at default, \strong{not} keep old taxonomic properties, as synonyms are automatically replaced with the current taxonomy. Take for example \emph{Escherichia blattae}, which was renamed to \emph{Shimwellia blattae} in 2010: | All functions will, at default, \strong{not} keep old taxonomic properties, as synonyms are automatically replaced with the current taxonomy. Take for example \emph{Enterobacter aerogenes}, which was initially named in 1960 but renamed to \emph{Klebsiella aerogenes} in 2017: | ||||||
| \itemize{ | \itemize{ | ||||||
| \item \code{mo_genus("Escherichia blattae")} will return \code{"Shemwellia"} (with a note about the renaming) | \item \code{mo_genus("Enterobacter aerogenes")} will return \code{"Klebsiella"} (with a note about the renaming) | ||||||
| \item \code{mo_genus("Escherichia blattae", keep_synonyms = TRUE)} will return \code{"Escherichia"} (with a warning that the name is outdated) | \item \code{mo_genus("Enterobacter aerogenes", keep_synonyms = TRUE)} will return \code{"Enterobacter"} (with a once-per-session warning that the name is outdated) | ||||||
| \item \code{mo_ref("Escherichia blattae")} will return \code{"Priest et al., 2010"} (with a note) | \item \code{mo_ref("Enterobacter aerogenes")} will return \code{"Tindall et al., 2017"} (with a note) | ||||||
| \item \code{mo_ref("Escherichia blattae", keep_synonyms = TRUE)} will return \code{"Burgess et al., 1973"} (with a warning) | \item \code{mo_ref("Enterobacter aerogenes", keep_synonyms = TRUE)} will return \code{"Hormaeche et al., 1960"} (with a warning) | ||||||
| } | } | ||||||
|  |  | ||||||
| The short name (\code{\link[=mo_shortname]{mo_shortname()}}) returns the first character of the genus and the full species, such as \code{"E. coli"}, for species and subspecies. Exceptions are abbreviations of staphylococci (such as \emph{"CoNS"}, Coagulase-Negative Staphylococci) and beta-haemolytic streptococci (such as \emph{"GBS"}, Group B Streptococci). Please bear in mind that e.g. \emph{E. coli} could mean \emph{Escherichia coli} (kingdom of Bacteria) as well as \emph{Entamoeba coli} (kingdom of Protozoa). Returning to the full name will be done using \code{\link[=as.mo]{as.mo()}} internally, giving priority to bacteria and human pathogens, i.e. \code{"E. coli"} will be considered \emph{Escherichia coli}. In other words, \code{mo_fullname(mo_shortname("Entamoeba coli"))} returns \code{"Escherichia coli"}. | The short name (\code{\link[=mo_shortname]{mo_shortname()}}) returns the first character of the genus and the full species, such as \code{"E. coli"}, for species and subspecies. Exceptions are abbreviations of staphylococci (such as \emph{"CoNS"}, Coagulase-Negative Staphylococci) and beta-haemolytic streptococci (such as \emph{"GBS"}, Group B Streptococci). Please bear in mind that e.g. \emph{E. coli} could mean \emph{Escherichia coli} (kingdom of Bacteria) as well as \emph{Entamoeba coli} (kingdom of Protozoa). Returning to the full name will be done using \code{\link[=as.mo]{as.mo()}} internally, giving priority to bacteria and human pathogens, i.e. \code{"E. coli"} will be considered \emph{Escherichia coli}. As a result, \code{mo_fullname(mo_shortname("Entamoeba coli"))} returns \code{"Escherichia coli"}. | ||||||
|  |  | ||||||
| Since the top-level of the taxonomy is sometimes referred to as 'kingdom' and sometimes as 'domain', the functions \code{\link[=mo_kingdom]{mo_kingdom()}} and \code{\link[=mo_domain]{mo_domain()}} return the exact same results. | Since the top-level of the taxonomy is sometimes referred to as 'kingdom' and sometimes as 'domain', the functions \code{\link[=mo_kingdom]{mo_kingdom()}} and \code{\link[=mo_domain]{mo_domain()}} return the exact same results. | ||||||
|  |  | ||||||
| Determination of human pathogenicity (\code{\link[=mo_pathogenicity]{mo_pathogenicity()}}) is strongly based on Bartlett \emph{et al.} (2022, \doi{10.1099/mic.0.001269}). This function returns a \link{factor} with the levels \emph{Pathogenic}, \emph{Potentially pathogenic}, \emph{Non-pathogenic}, and \emph{Unknown}. | Determination of human pathogenicity (\code{\link[=mo_pathogenicity]{mo_pathogenicity()}}) is strongly based on Bartlett \emph{et al.} (2022, \doi{10.1099/mic.0.001269}). This function returns a \link{factor} with the levels \emph{Pathogenic}, \emph{Potentially pathogenic}, \emph{Non-pathogenic}, and \emph{Unknown}. | ||||||
|  |  | ||||||
| Determination of the Gram stain (\code{\link[=mo_gramstain]{mo_gramstain()}}) will be based on the taxonomic kingdom and phylum. Originally, Cavalier-Smith defined the so-called subkingdoms Negibacteria and Posibacteria (2002, \href{https://pubmed.ncbi.nlm.nih.gov/11837318/}{PMID 11837318}), and only considered these phyla as Posibacteria: Actinobacteria, Chloroflexi, Firmicutes, and Tenericutes. These phyla were renamed to Actinomycetota, Chloroflexota, Bacillota, and Mycoplasmatota (2021, \href{https://pubmed.ncbi.nlm.nih.gov/34694987/}{PMID 34694987}). Bacteria in these phyla are considered Gram-positive in this \code{AMR} package, except for members of the class Negativicutes (within phylum Bacillota) which are Gram-negative. All other bacteria are considered Gram-negative. Species outside the kingdom of Bacteria will return a value \code{NA}. Functions \code{\link[=mo_is_gram_negative]{mo_is_gram_negative()}} and \code{\link[=mo_is_gram_positive]{mo_is_gram_positive()}} always return \code{TRUE} or \code{FALSE} (or \code{NA} when the input is \code{NA} or the MO code is \code{UNKNOWN}), thus always return \code{FALSE} for species outside the taxonomic kingdom of Bacteria. | Determination of the Gram stain (\code{\link[=mo_gramstain]{mo_gramstain()}}) will be based on the taxonomic kingdom and phylum. Originally, Cavalier-Smith defined the so-called subkingdoms Negibacteria and Posibacteria (2002, \href{https://pubmed.ncbi.nlm.nih.gov/11837318/}{PMID 11837318}), and only considered these phyla as Posibacteria: Actinobacteria, Chloroflexi, Firmicutes, and Tenericutes. These phyla were later renamed to Actinomycetota, Chloroflexota, Bacillota, and Mycoplasmatota (2021, \href{https://pubmed.ncbi.nlm.nih.gov/34694987/}{PMID 34694987}). Bacteria in these phyla are considered Gram-positive in this \code{AMR} package, except for members of the class Negativicutes (within phylum Bacillota) which are Gram-negative. All other bacteria are considered Gram-negative. Species outside the kingdom of Bacteria will return a value \code{NA}. Functions \code{\link[=mo_is_gram_negative]{mo_is_gram_negative()}} and \code{\link[=mo_is_gram_positive]{mo_is_gram_positive()}} always return \code{TRUE} or \code{FALSE} (or \code{NA} when the input is \code{NA} or the MO code is \code{UNKNOWN}), thus always return \code{FALSE} for species outside the taxonomic kingdom of Bacteria. | ||||||
|  |  | ||||||
| Determination of yeasts (\code{\link[=mo_is_yeast]{mo_is_yeast()}}) will be based on the taxonomic kingdom and class. \emph{Budding yeasts} are fungi of the phylum Ascomycota, class Saccharomycetes (also called Hemiascomycetes). \emph{True yeasts} are aggregated into the underlying order Saccharomycetales. Thus, for all microorganisms that are member of the taxonomic class Saccharomycetes, the function will return \code{TRUE}. It returns \code{FALSE} otherwise (or \code{NA} when the input is \code{NA} or the MO code is \code{UNKNOWN}). | Determination of yeasts (\code{\link[=mo_is_yeast]{mo_is_yeast()}}) will be based on the taxonomic kingdom and class. \emph{Budding yeasts} are fungi of the phylum Ascomycota, class Saccharomycetes (also called Hemiascomycetes). \emph{True yeasts} are aggregated into the underlying order Saccharomycetales. Thus, for all microorganisms that are member of the taxonomic class Saccharomycetes, the function will return \code{TRUE}. It returns \code{FALSE} otherwise (or \code{NA} when the input is \code{NA} or the MO code is \code{UNKNOWN}). | ||||||
|  |  | ||||||
| Determination of intrinsic resistance (\code{\link[=mo_is_intrinsic_resistant]{mo_is_intrinsic_resistant()}}) will be based on the \link{intrinsic_resistant} data set, which is based on \href{https://www.eucast.org/expert_rules_and_expected_phenotypes/}{'EUCAST Expert Rules' and 'EUCAST Intrinsic Resistance and Unusual Phenotypes' v3.3} (2021). The \code{\link[=mo_is_intrinsic_resistant]{mo_is_intrinsic_resistant()}} function can be vectorised over both argument \code{x} (input for microorganisms) and \code{ab} (input for antibiotics). | Determination of intrinsic resistance (\code{\link[=mo_is_intrinsic_resistant]{mo_is_intrinsic_resistant()}}) will be based on the \link{intrinsic_resistant} data set, which is based on \href{https://www.eucast.org/expert_rules_and_expected_phenotypes/}{'EUCAST Expert Rules' and 'EUCAST Intrinsic Resistance and Unusual Phenotypes' v3.3} (2021). The \code{\link[=mo_is_intrinsic_resistant]{mo_is_intrinsic_resistant()}} function can be vectorised over both argument \code{x} (input for microorganisms) and \code{ab} (input for antibiotics). | ||||||
|  |  | ||||||
| All output \link[=translate]{will be translated} where possible. |  | ||||||
|  |  | ||||||
| The function \code{\link[=mo_url]{mo_url()}} will return the direct URL to the online database entry, which also shows the scientific reference of the concerned species. | The function \code{\link[=mo_url]{mo_url()}} will return the direct URL to the online database entry, which also shows the scientific reference of the concerned species. | ||||||
|  |  | ||||||
| SNOMED codes (\code{\link[=mo_snomed]{mo_snomed()}}) are from the version of 1 July, 2021. See \emph{Source} and the \link{microorganisms} data set for more info. | SNOMED codes (\code{\link[=mo_snomed]{mo_snomed()}}) are from the version of 1 July, 2021. See \emph{Source} and the \link{microorganisms} data set for more info. | ||||||
|  |  | ||||||
| Old taxonomic names (so-called 'synonyms') can be retrieved with \code{\link[=mo_synonyms]{mo_synonyms()}}, the current taxonomic name can be retrieved with \code{\link[=mo_current]{mo_current()}}. Both functions return full names. | Old taxonomic names (so-called 'synonyms') can be retrieved with \code{\link[=mo_synonyms]{mo_synonyms()}}, the current taxonomic name can be retrieved with \code{\link[=mo_current]{mo_current()}}. Both functions return full names. | ||||||
|  |  | ||||||
|  | All output \link[=translate]{will be translated} where possible. | ||||||
| } | } | ||||||
| \section{Matching Score for Microorganisms}{ | \section{Matching Score for Microorganisms}{ | ||||||
|  |  | ||||||
| @@ -417,10 +417,10 @@ mo_shortname("Staph. epidermidis", Becker = TRUE) | |||||||
|  |  | ||||||
| # Lancefield classification, see ?as.mo ------------------------------------ | # Lancefield classification, see ?as.mo ------------------------------------ | ||||||
|  |  | ||||||
| mo_fullname("S. pyo") | mo_fullname("Strep Group B") | ||||||
| mo_fullname("S. pyo", Lancefield = TRUE) | mo_fullname("Strep Group B", Lancefield = TRUE) | ||||||
| mo_shortname("S. pyo") | mo_shortname("Strep Group B") | ||||||
| mo_shortname("S. pyo", Lancefield = TRUE) | mo_shortname("Strep Group B", Lancefield = TRUE) | ||||||
|  |  | ||||||
|  |  | ||||||
| # language support  -------------------------------------------------------- | # language support  -------------------------------------------------------- | ||||||
| @@ -431,7 +431,7 @@ mo_gramstain("Klebsiella pneumoniae", language = "es") # Spanish | |||||||
| mo_gramstain("Klebsiella pneumoniae", language = "el") # Greek | mo_gramstain("Klebsiella pneumoniae", language = "el") # Greek | ||||||
| mo_gramstain("Klebsiella pneumoniae", language = "uk") # Ukrainian | mo_gramstain("Klebsiella pneumoniae", language = "uk") # Ukrainian | ||||||
|  |  | ||||||
| # mo_type is equal to mo_kingdom, but mo_kingdom will remain official | # mo_type is equal to mo_kingdom, but mo_kingdom will remain untranslated | ||||||
| mo_kingdom("Klebsiella pneumoniae") | mo_kingdom("Klebsiella pneumoniae") | ||||||
| mo_type("Klebsiella pneumoniae") | mo_type("Klebsiella pneumoniae") | ||||||
| mo_kingdom("Klebsiella pneumoniae", language = "zh") # Chinese, no effect | mo_kingdom("Klebsiella pneumoniae", language = "zh") # Chinese, no effect | ||||||
|   | |||||||
		Reference in New Issue
	
	Block a user