AMR/man/first_isolate.Rd

% Generated by roxygen2: do not edit by hand
% Please edit documentation in R/first_isolate.R
\name{first_isolate}
\alias{first_isolate}
\alias{filter_first_isolate}
\title{Determine First (Weighted) Isolates}
\source{
Methodology of this function is strictly based on:
\itemize{
\item \strong{M39 Analysis and Presentation of Cumulative Antimicrobial Susceptibility Test Data, 4th Edition}, 2014, \emph{Clinical and Laboratory Standards Institute (CLSI)}. \url{https://clsi.org/standards/products/microbiology/documents/m39/}.
\item Hindler JF and Stelling J (2007). \strong{Analysis and Presentation of Cumulative Antibiograms: A New Consensus Guideline from the Clinical and Laboratory Standards Institute.} Clinical Infectious Diseases, 44(6), 867–873. \doi{10.1086/511864}
}
}
\usage{
first_isolate(
  x = NULL,
  col_date = NULL,
  col_patient_id = NULL,
  col_mo = NULL,
  col_testcode = NULL,
  col_specimen = NULL,
  col_icu = NULL,
  col_keyantimicrobials = NULL,
  episode_days = 365,
  testcodes_exclude = NULL,
  icu_exclude = FALSE,
  specimen_group = NULL,
  type = "points",
  method = c("phenotype-based", "episode-based", "patient-based", "isolate-based"),
  ignore_I = TRUE,
  points_threshold = 2,
  info = interactive(),
  include_unknown = FALSE,
  include_untested_rsi = TRUE,
  ...
)

filter_first_isolate(
  x = NULL,
  col_date = NULL,
  col_patient_id = NULL,
  col_mo = NULL,
  episode_days = 365,
  method = c("phenotype-based", "episode-based", "patient-based", "isolate-based"),
  ...
)
}
\arguments{
\item{x}{a \link{data.frame} containing isolates. Can be left blank for automatic determination, see \emph{Examples}.}

\item{col_date}{column name of the result date (or date that it was received at the lab), defaults to the first column with a date class}

\item{col_patient_id}{column name of the unique IDs of the patients, defaults to the first column that starts with 'patient' or 'patid' (case insensitive)}

\item{col_mo}{column name of the IDs of the microorganisms (see \code{\link[=as.mo]{as.mo()}}), defaults to the first column of class \code{\link{mo}}. Values will be coerced using \code{\link[=as.mo]{as.mo()}}.}

\item{col_testcode}{column name of the test codes. Use \code{col_testcode = NULL} to \strong{not} exclude certain test codes (such as test codes for screening). In that case \code{testcodes_exclude} will be ignored.}

\item{col_specimen}{column name of the specimen type or group}

\item{col_icu}{column name of the logicals (\code{TRUE}/\code{FALSE}) whether a ward or department is an Intensive Care Unit (ICU)}

\item{col_keyantimicrobials}{(only useful when \code{method = "phenotype-based"}) column name of the key antimicrobials to determine first (weighted) isolates, see \code{\link[=key_antimicrobials]{key_antimicrobials()}}. Defaults to the first column that starts with 'key' followed by 'ab' or 'antibiotics' or 'antimicrobials' (case insensitive). Use \code{col_keyantimicrobials = FALSE} to prevent this. Can also be the output of \code{\link[=key_antimicrobials]{key_antimicrobials()}}.}

\item{episode_days}{episode in days after which a genus/species combination will be determined as 'first isolate' again. The default of 365 days is based on the guideline by CLSI, see \emph{Source}.}

\item{testcodes_exclude}{a \link{character} vector with test codes that should be excluded (case-insensitive)}

\item{icu_exclude}{a \link{logical} to indicate whether ICU isolates should be excluded (rows with value \code{TRUE} in the column set with \code{col_icu})}

\item{specimen_group}{value in the column set with \code{col_specimen} to filter on}

\item{type}{type to determine weighted isolates; can be \code{"keyantimicrobials"} or \code{"points"}, see \emph{Details}}

\item{method}{the method to apply, either \code{"phenotype-based"}, \code{"episode-based"}, \code{"patient-based"} or \code{"isolate-based"} (can be abbreviated), see \emph{Details}. The default is \code{"phenotype-based"} if antimicrobial test results are present in the data, and \code{"episode-based"} otherwise.}

\item{ignore_I}{\link{logical} to indicate whether antibiotic interpretations with \code{"I"} will be ignored when \code{type = "keyantimicrobials"}, see \emph{Details}}

\item{points_threshold}{minimum number of points to require before differences in the antibiogram will lead to inclusion of an isolate when \code{type = "points"}, see \emph{Details}}

\item{info}{a \link{logical} to indicate whether info should be printed, defaults to \code{TRUE} only in interactive mode}

\item{include_unknown}{a \link{logical} to indicate whether 'unknown' microorganisms should be included too, i.e. microbial code \code{"UNKNOWN"}, which defaults to \code{FALSE}. For WHONET users, this means that all records with organism code \code{"con"} (\emph{contamination}) will be excluded by default. Isolates with a microbial ID of \code{NA} will always be excluded as first isolate.}

\item{include_untested_rsi}{a \link{logical} to indicate whether rows without antibiotic results are still eligible for becoming a first isolate. Use \code{include_untested_rsi = FALSE} to always return \code{FALSE} for such rows. This checks the data set for columns of class \verb{<rsi>} and consequently requires transforming columns with antibiotic results using \code{\link[=as.rsi]{as.rsi()}} first.}

\item{...}{arguments passed on to \code{\link[=first_isolate]{first_isolate()}} when using \code{\link[=filter_first_isolate]{filter_first_isolate()}}, otherwise arguments passed on to \code{\link[=key_antimicrobials]{key_antimicrobials()}} (such as \code{universal}, \code{gram_negative}, \code{gram_positive})}
}
\value{
A \code{\link{logical}} vector
}
\description{
Determine first (weighted) isolates of all microorganisms of every patient per episode and (if needed) per specimen type. These functions support all four methods as summarised by Hindler \emph{et al.} in 2007 (\doi{10.1086/511864}). To determine patient episodes not necessarily based on microorganisms, use \code{\link[=is_new_episode]{is_new_episode()}} that also supports grouping with the \code{dplyr} package.
}
\details{
To conduct epidemiological analyses on antimicrobial resistance data, only so-called first isolates should be included to prevent overestimation and underestimation of antimicrobial resistance. Different methods can be used to do so, see below.

These functions are context-aware. This means that the \code{x} argument can be left blank, see \emph{Examples}.

The \code{\link[=first_isolate]{first_isolate()}} function is a wrapper around the \code{\link[=is_new_episode]{is_new_episode()}} function, but more efficient for data sets containing microorganism codes or names.

All isolates with a microbial ID of \code{NA} will be excluded as first isolate.
\subsection{Different methods}{

According to Hindler \emph{et al.} (2007, \doi{10.1086/511864}), there are different methods (algorithms) to select first isolates with increasing reliability: isolate-based, patient-based, episode-based and phenotype-based. All methods select on a combination of the taxonomic genus and species (not subspecies).

All mentioned methods are covered in the \code{\link[=first_isolate]{first_isolate()}} function:\tabular{ll}{
   \strong{Method} \tab \strong{Function to apply} \cr
   \strong{Isolate-based} \tab \code{first_isolate(x, method = "isolate-based")} \cr
   \emph{(= all isolates)} \tab  \cr
    \tab  \cr
    \tab  \cr
   \strong{Patient-based} \tab \code{first_isolate(x, method = "patient-based")} \cr
   \emph{(= first isolate per patient)} \tab  \cr
    \tab  \cr
    \tab  \cr
   \strong{Episode-based} \tab \code{first_isolate(x, method = "episode-based")}, or: \cr
   \emph{(= first isolate per episode)} \tab  \cr
   - 7-Day interval from initial isolate \tab - \code{first_isolate(x, method = "e", episode_days = 7)} \cr
   - 30-Day interval from initial isolate \tab - \code{first_isolate(x, method = "e", episode_days = 30)} \cr
    \tab  \cr
    \tab  \cr
   \strong{Phenotype-based} \tab \code{first_isolate(x, method = "phenotype-based")}, or: \cr
   \emph{(= first isolate per phenotype)} \tab  \cr
   - Major difference in any antimicrobial result \tab - \code{first_isolate(x, type = "points")} \cr
   - Any difference in key antimicrobial results \tab - \code{first_isolate(x, type = "keyantimicrobials")} \cr
}

\subsection{Isolate-based}{

This method does not require any selection, as all isolates should be included. It does, however, respect all arguments set in the \code{\link[=first_isolate]{first_isolate()}} function. For example, the default setting for \code{include_unknown} (\code{FALSE}) will omit selection of rows without a microbial ID.
}

\subsection{Patient-based}{

To include every genus-species combination per patient once, set the \code{episode_days} to \code{Inf}. Although often inappropriate, this method makes sure that no duplicate isolates are selected from the same patient. In a large longitudinal data set, this could mean that isolates are \emph{excluded} that were found years after the initial isolate.
}

\subsection{Episode-based}{

To include every genus-species combination per patient episode once, set the \code{episode_days} to a sensible number of days. Depending on the type of analysis, this could be 14, 30, 60 or 365. Short episodes are common for analysing specific hospital or ward data, long episodes are common for analysing regional and national data.

This is the most common method to correct for duplicate isolates. Patients are categorised into episodes based on their ID and dates (e.g., the date of specimen receipt or laboratory result). While this is a common method, it does not take into account antimicrobial test results. This means that e.g. a methicillin-resistant \emph{Staphylococcus aureus} (MRSA) isolate cannot be differentiated from a wildtype \emph{Staphylococcus aureus} isolate.
}

\subsection{Phenotype-based}{

This is a more reliable method, since it also \emph{weighs} the antibiogram (antimicrobial test results) yielding so-called 'first weighted isolates'. There are two different methods to weigh the antibiogram:
\enumerate{
\item Using \code{type = "points"} and argument \code{points_threshold}

This method weighs \emph{all} antimicrobial agents available in the data set. Any difference from I to S or R (or vice versa) counts as 0.5 points, a difference from S to R (or vice versa) counts as 1 point. When the sum of points exceeds \code{points_threshold}, which defaults to \code{2}, an isolate will be selected as a first weighted isolate.

All antimicrobials are internally selected using the \code{\link[=all_antimicrobials]{all_antimicrobials()}} function. The output of this function does not need to be passed to the \code{\link[=first_isolate]{first_isolate()}} function.
\item Using \code{type = "keyantimicrobials"} and argument \code{ignore_I}

This method only weighs specific antimicrobial agents, called \emph{key antimicrobials}. Any difference from S to R (or vice versa) in these key antimicrobials will select an isolate as a first weighted isolate. With \code{ignore_I = FALSE}, also differences from I to S or R (or vice versa) will lead to this.

Key antimicrobials are internally selected using the \code{\link[=key_antimicrobials]{key_antimicrobials()}} function, but can also be added manually as a variable to the data and set in the \code{col_keyantimicrobials} argument. Another option is to pass the output of the \code{\link[=key_antimicrobials]{key_antimicrobials()}} function directly to the \code{col_keyantimicrobials} argument.
}

The default method is phenotype-based (using \code{type = "points"}) and episode-based (using \code{episode_days = 365}). This makes sure that every genus-species combination is selected per patient once per year, while taking into account all antimicrobial test results. If no antimicrobial test results are available in the data set, only the episode-based method is applied by default.
}

}
}
\section{Stable Lifecycle}{

\if{html}{\figure{lifecycle_stable.svg}{options: style=margin-bottom:5px} \cr}
The \link[=lifecycle]{lifecycle} of this function is \strong{stable}. In a stable function, major changes are unlikely. This means that the underlying code will generally evolve by adding new arguments; removing arguments or changing the meaning of existing arguments will be avoided.

If the underlying code needs breaking changes, they will occur gradually. For example, an argument will be deprecated and first continue to work, but will emit a message informing you of the change. Next, typically after at least one newly released version on CRAN, the message will be transformed to an error.
}

\section{Read more on Our Website!}{

On our website \url{https://msberends.github.io/AMR/} you can find \href{https://msberends.github.io/AMR/articles/AMR.html}{a comprehensive tutorial} about how to conduct AMR data analysis, the \href{https://msberends.github.io/AMR/reference/}{complete documentation of all functions} and \href{https://msberends.github.io/AMR/articles/WHONET.html}{an example analysis using WHONET data}. As we would like to better understand the backgrounds and needs of our users, please \href{https://msberends.github.io/AMR/survey.html}{participate in our survey}!
}

\examples{
# `example_isolates` is a data set available in the AMR package.
# See ?example_isolates.

example_isolates[first_isolate(example_isolates), ]
\donttest{
# faster way, only works in R 3.2 and later:
example_isolates[first_isolate(), ]

# get all first Gram-negatives
example_isolates[which(first_isolate() & mo_is_gram_negative()), ]

if (require("dplyr")) {
  # filter on first isolates using dplyr:
  example_isolates \%>\%
    filter(first_isolate())
 
  # short-hand version:
  example_isolates \%>\%
    filter_first_isolate()
    
 # grouped determination of first isolates (also prints group names):
 example_isolates \%>\%
   group_by(hospital_id) \%>\%
   mutate(first = first_isolate())
  
  # now let's see if first isolates matter:
  A <- example_isolates \%>\%
    group_by(hospital_id) \%>\%
    summarise(count = n_rsi(GEN),            # gentamicin availability
              resistance = resistance(GEN))  # gentamicin resistance
 
  B <- example_isolates \%>\%
    filter_first_isolate() \%>\%               # the 1st isolate filter
    group_by(hospital_id) \%>\%
    summarise(count = n_rsi(GEN),            # gentamicin availability
              resistance = resistance(GEN))  # gentamicin resistance
 
  # Have a look at A and B.
  # B is more reliable because every isolate is counted only once.
  # Gentamicin resistance in hospital D appears to be 4.2\% higher than
  # when you (erroneously) would have used all isolates for analysis.
}
}
}
\seealso{
\code{\link[=key_antimicrobials]{key_antimicrobials()}}
}
-												first commit

											
										
										
											2018-02-21 11:52:31 +01:00
+								% Generated by roxygen2: do not edit by hand
-												new class bactid

											
										
										
											2018-07-23 14:14:03 +02:00
+								% Please edit documentation in R/first_isolate.R
-												first commit

											
										
										
											2018-02-21 11:52:31 +01:00
+								\name{first_isolate}
 								\alias{first_isolate}
-												dplyr 0.8.0 support, fixes #7

											
										
										
											2018-12-22 22:39:34 +01:00
+								\alias{filter_first_isolate}
-												(v1.5.0.9006) major documentation update

											
										
										
											2021-01-18 16:57:56 +01:00
+								\title{Determine First (Weighted) Isolates}
-												more unit tests

											
										
										
											2018-04-20 13:45:34 +02:00
+								\source{
-												(v1.1.0.9004) lose dependencies

											
										
										
											2020-05-16 13:05:47 +02:00
+								Methodology of this function is strictly based on:
-												(v1.6.0.9013) website update

											
										
										
											2021-04-29 17:16:30 +02:00
+								\itemize{
 								\item \strong{M39 Analysis and Presentation of Cumulative Antimicrobial Susceptibility Test Data, 4th Edition}, 2014, \emph{Clinical and Laboratory Standards Institute (CLSI)}. \url{https://clsi.org/standards/products/microbiology/documents/m39/}.
 								\item Hindler JF and Stelling J (2007). \strong{Analysis and Presentation of Cumulative Antibiograms: A New Consensus Guideline from the Clinical and Laboratory Standards Institute.} Clinical Infectious Diseases, 44(6), 867–873. \doi{10.1086/511864}
 								}
-												more unit tests

											
										
										
											2018-04-20 13:45:34 +02:00
+								}
-												first commit

											
										
										
											2018-02-21 11:52:31 +01:00
+								\usage{
-												(v0.8.0.9036) complete documentation rewrite

											
										
										
											2019-11-28 22:32:17 +01:00
+								first_isolate(
-												(v1.5.0.9016) only_rsi_columns update, documentation

											
										
										
											2021-02-08 14:18:42 +01:00
+								  x = NULL,
-												(v0.8.0.9036) complete documentation rewrite

											
										
										
											2019-11-28 22:32:17 +01:00
+								  col_date = NULL,
 								  col_patient_id = NULL,
 								  col_mo = NULL,
 								  col_testcode = NULL,
 								  col_specimen = NULL,
 								  col_icu = NULL,
-												(v1.6.0.9010) big first_isolate() update

											
										
										
											2021-04-26 23:57:37 +02:00
+								  col_keyantimicrobials = NULL,
-												(v0.8.0.9036) complete documentation rewrite

											
										
										
											2019-11-28 22:32:17 +01:00
+								  episode_days = 365,
 								  testcodes_exclude = NULL,
 								  icu_exclude = FALSE,
 								  specimen_group = NULL,
-												(v1.6.0.9010) big first_isolate() update

											
										
										
											2021-04-26 23:57:37 +02:00
+								  type = "points",
 								  method = c("phenotype-based", "episode-based", "patient-based", "isolate-based"),
-												(v0.8.0.9036) complete documentation rewrite

											
										
										
											2019-11-28 22:32:17 +01:00
+								  ignore_I = TRUE,
 								  points_threshold = 2,
-												(v1.0.0.9005) info printing only in interactive mode

											
										
										
											2020-02-21 21:13:38 +01:00
+								  info = interactive(),
-												(v0.8.0.9036) complete documentation rewrite

											
										
										
											2019-11-28 22:32:17 +01:00
+								  include_unknown = FALSE,
-												(v1.5.0.9039) handle first isolates for missing antibiograms

											
										
										
											2021-03-08 02:38:32 +01:00
+								  include_untested_rsi = TRUE,
-												(v0.8.0.9036) complete documentation rewrite

											
										
										
											2019-11-28 22:32:17 +01:00
+								  ...
 								)
 								filter_first_isolate(
-												(v1.5.0.9016) only_rsi_columns update, documentation

											
										
										
											2021-02-08 14:18:42 +01:00
+								  x = NULL,
-												(v0.8.0.9036) complete documentation rewrite

											
										
										
											2019-11-28 22:32:17 +01:00
+								  col_date = NULL,
 								  col_patient_id = NULL,
 								  col_mo = NULL,
-												(v1.6.0.9013) website update

											
										
										
											2021-04-29 17:16:30 +02:00
+								  episode_days = 365,
 								  method = c("phenotype-based", "episode-based", "patient-based", "isolate-based"),
-												(v0.8.0.9036) complete documentation rewrite

											
										
										
											2019-11-28 22:32:17 +01:00
+								  ...
 								)
-												first commit

											
										
										
											2018-02-21 11:52:31 +01:00
+								}
 								\arguments{
-												(v1.5.0.9016) only_rsi_columns update, documentation

											
										
										
											2021-02-08 14:18:42 +01:00
+								\item{x}{a \link{data.frame} containing isolates. Can be left blank for automatic determination, see \emph{Examples}.}
-												first commit

											
										
										
											2018-02-21 11:52:31 +01:00
-												(v1.4.0.9024) is_new_episode()

											
										
										
											2020-11-17 16:57:41 +01:00
+								\item{col_date}{column name of the result date (or date that is was received on the lab), defaults to the first column with a date class}
-												first commit

											
										
										
											2018-02-21 11:52:31 +01:00
-												keyab automatic

											
										
										
											2018-12-10 15:14:29 +01:00
+								\item{col_patient_id}{column name of the unique IDs of the patients, defaults to the first column that starts with 'patient' or 'patid' (case insensitive)}
-												first commit

											
										
										
											2018-02-21 11:52:31 +01:00
-												(v0.8.0.9036) complete documentation rewrite

											
										
										
											2019-11-28 22:32:17 +01:00
+								\item{col_mo}{column name of the IDs of the microorganisms (see \code{\link[=as.mo]{as.mo()}}), defaults to the first column of class \code{\link{mo}}. Values will be coerced using \code{\link[=as.mo]{as.mo()}}.}
-												first commit

											
										
										
											2018-02-21 11:52:31 +01:00
-												(v1.4.0.9041) updates based on review

											
										
										
											2020-12-17 16:22:25 +01:00
+								\item{col_testcode}{column name of the test codes. Use \code{col_testcode = NULL} to \strong{not} exclude certain test codes (such as test codes for screening). In that case \code{testcodes_exclude} will be ignored.}
-												first commit

											
										
										
											2018-02-21 11:52:31 +01:00
-												fix clipboard on linux

											
										
										
											2018-04-02 11:11:21 +02:00
+								\item{col_specimen}{column name of the specimen type or group}
-												first commit

											
										
										
											2018-02-21 11:52:31 +01:00
-												fix clipboard on linux

											
										
										
											2018-04-02 11:11:21 +02:00
+								\item{col_icu}{column name of the logicals (\code{TRUE}/\code{FALSE}) whether a ward or department is an Intensive Care Unit (ICU)}
-												first commit

											
										
										
											2018-02-21 11:52:31 +01:00
-												(v1.6.0.9010) big first_isolate() update

											
										
										
											2021-04-26 23:57:37 +02:00
+								\item{col_keyantimicrobials}{(only useful when \code{method = "phenotype-based"}) column name of the key antimicrobials to determine first (weighted) isolates, see \code{\link[=key_antimicrobials]{key_antimicrobials()}}. Defaults to the first column that starts with 'key' followed by 'ab' or 'antibiotics' or 'antimicrobials' (case insensitive). Use \code{col_keyantimicrobials = FALSE} to prevent this. Can also be the output of \code{\link[=key_antimicrobials]{key_antimicrobials()}}.}
-												first commit

											
										
										
											2018-02-21 11:52:31 +01:00
-												(v1.5.0.9006) major documentation update

											
										
										
											2021-01-18 16:57:56 +01:00
+								\item{episode_days}{episode in days after which a genus/species combination will be determined as 'first isolate' again. The default of 365 days is based on the guideline by CLSI, see \emph{Source}.}
-												first commit

											
										
										
											2018-02-21 11:52:31 +01:00
-												(v1.6.0.9021) join functions update

											
										
										
											2021-05-12 18:15:03 +02:00
+								\item{testcodes_exclude}{a \link{character} vector with test codes that should be excluded (case-insensitive)}
-												first commit

											
										
										
											2018-02-21 11:52:31 +01:00
-												(v1.6.0.9021) join functions update

											
										
										
											2021-05-12 18:15:03 +02:00
+								\item{icu_exclude}{a \link{logical} to indicate whether ICU isolates should be excluded (rows with value \code{TRUE} in the column set with \code{col_icu})}
-												first commit

											
										
										
											2018-02-21 11:52:31 +01:00
-												(v1.4.0.9043) documentation update

											
										
										
											2020-12-22 00:51:17 +01:00
+								\item{specimen_group}{value in the column set with \code{col_specimen} to filter on}
-												first commit

											
										
										
											2018-02-21 11:52:31 +01:00
-												(v1.6.0.9010) big first_isolate() update

											
										
										
											2021-04-26 23:57:37 +02:00
+								\item{type}{type to determine weighed isolates; can be \code{"keyantimicrobials"} or \code{"points"}, see \emph{Details}}
-												- Added new algorithm to determine weighted isolates, can now be `points` or `keyantibiotics, see `?first_isolate`
- Function `first_isolate` supports tidyverse-like evaluation of parameters (no need to quote them anymore)
- Functions `as.rsi` and `as.mic` now add the package name and version as attribute

											
										
										
											2018-03-19 20:39:23 +01:00
-												(v1.6.0.9013) website update

											
										
										
											2021-04-29 17:16:30 +02:00
+								\item{method}{the method to apply, either \code{"phenotype-based"}, \code{"episode-based"}, \code{"patient-based"} or \code{"isolate-based"} (can be abbreviated), see \emph{Details}. The default is \code{"phenotype-based"} if antimicrobial test results are present in the data, and \code{"episode-based"} otherwise.}
-												- Added new algorithm to determine weighted isolates, can now be `points` or `keyantibiotics, see `?first_isolate`
- Function `first_isolate` supports tidyverse-like evaluation of parameters (no need to quote them anymore)
- Functions `as.rsi` and `as.mic` now add the package name and version as attribute

											
										
										
											2018-03-19 20:39:23 +01:00
-												(v1.6.0.9021) join functions update

											
										
										
											2021-05-12 18:15:03 +02:00
+								\item{ignore_I}{\link{logical} to indicate whether antibiotic interpretations with \code{"I"} will be ignored when \code{type = "keyantimicrobials"}, see \emph{Details}}
-												(v1.6.0.9010) big first_isolate() update

											
										
										
											2021-04-26 23:57:37 +02:00
 								\item{points_threshold}{minimum number of points to require before differences in the antibiogram will lead to inclusion of an isolate when \code{type = "points"}, see \emph{Details}}
-												first commit

											
										
										
											2018-02-21 11:52:31 +01:00
-												(v1.6.0.9009) key_antibiotics update

											
										
										
											2021-04-23 16:13:26 +02:00
+								\item{info}{a \link{logical} to indicate info should be printed, defaults to \code{TRUE} only in interactive mode}
-												- For functions `first_isolate`, `EUCAST_rules` the antibiotic column names are case-insensitive
- Functions `first_isolate`, `EUCAST_rules` and `rsi_predict` supports tidyverse-like evaluation of parameters (no need to quote columns them anymore)
- Functions `clipboard_import` and `clipboard_export` as helper functions to quickly copy and paste from/to software like Excel and SPSS
- Renamed dataset `bactlist` to `microorganisms`

											
										
										
											2018-03-23 14:46:02 +01:00
-												(v1.6.0.9021) join functions update

											
										
										
											2021-05-12 18:15:03 +02:00
+								\item{include_unknown}{a \link{logical} to indicate whether 'unknown' microorganisms should be included too, i.e. microbial code \code{"UNKNOWN"}, which defaults to \code{FALSE}. For WHONET users, this means that all records with organism code \code{"con"} (\emph{contamination}) will be excluded at default. Isolates with a microbial ID of \code{NA} will always be excluded as first isolate.}
-												(v1.5.0.9039) handle first isolates for missing antibiograms

											
										
										
											2021-03-08 02:38:32 +01:00
-												(v1.6.0.9021) join functions update

											
										
										
											2021-05-12 18:15:03 +02:00
+								\item{include_untested_rsi}{a \link{logical} to indicate whether also rows without antibiotic results are still eligible for becoming a first isolate. Use \code{include_untested_rsi = FALSE} to always return \code{FALSE} for such rows. This checks the data set for columns of class \verb{<rsi>} and consequently requires transforming columns with antibiotic results using \code{\link[=as.rsi]{as.rsi()}} first.}
-												(v0.7.1.9031) include_unknown for first_isolate()

											
										
										
											2019-08-08 22:39:42 +02:00
-												(v1.6.0.9013) website update

											
										
										
											2021-04-29 17:16:30 +02:00
+								\item{...}{arguments passed on to \code{\link[=first_isolate]{first_isolate()}} when using \code{\link[=filter_first_isolate]{filter_first_isolate()}}, otherwise arguments passed on to \code{\link[=key_antimicrobials]{key_antimicrobials()}} (such as \code{universal}, \code{gram_negative}, \code{gram_positive})}
-												first commit

											
										
										
											2018-02-21 11:52:31 +01:00
+								}
 								\value{
-												(v0.8.0.9036) complete documentation rewrite

											
										
										
											2019-11-28 22:32:17 +01:00
+								A \code{\link{logical}} vector
-												first commit

											
										
										
											2018-02-21 11:52:31 +01:00
+								}
 								\description{
-												(v1.6.0.9013) website update

											
										
										
											2021-04-29 17:16:30 +02:00
+								Determine first (weighted) isolates of all microorganisms of every patient per episode and (if needed) per specimen type. These functions support all four methods as summarised by Hindler \emph{et al.} in 2007 (\doi{10.1086/511864}). To determine patient episodes not necessarily based on microorganisms, use \code{\link[=is_new_episode]{is_new_episode()}} that also supports grouping with the \code{dplyr} package.
-												first commit

											
										
										
											2018-02-21 11:52:31 +01:00
+								}
 								\details{
-												(v1.6.0.9013) website update

											
										
										
											2021-04-29 17:16:30 +02:00
+								To conduct epidemiological analyses on antimicrobial resistance data, only so-called first isolates should be included to prevent overestimation and underestimation of antimicrobial resistance. Different methods can be used to do so, see below.
-												(v1.6.0.9010) big first_isolate() update

											
										
										
											2021-04-26 23:57:37 +02:00
-												(v1.5.0.9010) MDRO vignette update, get_episode for < day

											
										
										
											2021-01-24 14:48:56 +01:00
+								These functions are context-aware. This means that then the \code{x} argument can be left blank, see \emph{Examples}.
-												(v1.4.0.9032) auto-data guessing for functions

											
										
										
											2020-12-07 16:06:42 +01:00
-												(v1.4.0.9025) is_new_episode()

											
										
										
											2020-11-23 21:50:27 +01:00
+								The \code{\link[=first_isolate]{first_isolate()}} function is a wrapper around the \code{\link[=is_new_episode]{is_new_episode()}} function, but more efficient for data sets containing microorganism codes or names.
-												dplyr 0.8.0 support, fixes #7

											
										
										
											2018-12-22 22:39:34 +01:00
-												(v0.7.1.9031) include_unknown for first_isolate()

											
										
										
											2019-08-08 22:39:42 +02:00
+								All isolates with a microbial ID of \code{NA} will be excluded as first isolate.
-												(v1.6.0.9013) website update

											
										
										
											2021-04-29 17:16:30 +02:00
+								\subsection{Different methods}{
-												(v1.4.0.9024) is_new_episode()

											
										
										
											2020-11-17 16:57:41 +01:00
-												(v1.6.0.9013) website update

											
										
										
											2021-04-29 17:16:30 +02:00
+								According to Hindler \emph{et al.} (2007, \doi{10.1086/511864}), there are different methods (algorithms) to select first isolates with increasing reliability: isolate-based, patient-based, episode-based and phenotype-based. All methods select on a combination of the taxonomic genus and species (not subspecies).
-												(v1.4.0.9024) is_new_episode()

											
										
										
											2020-11-17 16:57:41 +01:00
-												(v1.6.0.9013) website update

											
										
										
											2021-04-29 17:16:30 +02:00
+								All mentioned methods are covered in the \code{\link[=first_isolate]{first_isolate()}} function:\tabular{ll}{
 								   \strong{Method} \tab \strong{Function to apply} \cr
 								   \strong{Isolate-based} \tab \code{first_isolate(x, method = "isolate-based")} \cr
-												(v1.6.0.9010) big first_isolate() update

											
										
										
											2021-04-26 23:57:37 +02:00
+								   \emph{(= all isolates)} \tab  \cr
 								    \tab  \cr
 								    \tab  \cr
-												(v1.6.0.9013) website update

											
										
										
											2021-04-29 17:16:30 +02:00
+								   \strong{Patient-based} \tab \code{first_isolate(x, method = "patient-based")} \cr
-												(v1.6.0.9010) big first_isolate() update

											
										
										
											2021-04-26 23:57:37 +02:00
+								   \emph{(= first isolate per patient)} \tab  \cr
 								    \tab  \cr
 								    \tab  \cr
-												(v1.6.0.9013) website update

											
										
										
											2021-04-29 17:16:30 +02:00
+								   \strong{Episode-based} \tab \code{first_isolate(x, method = "episode-based")}, or: \cr
-												(v1.6.0.9010) big first_isolate() update

											
										
										
											2021-04-26 23:57:37 +02:00
+								   \emph{(= first isolate per episode)} \tab  \cr
 								   - 7-Day interval from initial isolate \tab - \code{first_isolate(x, method = "e", episode_days = 7)} \cr
 								   - 30-Day interval from initial isolate \tab - \code{first_isolate(x, method = "e", episode_days = 30)} \cr
 								    \tab  \cr
 								    \tab  \cr
-												(v1.6.0.9013) website update

											
										
										
											2021-04-29 17:16:30 +02:00
+								   \strong{Phenotype-based} \tab \code{first_isolate(x, method = "phenotype-based")}, or: \cr
-												(v1.6.0.9010) big first_isolate() update

											
										
										
											2021-04-26 23:57:37 +02:00
+								   \emph{(= first isolate per phenotype)} \tab  \cr
 								   - Major difference in any antimicrobial result \tab - \code{first_isolate(x, type = "points")} \cr
 								   - Any difference in key antimicrobial results \tab - \code{first_isolate(x, type = "keyantimicrobials")} \cr
 								}
-												(v0.7.1.9031) include_unknown for first_isolate()

											
										
										
											2019-08-08 22:39:42 +02:00
-												(v1.6.0.9010) big first_isolate() update

											
										
										
											2021-04-26 23:57:37 +02:00
+								\subsection{Isolate-based}{
-												(v1.4.0.9024) is_new_episode()

											
										
										
											2020-11-17 16:57:41 +01:00
-												(v1.6.0.9013) website update

											
										
										
											2021-04-29 17:16:30 +02:00
+								This method does not require any selection, as all isolates should be included. It does, however, respect all arguments set in the \code{\link[=first_isolate]{first_isolate()}} function. For example, the default setting for \code{include_unknown} (\code{FALSE}) will omit selection of rows without a microbial ID.
-												dplyr 0.8.0 support, fixes #7

											
										
										
											2018-12-22 22:39:34 +01:00
+								}
-												(v0.8.0.9036) complete documentation rewrite

											
										
										
											2019-11-28 22:32:17 +01:00
-												(v1.6.0.9010) big first_isolate() update

											
										
										
											2021-04-26 23:57:37 +02:00
+								\subsection{Patient-based}{
-												(v1.6.0.9013) website update

											
										
										
											2021-04-29 17:16:30 +02:00
+								To include every genus-species combination per patient once, set the \code{episode_days} to \code{Inf}. Although often inappropriate, this method makes sure that no duplicate isolates are selected from the same patient. In a large longitudinal data set, this could mean that isolates are \emph{excluded} that were found years after the initial isolate.
-												new algorithm key abs

											
										
										
											2018-07-17 13:02:05 +02:00
+								}
-												(v1.6.0.9010) big first_isolate() update

											
										
										
											2021-04-26 23:57:37 +02:00
 								\subsection{Episode-based}{
 								To include every genus-species combination per patient episode once, set the \code{episode_days} to a sensible number of days. Depending on the type of analysis, this could be 14, 30, 60 or 365. Short episodes are common for analysing specific hospital or ward data, long episodes are common for analysing regional and national data.
-												(v1.6.0.9013) website update

											
										
										
											2021-04-29 17:16:30 +02:00
+								This is the most common method to correct for duplicate isolates. Patients are categorised into episodes based on their ID and dates (e.g., the date of specimen receipt or laboratory result). While this is a common method, it does not take into account antimicrobial test results. This means that e.g. a methicillin-resistant \emph{Staphylococcus aureus} (MRSA) isolate cannot be differentiated from a wildtype \emph{Staphylococcus aureus} isolate.
-												(v1.4.0.9024) is_new_episode()

											
										
										
											2020-11-17 16:57:41 +01:00
+								}
-												new algorithm key abs

											
										
										
											2018-07-17 13:02:05 +02:00
-												(v1.6.0.9010) big first_isolate() update

											
										
										
											2021-04-26 23:57:37 +02:00
+								\subsection{Phenotype-based}{
-												add MIC values
add badges to readme

											
										
										
											2018-03-13 11:57:30 +01:00
-												(v1.6.0.9013) website update

											
										
										
											2021-04-29 17:16:30 +02:00
+								This is a more reliable method, since it also \emph{weighs} the antibiogram (antimicrobial test results) yielding so-called 'first weighted isolates'. There are two different methods to weigh the antibiogram:
-												(v1.6.0.9010) big first_isolate() update

											
										
										
											2021-04-26 23:57:37 +02:00
+								\enumerate{
-												(v1.4.0.9043) documentation update

											
										
										
											2020-12-22 00:51:17 +01:00
+								\item Using \code{type = "points"} and argument \code{points_threshold}
-												new algorithm key abs

											
										
										
											2018-07-17 13:02:05 +02:00
-												(v1.6.0.9010) big first_isolate() update

											
										
										
											2021-04-26 23:57:37 +02:00
+								This method weighs \emph{all} antimicrobial agents available in the data set. Any difference from I to S or R (or vice versa) counts as 0.5 points, a difference from S to R (or vice versa) counts as 1 point. When the sum of points exceeds \code{points_threshold}, which defaults to \code{2}, an isolate will be selected as a first weighted isolate.
 								All antimicrobials are internally selected using the \code{\link[=all_antimicrobials]{all_antimicrobials()}} function. The output of this function does not need to be passed to the \code{\link[=first_isolate]{first_isolate()}} function.
 								\item Using \code{type = "keyantimicrobials"} and argument \code{ignore_I}
 								This method only weighs specific antimicrobial agents, called \emph{key antimicrobials}. Any difference from S to R (or vice versa) in these key antimicrobials will select an isolate as a first weighted isolate. With \code{ignore_I = FALSE}, also differences from I to S or R (or vice versa) will lead to this.
 								Key antimicrobials are internally selected using the \code{\link[=key_antimicrobials]{key_antimicrobials()}} function, but can also be added manually as a variable to the data and set in the \code{col_keyantimicrobials} argument. Another option is to pass the output of the \code{\link[=key_antimicrobials]{key_antimicrobials()}} function directly to the \code{col_keyantimicrobials} argument.
-												(v0.8.0.9036) complete documentation rewrite

											
										
										
											2019-11-28 22:32:17 +01:00
+								}
-												(v1.6.0.9010) big first_isolate() update

											
										
										
											2021-04-26 23:57:37 +02:00
-												(v1.6.0.9013) website update

											
										
										
											2021-04-29 17:16:30 +02:00
+								The default method is phenotype-based (using \code{type = "points"}) and episode-based (using \code{episode_days = 365}). This makes sure that every genus-species combination is selected per patient once per year, while taking into account all antimicrobial test results. If no antimicrobial test results are available in the data set, only the episode-based method is applied by default.
-												first commit

											
										
										
											2018-02-21 11:52:31 +01:00
+								}
-												new algorithm key abs

											
										
										
											2018-07-17 13:02:05 +02:00
-												(v1.6.0.9010) big first_isolate() update

											
										
										
											2021-04-26 23:57:37 +02:00
+								}
 								}
-												(v1.5.0.9006) major documentation update

											
										
										
											2021-01-18 16:57:56 +01:00
+								\section{Stable Lifecycle}{
-												(v1.0.0.9007) small doc fix

											
										
										
											2020-02-22 17:03:47 +01:00
 								\if{html}{\figure{lifecycle_stable.svg}{options: style=margin-bottom:5px} \cr}
-												(v1.2.0.9026) move to github

											
										
										
											2020-07-08 14:48:06 +02:00
+								The \link[=lifecycle]{lifecycle} of this function is \strong{stable}. In a stable function, major changes are unlikely. This means that the underlying code will generally evolve by adding new arguments; removing arguments or changing the meaning of existing arguments will be avoided.
-												(v1.0.0.9007) small doc fix

											
										
										
											2020-02-22 17:03:47 +01:00
-												(v1.4.0.9043) documentation update

											
										
										
											2020-12-22 00:51:17 +01:00
+								If the underlying code needs breaking changes, they will occur gradually. For example, an argument will be deprecated and first continue to work, but will emit a message informing you of the change. Next, typically after at least one newly released version on CRAN, the message will be transformed to an error.
-												(v1.0.0.9007) small doc fix

											
										
										
											2020-02-22 17:03:47 +01:00
+								}
-												(v1.5.0.9006) major documentation update

											
										
										
											2021-01-18 16:57:56 +01:00
+								\section{Read more on Our Website!}{
-												big website update, licence txt update

											
										
										
											2019-01-02 23:24:07 +01:00
-												(v1.5.0.9014) only_rsi_columns, is.rsi.eligible improvement

											
										
										
											2021-02-02 23:57:35 +01:00
+								On our website \url{https://msberends.github.io/AMR/} you can find \href{https://msberends.github.io/AMR/articles/AMR.html}{a comprehensive tutorial} about how to conduct AMR data analysis, the \href{https://msberends.github.io/AMR/reference/}{complete documentation of all functions} and \href{https://msberends.github.io/AMR/articles/WHONET.html}{an example analysis using WHONET data}. As we would like to better understand the backgrounds and needs of our users, please \href{https://msberends.github.io/AMR/survey.html}{participate in our survey}!
-												big website update, licence txt update

											
										
										
											2019-01-02 23:24:07 +01:00
+								}
-												first commit

											
										
										
											2018-02-21 11:52:31 +01:00
+								\examples{
-												(v1.5.0.9010) MDRO vignette update, get_episode for < day

											
										
										
											2021-01-24 14:48:56 +01:00
+								# `example_isolates` is a data set available in the AMR package.
-												(v0.7.1.9063) septic_patients -> example_isolates

											
										
										
											2019-08-27 16:45:42 +02:00
+								# See ?example_isolates.
-												- Added new algorithm to determine weighted isolates, can now be `points` or `keyantibiotics, see `?first_isolate`
- Function `first_isolate` supports tidyverse-like evaluation of parameters (no need to quote them anymore)
- Functions `as.rsi` and `as.mic` now add the package name and version as attribute

											
										
										
											2018-03-19 20:39:23 +01:00
-												(v1.5.0.9016) only_rsi_columns update, documentation

											
										
										
											2021-02-08 14:18:42 +01:00
+								example_isolates[first_isolate(example_isolates), ]
-												(v1.3.0.9035) mdro() for EUCAST 3.2, examples cleanup

											
										
										
											2020-09-29 23:35:46 +02:00
+								\donttest{
-												(v1.5.0.9016) only_rsi_columns update, documentation

											
										
										
											2021-02-08 14:18:42 +01:00
+								# faster way, only works in R 3.2 and later:
 								example_isolates[first_isolate(), ]
-												(v1.5.0.9015) unit test fix, grouped first isolates

											
										
										
											2021-02-04 16:48:16 +01:00
+								# get all first Gram-negatives
 								example_isolates[which(first_isolate() & mo_is_gram_negative()), ]
-												(v1.3.0.9035) mdro() for EUCAST 3.2, examples cleanup

											
										
										
											2020-09-29 23:35:46 +02:00
+								if (require("dplyr")) {
-												(v1.5.0.9015) unit test fix, grouped first isolates

											
										
										
											2021-02-04 16:48:16 +01:00
+								  # filter on first isolates using dplyr:
-												(v1.3.0.9035) mdro() for EUCAST 3.2, examples cleanup

											
										
										
											2020-09-29 23:35:46 +02:00
+								  example_isolates \%>\%
-												(v1.5.0.9015) unit test fix, grouped first isolates

											
										
										
											2021-02-04 16:48:16 +01:00
+								    filter(first_isolate())
-												(v1.3.0.9035) mdro() for EUCAST 3.2, examples cleanup

											
										
										
											2020-09-29 23:35:46 +02:00
-												(v1.6.0.9013) website update

											
										
										
											2021-04-29 17:16:30 +02:00
+								  # short-hand version:
-												(v1.3.0.9035) mdro() for EUCAST 3.2, examples cleanup

											
										
										
											2020-09-29 23:35:46 +02:00
+								  example_isolates \%>\%
 								    filter_first_isolate()
-												(v1.5.0.9015) unit test fix, grouped first isolates

											
										
										
											2021-02-04 16:48:16 +01:00
 								 # grouped determination of first isolates (also prints group names):
 								 example_isolates \%>\%
 								   group_by(hospital_id) \%>\%
 								   mutate(first = first_isolate())
-												(v1.0.1.9009) prepare for next release

											
										
										
											2020-04-15 11:30:28 +02:00
-												(v1.4.0.9024) is_new_episode()

											
										
										
											2020-11-17 16:57:41 +01:00
+								  # now let's see if first isolates matter:
-												(v1.3.0.9035) mdro() for EUCAST 3.2, examples cleanup

											
										
										
											2020-09-29 23:35:46 +02:00
+								  A <- example_isolates \%>\%
 								    group_by(hospital_id) \%>\%
 								    summarise(count = n_rsi(GEN),            # gentamicin availability
 								              resistance = resistance(GEN))  # gentamicin resistance
 								  B <- example_isolates \%>\%
-												(v1.6.0.9013) website update

											
										
										
											2021-04-29 17:16:30 +02:00
+								    filter_first_isolate() \%>\%               # the 1st isolate filter
-												(v1.3.0.9035) mdro() for EUCAST 3.2, examples cleanup

											
										
										
											2020-09-29 23:35:46 +02:00
+								    group_by(hospital_id) \%>\%
 								    summarise(count = n_rsi(GEN),            # gentamicin availability
 								              resistance = resistance(GEN))  # gentamicin resistance
 								  # Have a look at A and B.
 								  # B is more reliable because every isolate is counted only once.
-												(v1.6.0.9010) big first_isolate() update

											
										
										
											2021-04-26 23:57:37 +02:00
+								  # Gentamicin resistance in hospital D appears to be 4.2\% higher than
-												(v1.3.0.9035) mdro() for EUCAST 3.2, examples cleanup

											
										
										
											2020-09-29 23:35:46 +02:00
+								  # when you (erroneously) would have used all isolates for analysis.
 								}
-												first commit

											
										
										
											2018-02-21 11:52:31 +01:00
+								}
 								}
-												new algorithm key abs

											
										
										
											2018-07-17 13:02:05 +02:00
+								\seealso{
-												(v1.6.0.9010) big first_isolate() update

											
										
										
											2021-04-26 23:57:37 +02:00
+								\code{\link[=key_antimicrobials]{key_antimicrobials()}}
-												new algorithm key abs

											
										
										
											2018-07-17 13:02:05 +02:00
+								}