AMR/man/join.Rd

75 lines
2.8 KiB
Plaintext
Raw Normal View History

2018-02-21 11:52:31 +01:00
% Generated by roxygen2: do not edit by hand
2018-07-23 14:14:03 +02:00
% Please edit documentation in R/join_microorganisms.R
2018-02-21 11:52:31 +01:00
\name{join}
\alias{join}
\alias{inner_join_microorganisms}
2018-02-21 11:52:31 +01:00
\alias{inner_join}
\alias{left_join_microorganisms}
\alias{right_join_microorganisms}
\alias{full_join_microorganisms}
\alias{semi_join_microorganisms}
\alias{anti_join_microorganisms}
\title{Join \link{microorganisms} to a Data Set}
2018-02-21 11:52:31 +01:00
\usage{
2018-10-12 16:35:18 +02:00
inner_join_microorganisms(x, by = NULL, suffix = c("2", ""), ...)
2018-02-21 11:52:31 +01:00
2018-10-12 16:35:18 +02:00
left_join_microorganisms(x, by = NULL, suffix = c("2", ""), ...)
2018-02-21 11:52:31 +01:00
2018-10-12 16:35:18 +02:00
right_join_microorganisms(x, by = NULL, suffix = c("2", ""), ...)
2018-02-21 11:52:31 +01:00
2018-10-12 16:35:18 +02:00
full_join_microorganisms(x, by = NULL, suffix = c("2", ""), ...)
2018-02-21 11:52:31 +01:00
2018-10-12 16:35:18 +02:00
semi_join_microorganisms(x, by = NULL, ...)
2018-02-21 11:52:31 +01:00
2018-10-12 16:35:18 +02:00
anti_join_microorganisms(x, by = NULL, ...)
2018-02-21 11:52:31 +01:00
}
\arguments{
2021-05-12 18:15:03 +02:00
\item{x}{existing data set to join, or \link{character} vector. In case of a \link{character} vector, the resulting \link{data.frame} will contain a column 'x' with these values.}
2018-02-21 11:52:31 +01:00
2020-12-17 16:22:25 +01:00
\item{by}{a variable to join by - if left empty will search for a column with class \code{\link{mo}} (created with \code{\link[=as.mo]{as.mo()}}) or will be \code{"mo"} if that column name exists in \code{x}, could otherwise be a column name of \code{x} with values that exist in \code{microorganisms$mo} (such as \code{by = "bacteria_id"}), or another column in \link{microorganisms} (but then it should be named, like \code{by = c("bacteria_id" = "fullname")})}
2018-02-21 11:52:31 +01:00
2021-05-12 18:15:03 +02:00
\item{suffix}{if there are non-joined duplicate variables in \code{x} and \code{y}, these suffixes will be added to the output to disambiguate them. Should be a \link{character} vector of length 2.}
2021-04-29 17:16:30 +02:00
\item{...}{ignored, only in place to allow future extensions}
2018-02-21 11:52:31 +01:00
}
2021-05-12 18:15:03 +02:00
\value{
a \link{data.frame}
}
2018-02-21 11:52:31 +01:00
\description{
2021-05-12 18:15:03 +02:00
Join the data set \link{microorganisms} easily to an existing data set or to a \link{character} vector.
2018-02-21 11:52:31 +01:00
}
\details{
\strong{Note:} As opposed to the \code{join()} functions of \code{dplyr}, \link{character} vectors are supported and at default existing columns will get a suffix \code{"2"} and the newly joined columns will not get a suffix.
2020-05-16 13:05:47 +02:00
If the \code{dplyr} package is installed, their join functions will be used. Otherwise, the much slower \code{\link[=merge]{merge()}} and \code{\link[=interaction]{interaction()}} functions from base \R will be used.
2018-02-21 11:52:31 +01:00
}
2018-02-22 20:48:48 +01:00
\examples{
2018-10-12 16:35:18 +02:00
left_join_microorganisms(as.mo("K. pneumoniae"))
2021-05-12 18:15:03 +02:00
left_join_microorganisms("B_KLBSL_PNMN")
2022-08-28 10:31:50 +02:00
df <- data.frame(
date = seq(
from = as.Date("2018-01-01"),
to = as.Date("2018-01-07"),
by = 1
),
bacteria = as.mo(c(
"S. aureus", "MRSA", "MSSA", "STAAUR",
"E. coli", "E. coli", "E. coli"
)),
stringsAsFactors = FALSE
)
2022-08-27 20:49:37 +02:00
colnames(df)
df_joined <- left_join_microorganisms(df, "bacteria")
colnames(df_joined)
\donttest{
if (require("dplyr")) {
example_isolates \%>\%
2022-08-28 10:31:50 +02:00
left_join_microorganisms() \%>\%
colnames()
}
2018-02-22 20:48:48 +01:00
}
2020-05-16 13:05:47 +02:00
}