mirror of https://github.com/msberends/AMR.git
216 lines
9.4 KiB
R
Executable File
216 lines
9.4 KiB
R
Executable File
# ==================================================================== #
|
|
# TITLE #
|
|
# Antimicrobial Resistance (AMR) Data Analysis for R #
|
|
# #
|
|
# SOURCE #
|
|
# https://github.com/msberends/AMR #
|
|
# #
|
|
# LICENCE #
|
|
# (c) 2018-2022 Berends MS, Luz CF et al. #
|
|
# Developed at the University of Groningen, the Netherlands, in #
|
|
# collaboration with non-profit organisations Certe Medical #
|
|
# Diagnostics & Advice, and University Medical Center Groningen. #
|
|
# #
|
|
# This R package is free software; you can freely use and distribute #
|
|
# it for both personal and commercial purposes under the terms of the #
|
|
# GNU General Public License version 2.0 (GNU GPL-2), as published by #
|
|
# the Free Software Foundation. #
|
|
# We created this package for both routine data analysis and academic #
|
|
# research and it was publicly released in the hope that it will be #
|
|
# useful, but it comes WITHOUT ANY WARRANTY OR LIABILITY. #
|
|
# #
|
|
# Visit our website for the full manual and a complete tutorial about #
|
|
# how to conduct AMR data analysis: https://msberends.github.io/AMR/ #
|
|
# ==================================================================== #
|
|
|
|
#' Translate Strings from the AMR Package
#'
#' For language-dependent output of AMR functions, like [mo_name()], [mo_gramstain()], [mo_type()] and [ab_name()].
#' @param x text to translate
#' @param lang,language language to choose. Use one of these supported language names or ISO-639-1 codes: `r paste0('"', sapply(LANGUAGES_SUPPORTED_NAMES, function(x) x[[1]]), '" ("' , LANGUAGES_SUPPORTED, '")', collapse = ", ")`.
#' @details The currently `r length(LANGUAGES_SUPPORTED)` supported languages are `r vector_and(sapply(LANGUAGES_SUPPORTED_NAMES, function(x) x[[1]]), quotes = FALSE, sort = FALSE)`. All these languages have translations available for all antimicrobial agents and colloquial microorganism names.
#'
#' Please read about adding or updating a language in [our Wiki](https://github.com/msberends/AMR/wiki/).
#'
#' ## Changing the Default Language
#' The system language will be used by default (as returned by `Sys.getenv("LANG")` or, if `LANG` is not set, [`Sys.getlocale("LC_COLLATE")`][Sys.getlocale()]), if that language is supported. But the language to be used can be overwritten in two ways and will be checked in this order:
#'
#' 1. Setting the R option `AMR_locale`, either by using `set_AMR_locale()` or by running e.g. `options(AMR_locale = "de")`.
#'
#'    Note that setting an \R option only works in the same session. Save the command `options(AMR_locale = "(your language)")` to your `.Rprofile` file to apply it for every session.
#' 2. Setting the system variable `LANGUAGE` or `LANG`, e.g. by adding `LANGUAGE="de_DE.utf8"` to your `.Renviron` file in your home directory.
#'
#' Thus, if the R option `AMR_locale` is set, the system variables `LANGUAGE` and `LANG` will be ignored.
#' @rdname translate
#' @name translate
#' @export
#' @examples
#' # Current settings (based on system language)
#' ab_name("Ciprofloxacin")
#' mo_name("Coagulase-negative Staphylococcus")
#'
#' # setting another language
#' set_AMR_locale("Greek")
#' ab_name("Ciprofloxacin")
#' mo_name("Coagulase-negative Staphylococcus")
#'
#' set_AMR_locale("Spanish")
#' ab_name("Ciprofloxacin")
#' mo_name("Coagulase-negative Staphylococcus")
#'
#' # set_AMR_locale() understands endonyms, English exonyms, and ISO-639-1:
#' set_AMR_locale("Deutsch")
#' set_AMR_locale("German")
#' set_AMR_locale("de")
#'
#' # reset to system default
#' reset_AMR_locale()
get_AMR_locale <- function() {
  # an explicitly set R option always wins over any system setting
  locale_option <- getOption("AMR_locale", default = NULL)
  if (!is.null(locale_option)) {
    return(validate_language(locale_option, extra_txt = "set with `options(AMR_locale = ...)`"))
  }

  # read the system variables once; LANGUAGE is only used when LANG is empty,
  # because a non-empty LANG overwrites it below
  env_language <- Sys.getenv("LANGUAGE")
  env_lang <- Sys.getenv("LANG")
  lang <- ""
  if (!identical("", env_language)) {
    lang <- env_language
  }
  if (!identical("", env_lang)) {
    lang <- env_lang
  }
  # neither variable is set: fall back to the collation locale
  if (identical(lang, "")) {
    lang <- Sys.getlocale("LC_COLLATE")
  }

  # map the raw locale string to a supported language (English if nothing matches)
  lang <- find_language(lang)
  if (lang != "en" && interactive() && message_not_thrown_before("get_AMR_locale", entire_session = TRUE)) {
    message_("Assuming the ", LANGUAGES_SUPPORTED_NAMES[[lang]]$exonym, " language (",
             LANGUAGES_SUPPORTED_NAMES[[lang]]$endonym, ") for the AMR package. Change this with `set_AMR_locale()`. ",
             "This note will be shown once per session.")
  }
  lang
}
|
|
|
|
#' @rdname translate
#' @export
set_AMR_locale <- function(lang) {
  # turn the user input into a validated language code (errors when unsupported)
  lang <- validate_language(lang)
  options(AMR_locale = lang)

  # look up the display names once for the confirmation message
  language_names <- LANGUAGES_SUPPORTED_NAMES[[lang]]
  message_(
    "Using the ", language_names$exonym, " language (", language_names$endonym,
    ") for the AMR package for this session."
  )
}
|
|
|
|
#' @rdname translate
#' @export
reset_AMR_locale <- function() {
  # a NULL value removes the option, so get_AMR_locale() no longer finds an override
  cleared <- list(AMR_locale = NULL)
  options(cleared)
}
|
|
|
|
#' @rdname translate
#' @export
translate_AMR <- function(x, language = get_AMR_locale()) {
  # exported entry point; the actual work is done by the internal translator
  translated <- translate_into_language(from = x, language = language)
  translated
}
|
|
|
|
# Validate a user-supplied language and return the corresponding language code.
#
# @param language language name or code; only the first element is used
# @param extra_txt optional text inserted into the error message directly after
#   "unsupported language for AMR package"
# @return "en" for missing, empty, FALSE or English input; otherwise the result
#   of find_language(), which must be one of LANGUAGES_SUPPORTED or an error is
#   raised through stop_ifnot()
validate_language <- function(language, extra_txt = character(0)) {
  # NULL / zero-length input would give a zero-length `if` condition (an error);
  # treat it like the other "no language given" values
  if (length(language) == 0) {
    return("en")
  }
  # `if` needs a scalar condition, so only the first element is considered
  language <- language[1]
  if (trimws(tolower(language)) %in% c("en", "english", "", "false", NA)) {
    return("en")
  }

  # keep the optional extra text from being glued to the word "package";
  # assumes stop_ifnot() concatenates its message parts without a separator,
  # as the surrounding literals suggest
  extra_txt <- trimws(extra_txt)
  extra_txt <- extra_txt[nzchar(extra_txt)]
  if (length(extra_txt) > 0) {
    extra_txt <- paste0(" ", extra_txt)
  }

  lang <- find_language(language, fallback = FALSE)
  stop_ifnot(length(lang) > 0 && lang %in% LANGUAGES_SUPPORTED,
             "unsupported language for AMR package", extra_txt, ": \"", language, "\". Use one of these language names or ISO-639-1 codes: ",
             paste0('"', vapply(FUN.VALUE = character(1), LANGUAGES_SUPPORTED_NAMES, function(x) x[[1]]),
                    '" ("', LANGUAGES_SUPPORTED, '")', collapse = ", "),
             call = FALSE)
  lang
}
|
|
|
|
# Find the supported language that matches a language name, ISO code or locale string.
#
# @param lang text to match, e.g. a language name, a two-letter code or "de_DE.utf8"
# @param fallback if TRUE, "en" is returned when no supported language matches
# @return the names of the matching entries of LANGUAGES_SUPPORTED_NAMES
find_language <- function(lang, fallback = TRUE) {
  # TRUE when the input starts with one of the two stored language names, or with
  # the lower/upper case code followed by an underscore or the end of the string
  matches_input <- function(language_names, iso_code) {
    pattern <- paste0("^(", language_names[1], "|", language_names[2], "|",
                      iso_code, "(_|$)|", toupper(iso_code), "(_|$))")
    grepl(pattern, lang, ignore.case = FALSE, perl = TRUE, useBytes = FALSE)
  }

  hits <- mapply(matches_input,
                 LANGUAGES_SUPPORTED_NAMES,
                 LANGUAGES_SUPPORTED,
                 SIMPLIFY = FALSE,
                 USE.NAMES = TRUE)
  found <- names(hits)[vapply(hits, isTRUE, logical(1))]

  if (length(found) == 0 && isTRUE(fallback)) {
    # other language -> set to English
    return("en")
  }
  found
}
|
|
|
|
# Translate strings based on inst/translations.tsv (used here as the internal
# TRANSLATIONS data).
#
# @param from vector with the text to translate
# @param language target language; NULL, "en", "" and NA return `from` unchanged
# @param only_unknown if TRUE, only apply translations whose pattern is like "unknown"
# @param only_affect_ab_names if TRUE, only apply translations flagged `affect_ab_name`
# @param only_affect_mo_names if TRUE, only apply translations flagged `affect_mo_name`
# @return `from` with all applicable translations applied, in the original order
translate_into_language <- function(from,
                                    language = get_AMR_locale(),
                                    only_unknown = FALSE,
                                    only_affect_ab_names = FALSE,
                                    only_affect_mo_names = FALSE) {

  if (is.null(language)) {
    return(from)
  }
  if (language %in% c("en", "", NA)) {
    return(from)
  }

  # get ISO-639-1 of language
  lang <- validate_language(language)
  # input such as "English" only becomes "en" after validation; there is nothing
  # to translate then, and "en" must not be used as a translation column
  if (identical(lang, "en")) {
    return(from)
  }

  df_trans <- TRANSLATIONS # internal data file
  # translate every distinct value once; the result is expanded again at the end
  from_unique <- unique(from)
  from_unique_translated <- from_unique

  # only keep lines where translation is available for this language
  df_trans <- df_trans[which(!is.na(df_trans[, lang, drop = TRUE])), , drop = FALSE]
  # and where the original string is not equal to the string in the target language
  df_trans <- df_trans[which(df_trans[, "pattern", drop = TRUE] != df_trans[, lang, drop = TRUE]), , drop = FALSE]
  if (only_unknown == TRUE) {
    df_trans <- subset(df_trans, pattern %like% "unknown")
  }
  if (only_affect_ab_names == TRUE) {
    df_trans <- subset(df_trans, affect_ab_name == TRUE)
  }
  if (only_affect_mo_names == TRUE) {
    df_trans <- subset(df_trans, affect_mo_name == TRUE)
  }
  if (NROW(df_trans) == 0) {
    return(from)
  }

  # default: case sensitive if value of 'case_sensitive' is missing:
  df_trans$case_sensitive[is.na(df_trans$case_sensitive)] <- TRUE
  # default: not using regular expressions if 'regular_expr' is missing:
  df_trans$regular_expr[is.na(df_trans$regular_expr)] <- FALSE

  # check if text to look for is in one of the patterns; a failure here (e.g. an
  # invalid combined pattern) is reported as a warning and skips the translation
  any_form_in_patterns <- tryCatch(
    any(from_unique %like% paste0("(", paste(gsub(" +\\(.*", "", df_trans$pattern), collapse = "|"), ")")),
    error = function(e) {
      warning_("Translation not possible. Please open an issue on GitHub (https://github.com/msberends/AMR/issues).")
      FALSE
    })

  if (!any_form_in_patterns) {
    return(from)
  }

  # apply the translations one after another, each on the result of the previous
  for (i in seq_len(nrow(df_trans))) {
    use_regex <- df_trans$regular_expr[i]
    from_unique_translated <- gsub(pattern = df_trans$pattern[i],
                                   replacement = df_trans[i, lang, drop = TRUE],
                                   x = from_unique_translated,
                                   # ignore.case is only requested for regular expressions
                                   ignore.case = !df_trans$case_sensitive[i] & use_regex,
                                   fixed = !use_regex,
                                   perl = use_regex)
  }

  # force UTF-8 for diacritics
  from_unique_translated <- enc2utf8(from_unique_translated)

  # a kind of left join to get all results back
  from_unique_translated[match(from, from_unique)]
}
|