2018-02-21 11:52:31 +01:00
# ==================================================================== #
2023-07-08 17:30:05 +02:00
# TITLE: #
2022-10-05 09:12:22 +02:00
# AMR: An R Package for Working with Antimicrobial Resistance Data #
2018-02-21 11:52:31 +01:00
# #
2023-07-08 17:30:05 +02:00
# SOURCE CODE: #
2020-07-08 14:48:06 +02:00
# https://github.com/msberends/AMR #
2018-02-21 11:52:31 +01:00
# #
2023-07-08 17:30:05 +02:00
# PLEASE CITE THIS SOFTWARE AS: #
2022-10-05 09:12:22 +02:00
# Berends MS, Luz CF, Friedrich AW, Sinha BNM, Albers CJ, Glasner C #
# (2022). AMR: An R Package for Working with Antimicrobial Resistance #
# Data. Journal of Statistical Software, 104(3), 1-31. #
2023-05-27 10:39:22 +02:00
# https://doi.org/10.18637/jss.v104.i03 #
2022-10-05 09:12:22 +02:00
# #
2022-12-27 15:16:15 +01:00
# Developed at the University of Groningen and the University Medical #
# Center Groningen in The Netherlands, in collaboration with many #
# colleagues from around the world, see our website. #
2018-02-21 11:52:31 +01:00
# #
2019-01-02 23:24:07 +01:00
# This R package is free software; you can freely use and distribute #
# it for both personal and commercial purposes under the terms of the #
# GNU General Public License version 2.0 (GNU GPL-2), as published by #
# the Free Software Foundation. #
2020-01-05 17:22:09 +01:00
# We created this package for both routine data analysis and academic #
# research and it was publicly released in the hope that it will be #
# useful, but it comes WITHOUT ANY WARRANTY OR LIABILITY. #
2020-10-08 11:16:03 +02:00
# #
# Visit our website for the full manual and a complete tutorial about #
2021-02-02 23:57:35 +01:00
# how to conduct AMR data analysis: https://msberends.github.io/AMR/ #
2018-02-21 11:52:31 +01:00
# ==================================================================== #
2021-11-28 23:01:26 +01:00
# these are allowed MIC values and will become [factor] levels
2022-10-05 09:12:22 +02:00
operators <- c ( " <" , " <=" , " " , " >=" , " >" )
2022-08-28 10:31:50 +02:00
valid_mic_levels <- c (
c ( t ( vapply (
2022-10-05 09:12:22 +02:00
FUN.VALUE = character ( 6 ) , operators ,
function ( x ) paste0 ( x , " 0.000" , c ( 1 : 4 , 6 , 8 ) )
) ) ) ,
c ( t ( vapply (
FUN.VALUE = character ( 90 ) , operators ,
function ( x ) paste0 ( x , " 0.00" , c ( 1 : 9 , 11 : 19 , 21 : 29 , 31 : 39 , 41 : 49 , 51 : 59 , 61 : 69 , 71 : 79 , 81 : 89 , 91 : 99 ) )
2022-08-28 10:31:50 +02:00
) ) ) ,
unique ( c ( t ( vapply (
2022-10-05 09:12:22 +02:00
FUN.VALUE = character ( 106 ) , operators ,
2022-08-28 10:31:50 +02:00
function ( x ) {
paste0 ( x , sort ( as.double ( paste0 (
" 0.0" ,
2022-10-05 09:12:22 +02:00
sort ( c ( 1 : 99 , 125 , 128 , 156 , 165 , 256 , 512 , 625 ) )
2022-08-28 10:31:50 +02:00
) ) ) )
}
) ) ) ) ,
unique ( c ( t ( vapply (
2022-10-05 09:12:22 +02:00
FUN.VALUE = character ( 103 ) , operators ,
2022-08-28 10:31:50 +02:00
function ( x ) {
paste0 ( x , sort ( as.double ( paste0 (
" 0." ,
c ( 1 : 99 , 125 , 128 , 256 , 512 )
) ) ) )
}
) ) ) ) ,
c ( t ( vapply (
2022-10-05 09:12:22 +02:00
FUN.VALUE = character ( 10 ) , operators ,
2022-08-28 10:31:50 +02:00
function ( x ) paste0 ( x , sort ( c ( 1 : 9 , 1.5 ) ) )
) ) ) ,
c ( t ( vapply (
2022-10-05 09:12:22 +02:00
FUN.VALUE = character ( 45 ) , operators ,
2022-08-28 10:31:50 +02:00
function ( x ) paste0 ( x , c ( 10 : 98 ) [9 : 98 %% 2 == TRUE ] )
) ) ) ,
c ( t ( vapply (
2022-10-05 09:12:22 +02:00
FUN.VALUE = character ( 17 ) , operators ,
2022-08-28 10:31:50 +02:00
function ( x ) paste0 ( x , sort ( c ( 2 ^c ( 7 : 11 ) , 192 , 80 * c ( 2 : 12 ) ) ) )
) ) )
)
2021-11-28 23:01:26 +01:00
2021-01-18 16:57:56 +01:00
#' Transform Input to Minimum Inhibitory Concentrations (MIC)
2018-02-21 11:52:31 +01:00
#'
2021-11-28 23:01:26 +01:00
#' This transforms vectors to a new class [`mic`], which treats the input as decimal numbers, while maintaining operators (such as ">=") and only allowing valid MIC values known to the field of (medical) microbiology.
2018-02-21 11:52:31 +01:00
#' @rdname as.mic
2021-05-12 18:15:03 +02:00
#' @param x a [character] or [numeric] vector
#' @param na.rm a [logical] indicating whether missing values should be removed
2022-05-16 12:52:50 +02:00
#' @param ... arguments passed on to methods
2023-01-21 23:47:20 +01:00
#' @details To interpret MIC values as SIR values, use [as.sir()] on MIC values. It supports guidelines from EUCAST (`r min(as.integer(gsub("[^0-9]", "", subset(clinical_breakpoints, guideline %like% "EUCAST")$guideline)))`-`r max(as.integer(gsub("[^0-9]", "", subset(clinical_breakpoints, guideline %like% "EUCAST")$guideline)))`) and CLSI (`r min(as.integer(gsub("[^0-9]", "", subset(clinical_breakpoints, guideline %like% "CLSI")$guideline)))`-`r max(as.integer(gsub("[^0-9]", "", subset(clinical_breakpoints, guideline %like% "CLSI")$guideline)))`).
2022-08-28 10:31:50 +02:00
#'
2021-05-12 18:15:03 +02:00
#' This class for MIC values is a quite a special data type: formally it is an ordered [factor] with valid MIC values as [factor] levels (to make sure only valid MIC values are retained), but for any mathematical operation it acts as decimal numbers:
2022-08-28 10:31:50 +02:00
#'
2021-03-07 13:52:39 +01:00
#' ```
#' x <- random_mic(10)
#' x
2022-10-19 11:47:57 +02:00
#' #> Class 'mic'
2021-03-07 13:52:39 +01:00
#' #> [1] 16 1 8 8 64 >=128 0.0625 32 32 16
2022-08-28 10:31:50 +02:00
#'
2021-03-07 13:52:39 +01:00
#' is.factor(x)
#' #> [1] TRUE
2022-08-28 10:31:50 +02:00
#'
2021-03-07 13:52:39 +01:00
#' x[1] * 2
#' #> [1] 32
2022-08-28 10:31:50 +02:00
#'
2021-03-07 13:52:39 +01:00
#' median(x)
#' #> [1] 26
#' ```
2022-08-28 10:31:50 +02:00
#'
2021-05-12 18:15:03 +02:00
#' This makes it possible to maintain operators that often come with MIC values, such ">=" and "<=", even when filtering using [numeric] values in data analysis, e.g.:
2022-08-28 10:31:50 +02:00
#'
2021-03-07 13:52:39 +01:00
#' ```
#' x[x > 4]
2022-10-19 11:47:57 +02:00
#' #> Class 'mic'
2021-03-07 13:52:39 +01:00
#' #> [1] 16 8 8 64 >=128 32 32 16
2022-08-28 10:31:50 +02:00
#'
2021-03-07 13:52:39 +01:00
#' df <- data.frame(x, hospital = "A")
#' subset(df, x > 4) # or with dplyr: df %>% filter(x > 4)
#' #> x hospital
#' #> 1 16 A
#' #> 5 64 A
#' #> 6 >=128 A
#' #> 8 32 A
#' #> 9 32 A
#' #> 10 16 A
#' ```
2022-08-28 10:31:50 +02:00
#'
2021-03-07 21:16:45 +01:00
#' The following [generic functions][groupGeneric()] are implemented for the MIC class: `!`, `!=`, `%%`, `%/%`, `&`, `*`, `+`, `-`, `/`, `<`, `<=`, `==`, `>`, `>=`, `^`, `|`, [abs()], [acos()], [acosh()], [all()], [any()], [asin()], [asinh()], [atan()], [atanh()], [ceiling()], [cos()], [cosh()], [cospi()], [cummax()], [cummin()], [cumprod()], [cumsum()], [digamma()], [exp()], [expm1()], [floor()], [gamma()], [lgamma()], [log()], [log1p()], [log2()], [log10()], [max()], [mean()], [min()], [prod()], [range()], [round()], [sign()], [signif()], [sin()], [sinh()], [sinpi()], [sqrt()], [sum()], [tan()], [tanh()], [tanpi()], [trigamma()] and [trunc()]. Some functions of the `stats` package are also implemented: [median()], [quantile()], [mad()], [IQR()], [fivenum()]. Also, [boxplot.stats()] is supported. Since [sd()] and [var()] are non-generic functions, these could not be extended. Use [mad()] as an alternative, or use e.g. `sd(as.numeric(x))` where `x` is your vector of MIC values.
2022-08-28 10:31:50 +02:00
#'
2022-05-09 21:33:27 +02:00
#' Using [as.double()] or [as.numeric()] on MIC values will remove the operators and return a numeric vector. Do **not** use [as.integer()] on MIC values as by the \R convention on [factor]s, it will return the index of the factor levels (which is often useless for regular users).
2022-08-28 10:31:50 +02:00
#'
2022-10-19 11:47:57 +02:00
#' Use [droplevels()] to drop unused levels. At default, it will return a plain factor. Use `droplevels(..., as.mic = TRUE)` to maintain the `mic` class.
2021-05-12 18:15:03 +02:00
#' @return Ordered [factor] with additional class [`mic`], that in mathematical operations acts as decimal numbers. Bare in mind that the outcome of any mathematical operation on MICs will return a [numeric] value.
2019-11-28 23:00:37 +01:00
#' @aliases mic
2018-02-21 11:52:31 +01:00
#' @export
2023-01-21 23:47:20 +01:00
#' @seealso [as.sir()]
2018-02-22 20:48:48 +01:00
#' @examples
#' mic_data <- as.mic(c(">=32", "1.0", "1", "1.00", 8, "<=0.128", "8", "16", "16"))
2022-08-21 16:37:20 +02:00
#' mic_data
2018-02-22 20:48:48 +01:00
#' is.mic(mic_data)
2018-04-02 16:05:09 +02:00
#'
2023-01-21 23:47:20 +01:00
#' # this can also coerce combined MIC/SIR values:
2022-08-21 16:37:20 +02:00
#' as.mic("<=0.002; S")
2022-08-28 10:31:50 +02:00
#'
2022-08-21 16:37:20 +02:00
#' # mathematical processing treats MICs as numeric values
2021-03-05 15:36:39 +01:00
#' fivenum(mic_data)
#' quantile(mic_data)
#' all(mic_data < 512)
2018-06-19 10:05:38 +02:00
#'
2019-05-10 16:44:59 +02:00
#' # interpret MIC values
2023-01-21 23:47:20 +01:00
#' as.sir(
2022-08-28 10:31:50 +02:00
#' x = as.mic(2),
#' mo = as.mo("Streptococcus pneumoniae"),
#' ab = "AMX",
#' guideline = "EUCAST"
#' )
2023-01-21 23:47:20 +01:00
#' as.sir(
2022-08-28 10:31:50 +02:00
#' x = as.mic(c(0.01, 2, 4, 8)),
#' mo = as.mo("Streptococcus pneumoniae"),
#' ab = "AMX",
#' guideline = "EUCAST"
#' )
2019-05-10 16:44:59 +02:00
#'
2021-02-25 10:33:08 +01:00
#' # plot MIC values, see ?plot
2018-02-22 20:48:48 +01:00
#' plot(mic_data)
2021-02-25 10:33:08 +01:00
#' plot(mic_data, mo = "E. coli", ab = "cipro")
2022-08-28 10:31:50 +02:00
#'
2022-08-27 20:49:37 +02:00
#' if (require("ggplot2")) {
#' autoplot(mic_data, mo = "E. coli", ab = "cipro")
#' }
#' if (require("ggplot2")) {
#' autoplot(mic_data, mo = "E. coli", ab = "cipro", language = "nl") # Dutch
#' }
#' if (require("ggplot2")) {
#' autoplot(mic_data, mo = "E. coli", ab = "cipro", language = "uk") # Ukrainian
#' }
2018-02-21 11:52:31 +01:00
as.mic <- function ( x , na.rm = FALSE ) {
2023-07-08 17:30:05 +02:00
meet_criteria ( x , allow_NA = TRUE )
2020-10-19 17:09:19 +02:00
meet_criteria ( na.rm , allow_class = " logical" , has_length = 1 )
2022-08-28 10:31:50 +02:00
2018-02-21 11:52:31 +01:00
if ( is.mic ( x ) ) {
x
} else {
2022-10-05 09:12:22 +02:00
if ( is.numeric ( x ) ) {
x <- format ( x , scientific = FALSE )
} else {
x <- as.character ( unlist ( x ) )
}
2022-11-14 15:20:39 +01:00
if ( isTRUE ( na.rm ) ) {
2018-02-21 11:52:31 +01:00
x <- x [ ! is.na ( x ) ]
}
2022-10-05 09:12:22 +02:00
x [trimws2 ( x ) == " " ] <- NA
2018-02-21 11:52:31 +01:00
x.bak <- x
2022-08-28 10:31:50 +02:00
2018-06-19 10:05:38 +02:00
# comma to period
2019-10-11 17:21:02 +02:00
x <- gsub ( " ," , " ." , x , fixed = TRUE )
2020-02-20 13:19:23 +01:00
# transform Unicode for >= and <=
x <- gsub ( " \u2264" , " <=" , x , fixed = TRUE )
x <- gsub ( " \u2265" , " >=" , x , fixed = TRUE )
2021-11-28 23:01:26 +01:00
# remove other invalid characters
x <- gsub ( " [^a-zA-Z0-9.><= ]+" , " " , x , perl = TRUE )
2018-06-19 10:05:38 +02:00
# remove space between operator and number ("<= 0.002" -> "<=0.002")
2021-03-07 21:16:45 +01:00
x <- gsub ( " (<|=|>) +" , " \\1" , x , perl = TRUE )
2019-10-08 22:21:33 +02:00
# transform => to >= and =< to <=
2019-10-11 17:21:02 +02:00
x <- gsub ( " =<" , " <=" , x , fixed = TRUE )
2020-02-20 13:19:23 +01:00
x <- gsub ( " =>" , " >=" , x , fixed = TRUE )
2020-07-30 12:37:01 +02:00
# dots without a leading zero must start with 0
2021-03-07 21:16:45 +01:00
x <- gsub ( " ([^0-9]|^)[.]" , " \\10." , x , perl = TRUE )
2020-04-29 14:33:44 +02:00
# values like "<=0.2560.512" should be 0.512
2021-03-07 21:16:45 +01:00
x <- gsub ( " .*[.].*[.]" , " 0." , x , perl = TRUE )
2018-02-21 11:52:31 +01:00
# remove ending .0
2021-03-07 21:16:45 +01:00
x <- gsub ( " [.]+0$" , " " , x , perl = TRUE )
2018-02-21 11:52:31 +01:00
# remove all after last digit
2021-03-07 21:16:45 +01:00
x <- gsub ( " [^0-9]+$" , " " , x , perl = TRUE )
2019-10-08 22:21:33 +02:00
# keep only one zero before dot
2021-03-07 21:16:45 +01:00
x <- gsub ( " 0+[.]" , " 0." , x , perl = TRUE )
2019-10-08 22:21:33 +02:00
# starting 00 is probably 0.0 if there's no dot yet
2021-04-23 09:59:36 +02:00
x [x %unlike% " [.]" ] <- gsub ( " ^00" , " 0.0" , x [ ! x %like% " [.]" ] )
2018-02-21 11:52:31 +01:00
# remove last zeroes
2021-03-07 21:16:45 +01:00
x <- gsub ( " ([.].?)0+$" , " \\1" , x , perl = TRUE )
x <- gsub ( " (.*[.])0+$" , " \\10" , x , perl = TRUE )
2018-12-29 22:24:19 +01:00
# remove ending .0 again
2019-10-11 17:21:02 +02:00
x [x %like% " [.]" ] <- gsub ( " 0+$" , " " , x [x %like% " [.]" ] )
2020-04-29 14:33:44 +02:00
# never end with dot
2021-03-07 21:16:45 +01:00
x <- gsub ( " [.]$" , " " , x , perl = TRUE )
2019-10-08 22:21:33 +02:00
# trim it
2022-10-05 09:12:22 +02:00
x <- trimws2 ( x )
2022-08-28 10:31:50 +02:00
2019-05-10 16:44:59 +02:00
## previously unempty values now empty - should return a warning later on
2018-08-24 11:08:20 +02:00
x [x.bak != " " & x == " " ] <- " invalid"
2022-08-28 10:31:50 +02:00
2023-02-09 13:07:39 +01:00
na_before <- x [is.na ( x ) | x == " " ] %pm>% length ( )
2021-11-28 23:01:26 +01:00
x [ ! x %in% valid_mic_levels ] <- NA
2023-02-09 13:07:39 +01:00
na_after <- x [is.na ( x ) | x == " " ] %pm>% length ( )
2022-08-28 10:31:50 +02:00
2018-02-21 11:52:31 +01:00
if ( na_before != na_after ) {
2023-02-09 13:07:39 +01:00
list_missing <- x.bak [is.na ( x ) & ! is.na ( x.bak ) & x.bak != " " ] %pm>%
unique ( ) %pm>%
sort ( ) %pm>%
2021-02-04 16:48:16 +01:00
vector_and ( quotes = TRUE )
2022-11-28 19:39:52 +01:00
cur_col <- get_current_column ( )
warning_ ( " in `as.mic()`: " , na_after - na_before , " result" ,
2023-01-23 15:01:21 +01:00
ifelse ( na_after - na_before > 1 , " s" , " " ) ,
ifelse ( is.null ( cur_col ) , " " , paste0 ( " in column '" , cur_col , " '" ) ) ,
" truncated (" ,
round ( ( ( na_after - na_before ) / length ( x ) ) * 100 ) ,
" %) that were invalid MICs: " ,
list_missing ,
call = FALSE
2022-08-28 10:31:50 +02:00
)
2018-02-21 11:52:31 +01:00
}
2022-08-28 10:31:50 +02:00
2021-11-28 23:01:26 +01:00
set_clean_class ( factor ( x , levels = valid_mic_levels , ordered = TRUE ) ,
2022-08-28 10:31:50 +02:00
new_class = c ( " mic" , " ordered" , " factor" )
)
2018-02-21 11:52:31 +01:00
}
}
2020-02-20 13:19:23 +01:00
all_valid_mics <- function ( x ) {
2020-10-19 17:09:19 +02:00
if ( ! inherits ( x , c ( " mic" , " character" , " factor" , " numeric" , " integer" ) ) ) {
return ( FALSE )
}
2020-06-26 10:21:22 +02:00
x_mic <- tryCatch ( suppressWarnings ( as.mic ( x [ ! is.na ( x ) ] ) ) ,
2022-08-28 10:31:50 +02:00
error = function ( e ) NA
)
2020-12-17 16:22:25 +01:00
! any ( is.na ( x_mic ) ) && ! all ( is.na ( x ) )
2020-02-20 13:19:23 +01:00
}
2021-11-28 23:01:26 +01:00
#' @rdname as.mic
2022-10-19 11:47:57 +02:00
#' @details `NA_mic_` is a missing value of the new `mic` class, analogous to e.g. base \R's [`NA_character_`][base::NA].
2022-05-09 21:33:27 +02:00
#' @format NULL
2021-11-28 23:01:26 +01:00
#' @export
NA_mic_ <- set_clean_class ( factor ( NA , levels = valid_mic_levels , ordered = TRUE ) ,
2022-08-28 10:31:50 +02:00
new_class = c ( " mic" , " ordered" , " factor" )
)
2021-11-28 23:01:26 +01:00
2018-02-21 11:52:31 +01:00
#' @rdname as.mic
#' @export
is.mic <- function ( x ) {
2020-02-10 14:18:15 +01:00
inherits ( x , " mic" )
2018-02-21 11:52:31 +01:00
}
2020-05-28 16:48:55 +02:00
#' @method as.double mic
2018-02-21 11:52:31 +01:00
#' @export
#' @noRd
as.double.mic <- function ( x , ... ) {
2021-03-07 21:16:45 +01:00
as.double ( gsub ( " [<=>]+" , " " , as.character ( x ) , perl = TRUE ) )
2018-02-21 11:52:31 +01:00
}
2020-05-28 16:48:55 +02:00
#' @method as.numeric mic
2018-02-21 11:52:31 +01:00
#' @export
#' @noRd
as.numeric.mic <- function ( x , ... ) {
2021-03-07 21:16:45 +01:00
as.numeric ( gsub ( " [<=>]+" , " " , as.character ( x ) , perl = TRUE ) )
2018-02-21 11:52:31 +01:00
}
2022-05-09 21:33:27 +02:00
#' @rdname as.mic
2020-05-28 16:48:55 +02:00
#' @method droplevels mic
2023-02-22 14:38:57 +01:00
#' @param as.mic a [logical] to indicate whether the `mic` class should be kept - the default is `FALSE`
2018-12-29 22:24:19 +01:00
#' @export
2022-05-16 12:52:50 +02:00
droplevels.mic <- function ( x , as.mic = FALSE , ... ) {
x <- droplevels.factor ( x , ... )
2021-02-25 10:33:08 +01:00
if ( as.mic == TRUE ) {
class ( x ) <- c ( " mic" , " ordered" , " factor" )
}
2018-12-29 22:24:19 +01:00
x
}
2020-08-28 21:55:47 +02:00
# will be exported using s3_register() in R/zzz.R
2020-08-26 11:33:54 +02:00
pillar_shaft.mic <- function ( x , ... ) {
2020-12-09 09:40:50 +01:00
crude_numbers <- as.double ( x )
operators <- gsub ( " [^<=>]+" , " " , as.character ( x ) )
2022-03-15 17:35:02 +01:00
operators [ ! is.na ( operators ) & operators != " " ] <- font_silver ( operators [ ! is.na ( operators ) & operators != " " ] , collapse = NULL )
2022-03-10 19:33:25 +01:00
out <- trimws ( paste0 ( operators , trimws ( format ( crude_numbers ) ) ) )
2020-08-28 21:55:47 +02:00
out [is.na ( x ) ] <- font_na ( NA )
2022-03-10 19:33:25 +01:00
# maketrailing zeroes almost invisible
out [out %like% " [.]" ] <- gsub ( " ([.]?0+)$" , font_white ( " \\1" ) , out [out %like% " [.]" ] , perl = TRUE )
create_pillar_column ( out , align = " right" , width = max ( nchar ( font_stripstyle ( out ) ) ) )
2020-08-26 11:33:54 +02:00
}
2020-08-28 21:55:47 +02:00
# will be exported using s3_register() in R/zzz.R
2020-08-26 11:33:54 +02:00
type_sum.mic <- function ( x , ... ) {
" mic"
}
2020-05-28 16:48:55 +02:00
#' @method print mic
2018-02-21 11:52:31 +01:00
#' @export
#' @noRd
print.mic <- function ( x , ... ) {
2022-10-19 11:47:57 +02:00
cat ( " Class 'mic'" ,
2022-08-28 10:31:50 +02:00
ifelse ( length ( levels ( x ) ) < length ( valid_mic_levels ) , font_red ( " with dropped levels" ) , " " ) ,
" \n" ,
sep = " "
)
2018-08-01 22:37:28 +02:00
print ( as.character ( x ) , quote = FALSE )
2021-03-07 13:52:39 +01:00
att <- attributes ( x )
if ( " na.action" %in% names ( att ) ) {
cat ( font_silver ( paste0 ( " (NA " , class ( att $ na.action ) , " : " , paste0 ( att $ na.action , collapse = " , " ) , " )\n" ) ) )
}
2018-02-21 11:52:31 +01:00
}
2020-05-28 16:48:55 +02:00
#' @method summary mic
2018-02-21 11:52:31 +01:00
#' @export
#' @noRd
summary.mic <- function ( object , ... ) {
2021-03-07 13:52:39 +01:00
summary ( as.double ( object ) , ... )
2018-02-21 11:52:31 +01:00
}
2021-03-07 21:16:45 +01:00
#' @method as.matrix mic
#' @export
#' @noRd
as.matrix.mic <- function ( x , ... ) {
as.matrix ( as.double ( x ) , ... )
}
2020-05-28 16:48:55 +02:00
#' @method [ mic
2020-04-13 21:09:56 +02:00
#' @export
#' @noRd
" [.mic" <- function ( x , ... ) {
y <- NextMethod ( )
attributes ( y ) <- attributes ( x )
y
}
2020-05-28 16:48:55 +02:00
#' @method [[ mic
2020-04-13 21:09:56 +02:00
#' @export
#' @noRd
" [[.mic" <- function ( x , ... ) {
y <- NextMethod ( )
attributes ( y ) <- attributes ( x )
y
}
2020-05-28 16:48:55 +02:00
#' @method [<- mic
2020-04-13 21:09:56 +02:00
#' @export
#' @noRd
" [<-.mic" <- function ( i , j , ... , value ) {
value <- as.mic ( value )
y <- NextMethod ( )
attributes ( y ) <- attributes ( i )
y
}
2020-05-28 16:48:55 +02:00
#' @method [[<- mic
2020-04-13 21:09:56 +02:00
#' @export
#' @noRd
" [[<-.mic" <- function ( i , j , ... , value ) {
value <- as.mic ( value )
y <- NextMethod ( )
attributes ( y ) <- attributes ( i )
y
}
2020-05-28 16:48:55 +02:00
#' @method c mic
2020-04-13 21:09:56 +02:00
#' @export
#' @noRd
2021-05-03 13:06:43 +02:00
c.mic <- function ( ... ) {
as.mic ( unlist ( lapply ( list ( ... ) , as.character ) ) )
2020-04-13 21:09:56 +02:00
}
2020-09-25 14:44:50 +02:00
#' @method unique mic
#' @export
#' @noRd
unique.mic <- function ( x , incomparables = FALSE , ... ) {
y <- NextMethod ( )
attributes ( y ) <- attributes ( x )
y
}
2020-09-28 01:08:55 +02:00
2021-07-06 16:35:14 +02:00
#' @method rep mic
#' @export
#' @noRd
rep.mic <- function ( x , ... ) {
y <- NextMethod ( )
attributes ( y ) <- attributes ( x )
y
}
2021-03-07 13:52:39 +01:00
#' @method sort mic
2021-03-05 15:36:39 +01:00
#' @export
#' @noRd
2021-03-07 13:52:39 +01:00
sort.mic <- function ( x , decreasing = FALSE , ... ) {
if ( decreasing == TRUE ) {
ord <- order ( - as.double ( x ) )
} else {
ord <- order ( as.double ( x ) )
2021-03-05 15:36:39 +01:00
}
2021-03-07 13:52:39 +01:00
x [ord ]
2021-03-05 15:36:39 +01:00
}
2021-03-07 13:52:39 +01:00
#' @method hist mic
2021-03-07 21:16:45 +01:00
#' @importFrom graphics hist
2021-03-05 15:36:39 +01:00
#' @export
#' @noRd
2021-03-07 13:52:39 +01:00
hist.mic <- function ( x , ... ) {
2022-03-02 15:38:55 +01:00
warning_ ( " in `hist()`: use `plot()` or ggplot2's `autoplot()` for optimal plotting of MIC values" )
2021-03-07 13:52:39 +01:00
hist ( log2 ( x ) )
2021-03-05 15:36:39 +01:00
}
2021-03-07 13:52:39 +01:00
# will be exported using s3_register() in R/zzz.R
get_skimmers.mic <- function ( column ) {
skimr :: sfl (
skim_type = " mic" ,
2022-08-28 10:31:50 +02:00
p0 = ~ stats :: quantile ( ., probs = 0 , na.rm = TRUE , names = FALSE ) ,
p25 = ~ stats :: quantile ( ., probs = 0.25 , na.rm = TRUE , names = FALSE ) ,
p50 = ~ stats :: quantile ( ., probs = 0.5 , na.rm = TRUE , names = FALSE ) ,
p75 = ~ stats :: quantile ( ., probs = 0.75 , na.rm = TRUE , names = FALSE ) ,
p100 = ~ stats :: quantile ( ., probs = 1 , na.rm = TRUE , names = FALSE ) ,
hist = ~ skimr :: inline_hist ( log2 ( stats :: na.omit ( .) ) , 5 )
2021-03-07 13:52:39 +01:00
)
2021-03-05 15:36:39 +01:00
}
2021-03-07 13:52:39 +01:00
# Miscellaneous mathematical functions ------------------------------------
#' @method mean mic
2021-03-05 15:36:39 +01:00
#' @export
#' @noRd
2021-03-07 13:52:39 +01:00
mean.mic <- function ( x , trim = 0 , na.rm = FALSE , ... ) {
mean ( as.double ( x ) , trim = trim , na.rm = na.rm , ... )
2021-03-05 15:36:39 +01:00
}
2021-03-07 13:52:39 +01:00
#' @method median mic
2021-03-07 21:16:45 +01:00
#' @importFrom stats median
2021-03-05 15:36:39 +01:00
#' @export
#' @noRd
2021-03-07 13:52:39 +01:00
median.mic <- function ( x , na.rm = FALSE , ... ) {
2021-03-07 21:16:45 +01:00
median ( as.double ( x ) , na.rm = na.rm , ... )
2021-03-05 15:36:39 +01:00
}
2021-03-07 13:52:39 +01:00
#' @method quantile mic
2021-03-07 21:16:45 +01:00
#' @importFrom stats quantile
2021-03-05 15:36:39 +01:00
#' @export
#' @noRd
2021-03-07 13:52:39 +01:00
quantile.mic <- function ( x , probs = seq ( 0 , 1 , 0.25 ) , na.rm = FALSE ,
names = TRUE , type = 7 , ... ) {
2021-03-07 21:16:45 +01:00
quantile ( as.double ( x ) , probs = probs , na.rm = na.rm , names = names , type = type , ... )
2021-03-05 15:36:39 +01:00
}
2021-03-07 13:52:39 +01:00
# Math (see ?groupGeneric) ----------------------------------------------
#' @method abs mic
2021-03-05 15:36:39 +01:00
#' @export
#' @noRd
2021-03-07 13:52:39 +01:00
abs.mic <- function ( x ) {
abs ( as.double ( x ) )
2021-03-05 15:36:39 +01:00
}
2021-03-07 13:52:39 +01:00
#' @method sign mic
2021-03-05 15:36:39 +01:00
#' @export
#' @noRd
2021-03-07 13:52:39 +01:00
sign.mic <- function ( x ) {
sign ( as.double ( x ) )
2021-03-05 15:36:39 +01:00
}
2021-03-07 13:52:39 +01:00
#' @method sqrt mic
2021-03-05 15:36:39 +01:00
#' @export
#' @noRd
2021-03-07 13:52:39 +01:00
sqrt.mic <- function ( x ) {
sqrt ( as.double ( x ) )
2021-03-05 15:36:39 +01:00
}
#' @method floor mic
#' @export
#' @noRd
floor.mic <- function ( x ) {
floor ( as.double ( x ) )
}
#' @method ceiling mic
#' @export
#' @noRd
ceiling.mic <- function ( x ) {
ceiling ( as.double ( x ) )
}
2021-03-07 13:52:39 +01:00
#' @method trunc mic
#' @export
#' @noRd
trunc.mic <- function ( x , ... ) {
trunc ( as.double ( x ) , ... )
}
#' @method round mic
#' @export
#' @noRd
round.mic <- function ( x , digits = 0 ) {
round ( as.double ( x ) , digits = digits )
}
#' @method signif mic
#' @export
#' @noRd
signif.mic <- function ( x , digits = 6 ) {
signif ( as.double ( x ) , digits = digits )
}
#' @method exp mic
#' @export
#' @noRd
exp.mic <- function ( x ) {
exp ( as.double ( x ) )
}
#' @method log mic
#' @export
#' @noRd
log.mic <- function ( x , base = exp ( 1 ) ) {
log ( as.double ( x ) , base = base )
}
#' @method log10 mic
#' @export
#' @noRd
log10.mic <- function ( x ) {
log10 ( as.double ( x ) )
}
#' @method log2 mic
#' @export
#' @noRd
log2.mic <- function ( x ) {
log2 ( as.double ( x ) )
}
#' @method expm1 mic
#' @export
#' @noRd
expm1.mic <- function ( x ) {
expm1 ( as.double ( x ) )
}
#' @method log1p mic
#' @export
#' @noRd
log1p.mic <- function ( x ) {
log1p ( as.double ( x ) )
}
#' @method cos mic
#' @export
#' @noRd
cos.mic <- function ( x ) {
cos ( as.double ( x ) )
}
#' @method sin mic
#' @export
#' @noRd
sin.mic <- function ( x ) {
sin ( as.double ( x ) )
}
#' @method tan mic
#' @export
#' @noRd
tan.mic <- function ( x ) {
tan ( as.double ( x ) )
}
#' @method cospi mic
#' @export
#' @noRd
cospi.mic <- function ( x ) {
cospi ( as.double ( x ) )
}
#' @method sinpi mic
#' @export
#' @noRd
sinpi.mic <- function ( x ) {
sinpi ( as.double ( x ) )
}
#' @method tanpi mic
#' @export
#' @noRd
tanpi.mic <- function ( x ) {
tanpi ( as.double ( x ) )
}
#' @method acos mic
#' @export
#' @noRd
acos.mic <- function ( x ) {
acos ( as.double ( x ) )
}
#' @method asin mic
#' @export
#' @noRd
asin.mic <- function ( x ) {
asin ( as.double ( x ) )
}
#' @method atan mic
#' @export
#' @noRd
atan.mic <- function ( x ) {
atan ( as.double ( x ) )
}
#' @method cosh mic
#' @export
#' @noRd
cosh.mic <- function ( x ) {
cosh ( as.double ( x ) )
}
#' @method sinh mic
#' @export
#' @noRd
sinh.mic <- function ( x ) {
sinh ( as.double ( x ) )
}
#' @method tanh mic
#' @export
#' @noRd
tanh.mic <- function ( x ) {
tanh ( as.double ( x ) )
}
#' @method acosh mic
#' @export
#' @noRd
acosh.mic <- function ( x ) {
acosh ( as.double ( x ) )
}
#' @method asinh mic
#' @export
#' @noRd
asinh.mic <- function ( x ) {
asinh ( as.double ( x ) )
}
#' @method atanh mic
#' @export
#' @noRd
atanh.mic <- function ( x ) {
atanh ( as.double ( x ) )
}
#' @method lgamma mic
#' @export
#' @noRd
lgamma.mic <- function ( x ) {
lgamma ( as.double ( x ) )
}
#' @method gamma mic
#' @export
#' @noRd
gamma.mic <- function ( x ) {
gamma ( as.double ( x ) )
}
#' @method digamma mic
#' @export
#' @noRd
digamma.mic <- function ( x ) {
digamma ( as.double ( x ) )
}
#' @method trigamma mic
#' @export
#' @noRd
trigamma.mic <- function ( x ) {
trigamma ( as.double ( x ) )
}
#' @method cumsum mic
#' @export
#' @noRd
cumsum.mic <- function ( x ) {
cumsum ( as.double ( x ) )
}
#' @method cumprod mic
#' @export
#' @noRd
cumprod.mic <- function ( x ) {
cumprod ( as.double ( x ) )
}
#' @method cummax mic
#' @export
#' @noRd
cummax.mic <- function ( x ) {
cummax ( as.double ( x ) )
}
#' @method cummin mic
#' @export
#' @noRd
cummin.mic <- function ( x ) {
cummin ( as.double ( x ) )
}
# Ops (see ?groupGeneric) -----------------------------------------------
2021-12-13 11:57:34 +01:00
is_greater <- function ( el ) {
el %like_case% " >[0-9]"
}
is_lower <- function ( el ) {
el %like_case% " <[0-9]"
}
2021-03-05 15:36:39 +01:00
#' @method + mic
#' @export
#' @noRd
`+.mic` <- function ( e1 , e2 ) {
as.double ( e1 ) + as.double ( e2 )
}
#' @method - mic
#' @export
#' @noRd
`-.mic` <- function ( e1 , e2 ) {
as.double ( e1 ) - as.double ( e2 )
}
#' @method * mic
#' @export
#' @noRd
`*.mic` <- function ( e1 , e2 ) {
as.double ( e1 ) * as.double ( e2 )
}
#' @method / mic
#' @export
#' @noRd
`/.mic` <- function ( e1 , e2 ) {
as.double ( e1 ) / as.double ( e2 )
}
#' @method ^ mic
#' @export
#' @noRd
`^.mic` <- function ( e1 , e2 ) {
2022-08-28 10:31:50 +02:00
as.double ( e1 ) ^as.double ( e2 )
2021-03-05 15:36:39 +01:00
}
#' @method %% mic
#' @export
#' @noRd
`%%.mic` <- function ( e1 , e2 ) {
as.double ( e1 ) %% as.double ( e2 )
}
#' @method %/% mic
#' @export
#' @noRd
`%/%.mic` <- function ( e1 , e2 ) {
as.double ( e1 ) %/% as.double ( e2 )
}
2021-03-07 13:52:39 +01:00
#' @method & mic
#' @export
#' @noRd
`&.mic` <- function ( e1 , e2 ) {
as.double ( e1 ) & as.double ( e2 )
}
#' @method | mic
#' @export
#' @noRd
`|.mic` <- function ( e1 , e2 ) {
as.double ( e1 ) | as.double ( e2 )
}
#' @method ! mic
#' @export
#' @noRd
`!.mic` <- function ( x ) {
! as.double ( x )
}
2021-03-05 15:36:39 +01:00
#' @method == mic
#' @export
#' @noRd
`==.mic` <- function ( e1 , e2 ) {
as.double ( e1 ) == as.double ( e2 )
}
#' @method != mic
#' @export
#' @noRd
`!=.mic` <- function ( e1 , e2 ) {
as.double ( e1 ) != as.double ( e2 )
}
#' @method < mic
#' @export
#' @noRd
`<.mic` <- function ( e1 , e2 ) {
as.double ( e1 ) < as.double ( e2 )
}
#' @method <= mic
#' @export
#' @noRd
`<=.mic` <- function ( e1 , e2 ) {
as.double ( e1 ) <= as.double ( e2 )
}
#' @method >= mic
#' @export
#' @noRd
`>=.mic` <- function ( e1 , e2 ) {
as.double ( e1 ) >= as.double ( e2 )
}
#' @method > mic
#' @export
#' @noRd
`>.mic` <- function ( e1 , e2 ) {
as.double ( e1 ) > as.double ( e2 )
2021-12-13 11:57:34 +01:00
# doesn't work...
# nolint start
# as.double(e1) > as.double(e2) |
# (as.double(e1) == as.double(e2) & is_lower(e2) & !is_lower(e1)) |
# (as.double(e1) == as.double(e2) & is_greater(e1) & !is_greater(e2))
# nolint end
2021-03-05 15:36:39 +01:00
}
2021-03-07 13:52:39 +01:00
# Summary (see ?groupGeneric) -------------------------------------------
#' @method all mic
2021-03-05 15:36:39 +01:00
#' @export
#' @noRd
2021-03-07 13:52:39 +01:00
all.mic <- function ( ... , na.rm = FALSE ) {
all ( as.double ( c ( ... ) ) , na.rm = na.rm )
2021-03-05 15:36:39 +01:00
}
2021-03-07 13:52:39 +01:00
#' @method any mic
2021-03-05 15:36:39 +01:00
#' @export
#' @noRd
2021-03-07 13:52:39 +01:00
any.mic <- function ( ... , na.rm = FALSE ) {
any ( as.double ( c ( ... ) ) , na.rm = na.rm )
2021-03-05 15:36:39 +01:00
}
2021-03-07 13:52:39 +01:00
#' @method sum mic
#' @export
#' @noRd
sum.mic <- function ( ... , na.rm = FALSE ) {
sum ( as.double ( c ( ... ) ) , na.rm = na.rm )
}
#' @method prod mic
#' @export
#' @noRd
prod.mic <- function ( ... , na.rm = FALSE ) {
prod ( as.double ( c ( ... ) ) , na.rm = na.rm )
}
#' @method min mic
#' @export
#' @noRd
min.mic <- function ( ... , na.rm = FALSE ) {
min ( as.double ( c ( ... ) ) , na.rm = na.rm )
}
#' @method max mic
#' @export
#' @noRd
max.mic <- function ( ... , na.rm = FALSE ) {
max ( as.double ( c ( ... ) ) , na.rm = na.rm )
}
#' @method range mic
#' @export
#' @noRd
range.mic <- function ( ... , na.rm = FALSE ) {
range ( as.double ( c ( ... ) ) , na.rm = na.rm )
2020-09-28 01:08:55 +02:00
}