2018-02-21 11:52:31 +01:00
# ==================================================================== #
# TITLE #
# Antimicrobial Resistance (AMR) Analysis #
# #
# AUTHORS #
# Berends MS (m.s.berends@umcg.nl), Luz CF (c.f.luz@umcg.nl) #
# #
# LICENCE #
# This program is free software; you can redistribute it and/or modify #
# it under the terms of the GNU General Public License version 2.0, #
# as published by the Free Software Foundation. #
# #
# This program is distributed in the hope that it will be useful, #
# but WITHOUT ANY WARRANTY; without even the implied warranty of #
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the #
# GNU General Public License for more details. #
# ==================================================================== #
#' Class 'mic'
#'
2018-07-25 14:17:04 +02:00
#' This transforms a vector to a new class \code{mic}, which is an ordered factor with valid MIC values as levels. Invalid MIC values will be translated as \code{NA} with a warning.
2018-02-21 11:52:31 +01:00
#' @rdname as.mic
#' @param x vector
#' @param na.rm a logical indicating whether missing values should be removed
2018-10-17 17:32:34 +02:00
#' @return Ordered factor with new class \code{mic}
2018-07-13 17:23:46 +02:00
#' @keywords mic
2018-02-21 11:52:31 +01:00
#' @export
#' @importFrom dplyr %>%
2018-07-25 14:17:04 +02:00
#' @seealso \code{\link{as.rsi}}
2018-02-22 20:48:48 +01:00
#' @examples
#' mic_data <- as.mic(c(">=32", "1.0", "1", "1.00", 8, "<=0.128", "8", "16", "16"))
#' is.mic(mic_data)
2018-04-02 16:05:09 +02:00
#'
2018-06-19 10:05:38 +02:00
#' # this can also coerce combined MIC/RSI values:
2018-07-25 14:17:04 +02:00
#' as.mic("<=0.002; S") # will return <=0.002
2018-06-19 10:05:38 +02:00
#'
2018-02-22 20:48:48 +01:00
#' plot(mic_data)
2018-03-13 14:34:10 +01:00
#' barplot(mic_data)
2018-08-01 22:37:28 +02:00
#' freq(mic_data)
2018-02-21 11:52:31 +01:00
as.mic <- function ( x , na.rm = FALSE ) {
if ( is.mic ( x ) ) {
x
} else {
x <- x %>% unlist ( )
if ( na.rm == TRUE ) {
x <- x [ ! is.na ( x ) ]
}
x.bak <- x
2018-04-02 16:05:09 +02:00
2018-06-19 10:05:38 +02:00
# comma to period
2018-02-21 11:52:31 +01:00
x <- gsub ( ' ,' , ' .' , x , fixed = TRUE )
2018-06-19 10:05:38 +02:00
# remove space between operator and number ("<= 0.002" -> "<=0.002")
x <- gsub ( ' (<|=|>) +' , ' \\1' , x )
2018-02-21 11:52:31 +01:00
# starting dots must start with 0
2018-05-31 09:02:49 +02:00
x <- gsub ( ' ^[.]+' , ' 0.' , x )
2018-02-21 11:52:31 +01:00
# <=0.2560.512 should be 0.512
x <- gsub ( ' .*[.].*[.]' , ' 0.' , x )
# remove ending .0
2018-05-31 09:02:49 +02:00
x <- gsub ( ' [.]+0$' , ' ' , x )
2018-02-21 11:52:31 +01:00
# remove all after last digit
2018-05-31 09:02:49 +02:00
x <- gsub ( ' [^0-9]+$' , ' ' , x )
2018-02-21 11:52:31 +01:00
# remove last zeroes
2018-08-24 11:08:20 +02:00
x <- gsub ( ' ([.].?)0+$' , ' \\1' , x )
2018-06-19 10:05:38 +02:00
# force to be character
x <- as.character ( x )
2018-04-02 16:05:09 +02:00
2018-08-24 11:08:20 +02:00
# previously unempty values now empty - should return a warning later on
x [x.bak != " " & x == " " ] <- " invalid"
2018-06-19 10:05:38 +02:00
# these are alllowed MIC values and will become factor levels
2018-02-21 11:52:31 +01:00
lvls <- c ( " <0.002" , " <=0.002" , " 0.002" , " >=0.002" , " >0.002" ,
" <0.003" , " <=0.003" , " 0.003" , " >=0.003" , " >0.003" ,
" <0.004" , " <=0.004" , " 0.004" , " >=0.004" , " >0.004" ,
" <0.006" , " <=0.006" , " 0.006" , " >=0.006" , " >0.006" ,
" <0.008" , " <=0.008" , " 0.008" , " >=0.008" , " >0.008" ,
" <0.012" , " <=0.012" , " 0.012" , " >=0.012" , " >0.012" ,
2018-07-28 10:48:27 +02:00
" <0.0125" , " <=0.0125" , " 0.0125" , " >=0.0125" , " >0.0125" ,
2018-02-21 11:52:31 +01:00
" <0.016" , " <=0.016" , " 0.016" , " >=0.016" , " >0.016" ,
" <0.023" , " <=0.023" , " 0.023" , " >=0.023" , " >0.023" ,
2018-03-13 11:57:30 +01:00
" <0.025" , " <=0.025" , " 0.025" , " >=0.025" , " >0.025" ,
2018-02-21 11:52:31 +01:00
" <0.03" , " <=0.03" , " 0.03" , " >=0.03" , " >0.03" ,
" <0.032" , " <=0.032" , " 0.032" , " >=0.032" , " >0.032" ,
" <0.047" , " <=0.047" , " 0.047" , " >=0.047" , " >0.047" ,
" <0.05" , " <=0.05" , " 0.05" , " >=0.05" , " >0.05" ,
2018-07-28 10:48:27 +02:00
" <0.054" , " <=0.054" , " 0.054" , " >=0.054" , " >0.054" ,
2018-02-21 11:52:31 +01:00
" <0.06" , " <=0.06" , " 0.06" , " >=0.06" , " >0.06" ,
" <0.0625" , " <=0.0625" , " 0.0625" , " >=0.0625" , " >0.0625" ,
2018-03-13 11:57:30 +01:00
" <0.063" , " <=0.063" , " 0.063" , " >=0.063" , " >0.063" ,
2018-02-21 11:52:31 +01:00
" <0.064" , " <=0.064" , " 0.064" , " >=0.064" , " >0.064" ,
" <0.09" , " <=0.09" , " 0.09" , " >=0.09" , " >0.09" ,
" <0.094" , " <=0.094" , " 0.094" , " >=0.094" , " >0.094" ,
" <0.12" , " <=0.12" , " 0.12" , " >=0.12" , " >0.12" ,
" <0.125" , " <=0.125" , " 0.125" , " >=0.125" , " >0.125" ,
" <0.128" , " <=0.128" , " 0.128" , " >=0.128" , " >0.128" ,
2018-03-13 11:57:30 +01:00
" <0.16" , " <=0.16" , " 0.16" , " >=0.16" , " >0.16" ,
2018-02-21 11:52:31 +01:00
" <0.19" , " <=0.19" , " 0.19" , " >=0.19" , " >0.19" ,
2018-07-28 10:48:27 +02:00
" <0.23" , " <=0.23" , " 0.23" , " >=0.23" , " >0.23" ,
2018-02-21 11:52:31 +01:00
" <0.25" , " <=0.25" , " 0.25" , " >=0.25" , " >0.25" ,
" <0.256" , " <=0.256" , " 0.256" , " >=0.256" , " >0.256" ,
2018-07-28 10:48:27 +02:00
" <0.28" , " <=0.28" , " 0.28" , " >=0.28" , " >0.28" ,
2018-08-24 11:08:20 +02:00
" <0.3" , " <=0.3" , " 0.3" , " >=0.3" , " >0.3" ,
2018-03-13 11:57:30 +01:00
" <0.32" , " <=0.32" , " 0.32" , " >=0.32" , " >0.32" ,
2018-07-28 10:48:27 +02:00
" <0.36" , " <=0.36" , " 0.36" , " >=0.36" , " >0.36" ,
2018-02-21 11:52:31 +01:00
" <0.38" , " <=0.38" , " 0.38" , " >=0.38" , " >0.38" ,
" <0.5" , " <=0.5" , " 0.5" , " >=0.5" , " >0.5" ,
" <0.512" , " <=0.512" , " 0.512" , " >=0.512" , " >0.512" ,
2018-03-13 11:57:30 +01:00
" <0.64" , " <=0.64" , " 0.64" , " >=0.64" , " >0.64" ,
2018-02-21 11:52:31 +01:00
" <0.75" , " <=0.75" , " 0.75" , " >=0.75" , " >0.75" ,
" <1" , " <=1" , " 1" , " >=1" , " >1" ,
" <1.5" , " <=1.5" , " 1.5" , " >=1.5" , " >1.5" ,
" <2" , " <=2" , " 2" , " >=2" , " >2" ,
" <3" , " <=3" , " 3" , " >=3" , " >3" ,
" <4" , " <=4" , " 4" , " >=4" , " >4" ,
2018-07-28 10:48:27 +02:00
" <5" , " <=5" , " 5" , " >=5" , " >5" ,
2018-02-21 11:52:31 +01:00
" <6" , " <=6" , " 6" , " >=6" , " >6" ,
2018-07-28 10:48:27 +02:00
" <7" , " <=7" , " 7" , " >=7" , " >7" ,
2018-02-21 11:52:31 +01:00
" <8" , " <=8" , " 8" , " >=8" , " >8" ,
" <10" , " <=10" , " 10" , " >=10" , " >10" ,
" <12" , " <=12" , " 12" , " >=12" , " >12" ,
" <16" , " <=16" , " 16" , " >=16" , " >16" ,
" <20" , " <=20" , " 20" , " >=20" , " >20" ,
" <24" , " <=24" , " 24" , " >=24" , " >24" ,
" <32" , " <=32" , " 32" , " >=32" , " >32" ,
" <40" , " <=40" , " 40" , " >=40" , " >40" ,
" <48" , " <=48" , " 48" , " >=48" , " >48" ,
" <64" , " <=64" , " 64" , " >=64" , " >64" ,
" <80" , " <=80" , " 80" , " >=80" , " >80" ,
" <96" , " <=96" , " 96" , " >=96" , " >96" ,
" <128" , " <=128" , " 128" , " >=128" , " >128" ,
" <160" , " <=160" , " 160" , " >=160" , " >160" ,
" <256" , " <=256" , " 256" , " >=256" , " >256" ,
" <320" , " <=320" , " 320" , " >=320" , " >320" ,
" <512" , " <=512" , " 512" , " >=512" , " >512" ,
" <1024" , " <=1024" , " 1024" , " >=1024" , " >1024" )
2018-04-02 16:05:09 +02:00
2018-02-21 11:52:31 +01:00
na_before <- x [is.na ( x ) | x == ' ' ] %>% length ( )
x [ ! x %in% lvls ] <- NA
na_after <- x [is.na ( x ) | x == ' ' ] %>% length ( )
2018-04-02 16:05:09 +02:00
2018-02-21 11:52:31 +01:00
if ( na_before != na_after ) {
list_missing <- x.bak [is.na ( x ) & ! is.na ( x.bak ) & x.bak != ' ' ] %>%
unique ( ) %>%
sort ( )
list_missing <- paste0 ( ' "' , list_missing , ' "' , collapse = " , " )
warning ( na_after - na_before , ' results truncated (' ,
2018-03-19 20:39:23 +01:00
round ( ( ( na_after - na_before ) / length ( x ) ) * 100 ) ,
2018-02-21 11:52:31 +01:00
' %) that were invalid MICs: ' ,
list_missing , call. = FALSE )
}
2018-04-02 16:05:09 +02:00
2018-10-17 17:32:34 +02:00
x <- factor ( x , levels = lvls , ordered = TRUE )
2018-02-21 11:52:31 +01:00
class ( x ) <- c ( ' mic' , ' ordered' , ' factor' )
x
}
}
#' @rdname as.mic
#' @export
#' @importFrom dplyr %>%
is.mic <- function ( x ) {
class ( x ) %>% identical ( c ( ' mic' , ' ordered' , ' factor' ) )
}
#' @exportMethod as.double.mic
#' @export
#' @noRd
as.double.mic <- function ( x , ... ) {
2018-03-13 11:57:30 +01:00
as.double ( gsub ( ' (<|=|>)+' , ' ' , as.character ( x ) ) )
2018-02-21 11:52:31 +01:00
}
#' @exportMethod as.integer.mic
#' @export
#' @noRd
as.integer.mic <- function ( x , ... ) {
2018-03-13 11:57:30 +01:00
as.integer ( gsub ( ' (<|=|>)+' , ' ' , as.character ( x ) ) )
2018-02-21 11:52:31 +01:00
}
#' @exportMethod as.numeric.mic
#' @export
#' @noRd
as.numeric.mic <- function ( x , ... ) {
2018-03-13 11:57:30 +01:00
as.numeric ( gsub ( ' (<|=|>)+' , ' ' , as.character ( x ) ) )
2018-02-21 11:52:31 +01:00
}
#' @exportMethod print.mic
#' @export
#' @importFrom dplyr %>% tibble group_by summarise pull
#' @noRd
print.mic <- function ( x , ... ) {
2018-07-15 22:56:41 +02:00
cat ( " Class 'mic'\n" )
2018-08-01 22:37:28 +02:00
print ( as.character ( x ) , quote = FALSE )
2018-02-21 11:52:31 +01:00
}
#' @exportMethod summary.mic
#' @export
2018-04-03 16:07:32 +02:00
#' @importFrom dplyr %>%
2018-02-21 11:52:31 +01:00
#' @noRd
summary.mic <- function ( object , ... ) {
x <- object
n_total <- x %>% length ( )
x <- x [ ! is.na ( x ) ]
n <- x %>% length ( )
2018-12-07 12:04:55 +01:00
c (
" Class" = ' mic' ,
" <NA>" = n_total - n ,
" Min." = sort ( x ) [1 ] %>% as.character ( ) ,
" Max." = sort ( x ) [n ] %>% as.character ( )
)
2018-02-21 11:52:31 +01:00
}
#' @exportMethod plot.mic
#' @export
#' @importFrom dplyr %>% group_by summarise
#' @importFrom graphics plot text
#' @noRd
plot.mic <- function ( x , ... ) {
x_name <- deparse ( substitute ( x ) )
2018-03-13 14:34:10 +01:00
create_barplot_mic ( x , x_name , ... )
}
#' @exportMethod barplot.mic
#' @export
2018-03-13 15:40:10 +01:00
#' @importFrom graphics barplot axis
2018-03-13 14:34:10 +01:00
#' @noRd
2018-03-13 15:40:10 +01:00
barplot.mic <- function ( height , ... ) {
x_name <- deparse ( substitute ( height ) )
create_barplot_mic ( height , x_name , ... )
2018-03-13 14:34:10 +01:00
}
2018-03-13 15:40:10 +01:00
#' @importFrom graphics barplot axis
2018-08-01 22:37:28 +02:00
#' @importFrom dplyr %>% group_by summarise
2018-03-13 14:34:10 +01:00
create_barplot_mic <- function ( x , x_name , ... ) {
2018-02-21 11:52:31 +01:00
data <- data.frame ( mic = x , cnt = 1 ) %>%
group_by ( mic ) %>%
summarise ( cnt = sum ( cnt ) ) %>%
droplevels ( )
2018-03-13 14:34:10 +01:00
barplot ( table ( droplevels ( x ) ) ,
ylab = ' Frequency' ,
xlab = ' MIC value' ,
2018-04-02 16:05:09 +02:00
main = paste ( ' MIC values of' , x_name ) ,
2018-03-13 14:34:10 +01:00
axes = FALSE ,
... )
axis ( 2 , seq ( 0 , max ( data $ cnt ) ) )
2018-02-21 11:52:31 +01:00
}