Skip to contents

This function calculates a normalised mean for antimicrobial resistance between multiple observations.

Usage

mean_amr_distance(x, ...)

# S3 method for default
mean_amr_distance(x, ...)

# S3 method for mic
mean_amr_distance(x, ...)

# S3 method for disk
mean_amr_distance(x, ...)

# S3 method for rsi
mean_amr_distance(x, combine_SI = TRUE, ...)

# S3 method for data.frame
mean_amr_distance(x, ..., combine_SI = TRUE)

distance_from_row(mean_distance, row)

Arguments

x

a vector of class mic, disk or rsi, or a data.frame containing columns of any of these classes

...

variables to select (supports tidy selection such as column1:column4 and where(is.mic)), and can thus also be antibiotic selectors

combine_SI

a logical to indicate whether all values of S and I must be merged into one, so the input only consists of S+I vs. R (susceptible vs. resistant), defaults to TRUE

mean_distance

the outcome of mean_amr_distance()

row

an index, such as a row number

Details

The mean AMR distance is a normalised numeric value to compare AMR test results and can help to identify similar isolates, without comparing antibiograms by hand. For common numeric data this distance is equal to Z scores (the number of standard deviations from the mean).

MIC values (see as.mic()) are transformed with log2() first; their distance is calculated as (log2(x) - mean(log2(x))) / sd(log2(x)).

R/SI values (see as.rsi()) are transformed using "S" = 1, "I" = 2, and "R" = 3. If combine_SI is TRUE (default), the "I" will be considered to be 1.

For data sets, the mean AMR distance will be calculated per variable, after which the mean of all columns will be returned per row (using rowMeans()), see Examples.

Use distance_from_row() to subtract distances from the distance of one row, see Examples.

Interpretation

Isolates whose distances differ from each other by less than 0.01 should be considered similar. Differences lower than 0.025 should be considered suspicious.

Examples

x <- random_mic(10)
x
#> Class <mic>
#>  [1] 0.0625 0.001  0.25   >=128  0.025  1      0.5    0.005  1      16    
mean_amr_distance(x)
#>  [1] -0.41123292 -1.57568929 -0.02085462  1.73584774 -0.66925895  0.36952368
#>  [7]  0.17433453 -1.12247412  0.36952368  1.15028028

y <- data.frame(
  id = LETTERS[1:10],
  amox = random_mic(10, ab = "amox", mo = "Escherichia coli"),
  cipr = random_mic(10, ab = "cipr", mo = "Escherichia coli"),
  gent = random_mic(10, ab = "gent", mo = "Escherichia coli"),
  tobr = random_mic(10, ab = "tobr", mo = "Escherichia coli")
)
y
#>    id amox    cipr   gent tobr
#> 1   A    2       2 <=0.25    4
#> 2   B    4       2      2    4
#> 3   C >=16       2 <=0.25    2
#> 4   D  <=1    0.25      2    2
#> 5   E >=16 <=0.125 <=0.25 0.25
#> 6   F >=16 <=0.125      4 >=16
#> 7   G  <=1       2 <=0.25    4
#> 8   H    4    0.25      4    2
#> 9   I  <=1       1    0.5 >=16
#> 10  J    8       2    0.5 >=16
mean_amr_distance(y)
#> ℹ Calculating mean AMR distance based on columns "amox", "cipr", "gent",
#>   "id" and "tobr"
#> Warning: NAs introduced by coercion
#>  [1] -0.15641280  0.42857996  0.14992674 -0.42197963 -0.81679006  0.57661476
#>  [7] -0.30349990  0.01816313 -0.02817569  0.55357349
y$amr_distance <- mean_amr_distance(y, where(is.mic))
#> ℹ Calculating mean AMR distance based on columns "amox", "cipr", "gent" and
#>   "tobr"
y[order(y$amr_distance), ]
#>    id amox    cipr   gent tobr amr_distance
#> 5   E >=16 <=0.125 <=0.25 0.25  -0.81679006
#> 4   D  <=1    0.25      2    2  -0.42197963
#> 7   G  <=1       2 <=0.25    4  -0.30349990
#> 1   A    2       2 <=0.25    4  -0.15641280
#> 9   I  <=1       1    0.5 >=16  -0.02817569
#> 8   H    4    0.25      4    2   0.01816313
#> 3   C >=16       2 <=0.25    2   0.14992674
#> 2   B    4       2      2    4   0.42857996
#> 10  J    8       2    0.5 >=16   0.55357349
#> 6   F >=16 <=0.125      4 >=16   0.57661476

if (require("dplyr")) {
  y %>%
    mutate(
      amr_distance = mean_amr_distance(., where(is.mic)),
      check_id_C = distance_from_row(amr_distance, id == "C")
    ) %>%
    arrange(check_id_C)
}
#> ℹ Calculating mean AMR distance based on columns "amox", "cipr", "gent" and
#>   "tobr"
#>    id amox    cipr   gent tobr amr_distance check_id_C
#> 1   C >=16       2 <=0.25    2   0.14992674  0.0000000
#> 2   H    4    0.25      4    2   0.01816313  0.1317636
#> 3   I  <=1       1    0.5 >=16  -0.02817569  0.1781024
#> 4   B    4       2      2    4   0.42857996  0.2786532
#> 5   A    2       2 <=0.25    4  -0.15641280  0.3063395
#> 6   J    8       2    0.5 >=16   0.55357349  0.4036468
#> 7   F >=16 <=0.125      4 >=16   0.57661476  0.4266880
#> 8   G  <=1       2 <=0.25    4  -0.30349990  0.4534266
#> 9   D  <=1    0.25      2    2  -0.42197963  0.5719064
#> 10  E >=16 <=0.125 <=0.25 0.25  -0.81679006  0.9667168
if (require("dplyr")) {
  # support for groups
  example_isolates %>%
    filter(mo_genus() == "Enterococcus" & mo_species() != "") %>%
    select(mo, TCY, carbapenems()) %>%
    group_by(mo) %>%
    mutate(d = mean_amr_distance(., where(is.rsi))) %>%
    arrange(mo, d)
}
#> ℹ Using column 'mo' as input for `mo_genus()`
#> ℹ Using column 'mo' as input for `mo_species()`
#> ℹ For `carbapenems()` using columns 'IPM' (imipenem) and 'MEM' (meropenem)
#> ℹ Calculating mean AMR distance based on columns "IPM", "MEM" and "TCY"
#> # A tibble: 63 × 5
#> # Groups:   mo [4]
#>    mo           TCY   IPM   MEM         d
#>    <mo>         <rsi> <rsi> <rsi>   <dbl>
#>  1 B_ENTRC_AVIM S     S     NA    NaN    
#>  2 B_ENTRC_AVIM S     S     NA    NaN    
#>  3 B_ENTRC_CSSL NA    S     NA     NA    
#>  4 B_ENTRC_FACM S     S     NA     -2.66 
#>  5 B_ENTRC_FACM S     R     R      -0.423
#>  6 B_ENTRC_FACM S     R     R      -0.423
#>  7 B_ENTRC_FACM NA    R     R       0.224
#>  8 B_ENTRC_FACM NA    R     R       0.224
#>  9 B_ENTRC_FACM NA    R     R       0.224
#> 10 B_ENTRC_FACM NA    R     R       0.224
#> # … with 53 more rows