2019-01-11 20:37:23 +01:00
<!DOCTYPE html>
2019-10-13 09:31:58 +02:00
<!-- Generated by pkgdown: do not edit by hand --> < html lang = "en" >
< head >
< meta http-equiv = "Content-Type" content = "text/html; charset=UTF-8" >
< meta charset = "utf-8" >
2019-01-11 20:37:23 +01:00
< meta http-equiv = "X-UA-Compatible" content = "IE=edge" >
< meta name = "viewport" content = "width=device-width, initial-scale=1.0" >
2020-12-24 23:29:10 +01:00
< title > Benchmarks • AMR (for R)< / title >
2019-10-13 09:31:58 +02:00
<!-- favicons --> < link rel = "icon" type = "image/png" sizes = "16x16" href = "../favicon-16x16.png" >
2019-01-11 20:37:23 +01:00
< link rel = "icon" type = "image/png" sizes = "32x32" href = "../favicon-32x32.png" >
2019-10-13 09:31:58 +02:00
< link rel = "apple-touch-icon" type = "image/png" sizes = "180x180" href = "../apple-touch-icon.png" >
< link rel = "apple-touch-icon" type = "image/png" sizes = "120x120" href = "../apple-touch-icon-120x120.png" >
< link rel = "apple-touch-icon" type = "image/png" sizes = "76x76" href = "../apple-touch-icon-76x76.png" >
< link rel = "apple-touch-icon" type = "image/png" sizes = "60x60" href = "../apple-touch-icon-60x60.png" >
2020-12-27 00:07:00 +01:00
<!-- jquery --> < script src = "https://cdnjs.cloudflare.com/ajax/libs/jquery/3.4.1/jquery.min.js" integrity = "sha256-CSXorXvZcTkaix6Yvo6HppcZGetbYMGWSFlBw8HfCJo=" crossorigin = "anonymous" > < / script > <!-- Bootstrap --> < link href = "https://cdnjs.cloudflare.com/ajax/libs/bootswatch/3.4.0/flatly/bootstrap.min.css" rel = "stylesheet" crossorigin = "anonymous" >
2020-12-24 23:29:10 +01:00
< script src = "https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.4.1/js/bootstrap.min.js" integrity = "sha256-nuL8/2cJ5NDSSwnKD8VqreErSWHtnEP9E7AySL+1ev4=" crossorigin = "anonymous" > < / script > <!-- bootstrap - toc --> < link rel = "stylesheet" href = "../bootstrap-toc.css" >
2020-04-17 19:16:30 +02:00
< script src = "../bootstrap-toc.js" > < / script > <!-- Font Awesome icons --> < link rel = "stylesheet" href = "https://cdnjs.cloudflare.com/ajax/libs/font-awesome/5.12.1/css/all.min.css" integrity = "sha256-mmgLkCYLUQbXn0B1SRqzHar6dCnv9oZFPEC1g1cwlkk=" crossorigin = "anonymous" >
< link rel = "stylesheet" href = "https://cdnjs.cloudflare.com/ajax/libs/font-awesome/5.12.1/css/v4-shims.min.css" integrity = "sha256-wZjR52fzng1pJHwx4aV2AO3yyTOXrcDW7jBpJtTwVxw=" crossorigin = "anonymous" >
<!-- clipboard.js --> < script src = "https://cdnjs.cloudflare.com/ajax/libs/clipboard.js/2.0.6/clipboard.min.js" integrity = "sha256-inc5kl9MA1hkeYUt+EC3BhlIgyp/2jDIyBLS6k3UxPI=" crossorigin = "anonymous" > < / script > <!-- headroom.js --> < script src = "https://cdnjs.cloudflare.com/ajax/libs/headroom/0.11.0/headroom.min.js" integrity = "sha256-AsUX4SJE1+yuDu5+mAVzJbuYNPHj/WroHuZ8Ir/CkE0=" crossorigin = "anonymous" > < / script > < script src = "https://cdnjs.cloudflare.com/ajax/libs/headroom/0.11.0/jQuery.headroom.min.js" integrity = "sha256-ZX/yNShbjqsohH1k95liqY9Gd8uOiE1S4vZc+9KQ1K4=" crossorigin = "anonymous" > < / script > <!-- pkgdown --> < link href = "../pkgdown.css" rel = "stylesheet" >
2020-02-23 20:56:11 +01:00
< script src = "../pkgdown.js" > < / script > < link href = "../extra.css" rel = "stylesheet" >
2019-10-13 09:31:58 +02:00
< script src = "../extra.js" > < / script > < meta property = "og:title" content = "Benchmarks" >
2020-04-13 21:09:56 +02:00
< meta property = "og:description" content = "AMR" >
2021-12-12 11:07:02 +01:00
< meta property = "og:image" content = "https://msberends.github.io/AMR/logo.svg" >
2021-08-16 21:54:34 +02:00
< meta name = "twitter:card" content = "summary_large_image" >
< meta name = "twitter:creator" content = "@msberends" >
< meta name = "twitter:site" content = "@univgroningen" >
2019-10-13 09:31:58 +02:00
<!-- mathjax --> < script src = "https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/MathJax.js" integrity = "sha256-nvJJv9wWKEm88qvoQl9ekL2J+k/RWIsaSScxxlsrv8k=" crossorigin = "anonymous" > < / script > < script src = "https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/config/TeX-AMS-MML_HTMLorMML.js" integrity = "sha256-84DKXVJXs0/F8OTMzX4UR909+jtl4G7SPypPavF+GfA=" crossorigin = "anonymous" > < / script > <!-- [if lt IE 9]>
2019-01-11 20:37:23 +01:00
< script src = "https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js" > < / script >
< script src = "https://oss.maxcdn.com/respond/1.4.2/respond.min.js" > < / script >
<![endif]-->
2019-10-13 09:31:58 +02:00
< / head >
2020-04-17 19:16:30 +02:00
< body data-spy = "scroll" data-target = "#toc" >
2021-07-23 21:42:11 +02:00
2019-01-11 20:37:23 +01:00
< div class = "container template-article" >
2019-10-13 09:31:58 +02:00
< header > < div class = "navbar navbar-default navbar-fixed-top" role = "navigation" >
2019-01-11 20:37:23 +01:00
< div class = "container" >
< div class = "navbar-header" >
< button type = "button" class = "navbar-toggle collapsed" data-toggle = "collapse" data-target = "#navbar" aria-expanded = "false" >
< span class = "sr-only" > Toggle navigation< / span >
< span class = "icon-bar" > < / span >
< span class = "icon-bar" > < / span >
< span class = "icon-bar" > < / span >
< / button >
< span class = "navbar-brand" >
< a class = "navbar-link" href = "../index.html" > AMR (for R)< / a >
2022-03-14 16:36:10 +01:00
< span class = "version label label-default" data-toggle = "tooltip" data-placement = "bottom" title = "Released version" > 1.8.1< / span >
2019-01-11 20:37:23 +01:00
< / span >
< / div >
< div id = "navbar" class = "navbar-collapse collapse" >
< ul class = "nav navbar-nav" >
2019-10-13 09:31:58 +02:00
< li >
2019-01-11 20:37:23 +01:00
< a href = "../index.html" >
2021-07-23 21:42:11 +02:00
< span class = "fa fa-home" > < / span >
2019-01-11 20:37:23 +01:00
Home
< / a >
< / li >
< li class = "dropdown" >
< a href = "#" class = "dropdown-toggle" data-toggle = "dropdown" role = "button" aria-expanded = "false" >
2021-07-23 21:42:11 +02:00
< span class = "fa fa-question-circle" > < / span >
2019-01-11 20:37:23 +01:00
How to
< span class = "caret" > < / span >
< / a >
< ul class = "dropdown-menu" role = "menu" >
2019-10-13 09:31:58 +02:00
< li >
2019-01-11 20:37:23 +01:00
< a href = "../articles/AMR.html" >
2021-07-23 21:42:11 +02:00
< span class = "fa fa-directions" > < / span >
2019-01-11 20:37:23 +01:00
Conduct AMR analysis
< / a >
< / li >
< li >
2019-02-14 10:23:51 +01:00
< a href = "../articles/resistance_predict.html" >
2021-07-23 21:42:11 +02:00
< span class = "fa fa-dice" > < / span >
2019-01-11 20:37:23 +01:00
Predict antimicrobial resistance
< / a >
< / li >
2020-08-17 21:49:58 +02:00
< li >
< a href = "../articles/datasets.html" >
2021-07-23 21:42:11 +02:00
< span class = "fa fa-database" > < / span >
2020-08-17 21:49:58 +02:00
2020-09-03 20:59:21 +02:00
Data sets for download / own use
2020-08-17 21:49:58 +02:00
< / a >
< / li >
2020-03-07 21:48:21 +01:00
< li >
< a href = "../articles/PCA.html" >
2021-07-23 21:42:11 +02:00
< span class = "fa fa-compress" > < / span >
2020-03-07 21:48:21 +01:00
Conduct principal component analysis for AMR
< / a >
< / li >
2019-05-23 16:58:59 +02:00
< li >
< a href = "../articles/MDR.html" >
2021-07-23 21:42:11 +02:00
< span class = "fa fa-skull-crossbones" > < / span >
2019-05-23 16:58:59 +02:00
Determine multi-drug resistance (MDR)
< / a >
< / li >
2019-01-29 00:06:50 +01:00
< li >
< a href = "../articles/WHONET.html" >
2021-07-23 21:42:11 +02:00
< span class = "fa fa-globe-americas" > < / span >
2019-01-29 00:06:50 +01:00
Work with WHONET data
< / a >
< / li >
2019-02-14 15:18:17 +01:00
< li >
< a href = "../articles/SPSS.html" >
2021-07-23 21:42:11 +02:00
< span class = "fa fa-file-upload" > < / span >
2019-02-14 15:18:17 +01:00
Import data from SPSS/SAS/Stata
< / a >
< / li >
2019-01-11 20:37:23 +01:00
< li >
< a href = "../articles/EUCAST.html" >
2021-07-23 21:42:11 +02:00
< span class = "fa fa-exchange-alt" > < / span >
2019-01-11 20:37:23 +01:00
Apply EUCAST rules
< / a >
< / li >
< li >
2019-02-14 10:23:51 +01:00
< a href = "../reference/mo_property.html" >
2021-07-23 21:42:11 +02:00
< span class = "fa fa-bug" > < / span >
2019-01-11 20:37:23 +01:00
Get properties of a microorganism
< / a >
< / li >
< li >
2019-05-10 16:44:59 +02:00
< a href = "../reference/ab_property.html" >
2021-07-23 21:42:11 +02:00
< span class = "fa fa-capsules" > < / span >
2019-01-11 20:37:23 +01:00
Get properties of an antibiotic
< / a >
< / li >
< li >
< a href = "../articles/benchmarks.html" >
2021-07-23 21:42:11 +02:00
< span class = "fa fa-shipping-fast" > < / span >
2019-01-11 20:37:23 +01:00
Other: benchmarks
< / a >
< / li >
< / ul >
< / li >
< li >
2020-07-28 18:39:57 +02:00
< a href = "../reference/index.html" >
2021-07-23 21:42:11 +02:00
< span class = "fa fa-book-open" > < / span >
2019-01-11 20:37:23 +01:00
Manual
< / a >
< / li >
< li >
< a href = "../authors.html" >
2021-07-23 21:42:11 +02:00
< span class = "fa fa-users" > < / span >
2019-01-11 20:37:23 +01:00
Authors
< / a >
< / li >
< li >
2020-07-28 18:39:57 +02:00
< a href = "../news/index.html" >
2021-05-03 10:47:32 +02:00
< span class = "far fa-newspaper" > < / span >
2019-01-11 20:37:23 +01:00
Changelog
< / a >
< / li >
< / ul >
2019-10-13 09:31:58 +02:00
< ul class = "nav navbar-nav navbar-right" >
< li >
2021-07-23 21:42:11 +02:00
< a href = "https://github.com/msberends/AMR" class = "external-link" >
2021-05-03 10:47:32 +02:00
< span class = "fab fa-github" > < / span >
2019-01-11 20:37:23 +01:00
Source Code
< / a >
< / li >
< / ul >
2019-10-13 09:31:58 +02:00
< / div >
<!-- /.nav - collapse -->
< / div >
<!-- /.container -->
< / div >
<!-- /.navbar -->
2019-01-11 20:37:23 +01:00
2019-09-23 13:53:50 +02:00
2022-03-14 16:43:15 +01:00
< / header > < div class = "row" >
2019-01-11 20:37:23 +01:00
< div class = "col-md-9 contents" >
< div class = "page-header toc-ignore" >
2020-04-17 19:16:30 +02:00
< h1 data-toc-skip > Benchmarks< / h1 >
2019-01-11 20:37:23 +01:00
2021-12-06 11:12:30 +01:00
< small class = "dont-index" > Source: < a href = "https://github.com/msberends/AMR/blob/HEAD/vignettes/benchmarks.Rmd" class = "external-link" > < code > vignettes/benchmarks.Rmd< / code > < / a > < / small >
2019-01-11 20:37:23 +01:00
< div class = "hidden name" > < code > benchmarks.Rmd< / code > < / div >
< / div >
2022-03-14 16:36:10 +01:00
< p > One of the most important features of this package is the complete
microbial taxonomic database, supplied by the < a href = "http://www.catalogueoflife.org" class = "external-link" > Catalogue of Life< / a > (CoL) and
the < a href = "https://lpsn.dsmz.de" class = "external-link" > List of Prokaryotic names with
Standing in Nomenclature< / a > (LPSN). We created a function
< code > < a href = "../reference/as.mo.html" > as.mo()< / a > < / code > that transforms any user input value to a valid
microbial ID by using intelligent rules combined with the microbial
taxonomy.< / p >
< p > Using the < code > microbenchmark< / code > package, we can review the
calculation performance of this function. Its function
< code > < a href = "https://rdrr.io/pkg/microbenchmark/man/microbenchmark.html" class = "external-link" > microbenchmark()< / a > < / code > runs different input expressions
independently of each other and measures their time-to-result.< / p >
2021-05-03 10:47:32 +02:00
< div class = "sourceCode" id = "cb1" > < pre class = "downlit sourceCode r" >
2021-07-23 21:42:11 +02:00
< code class = "sourceCode R" > < span class = "kw" > < a href = "https://rdrr.io/r/base/library.html" class = "external-link" > library< / a > < / span > < span class = "op" > (< / span > < span class = "va" > < a href = "https://github.com/joshuaulrich/microbenchmark/" class = "external-link" > microbenchmark< / a > < / span > < span class = "op" > )< / span >
2022-03-14 16:36:10 +01:00
< span class = "kw" > < a href = "https://rdrr.io/r/base/library.html" class = "external-link" > library< / a > < / span > < span class = "op" > (< / span > < span class = "va" > < a href = "https://msberends.github.io/AMR/" > AMR< / a > < / span > < span class = "op" > )< / span >
2021-07-23 21:42:11 +02:00
< span class = "kw" > < a href = "https://rdrr.io/r/base/library.html" class = "external-link" > library< / a > < / span > < span class = "op" > (< / span > < span class = "va" > < a href = "https://dplyr.tidyverse.org" class = "external-link" > dplyr< / a > < / span > < span class = "op" > )< / span > < / code > < / pre > < / div >
2022-03-14 16:36:10 +01:00
< p > In the next test, we try to ‘coerce’ different input values into the
microbial code of < em > Staphylococcus aureus< / em > . Coercion is a
computational process of forcing output based on an input. For
microorganism names, coercing user input to taxonomically valid
microorganism names is crucial to ensure correct interpretation and to
enable grouping based on taxonomic properties.< / p >
< p > The actual result is the same every time: it returns its
microorganism code < code > B_STPHY_AURS< / code > (< em > B< / em > stands for
< em > Bacteria< / em > , its taxonomic kingdom).< / p >
2019-03-06 14:39:02 +01:00
< p > But the calculation time differs a lot:< / p >
2021-05-03 10:47:32 +02:00
< div class = "sourceCode" id = "cb2" > < pre class = "downlit sourceCode r" >
2021-07-23 21:42:11 +02:00
< code class = "sourceCode R" > < span class = "va" > S.aureus< / span > < span class = "op" > < -< / span > < span class = "fu" > < a href = "https://rdrr.io/pkg/microbenchmark/man/microbenchmark.html" class = "external-link" > microbenchmark< / a > < / span > < span class = "op" > (< / span >
2020-10-15 09:46:41 +02:00
< span class = "fu" > < a href = "../reference/as.mo.html" > as.mo< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "sau"< / span > < span class = "op" > )< / span > , < span class = "co" > # WHONET code< / span >
< span class = "fu" > < a href = "../reference/as.mo.html" > as.mo< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "stau"< / span > < span class = "op" > )< / span > ,
< span class = "fu" > < a href = "../reference/as.mo.html" > as.mo< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "STAU"< / span > < span class = "op" > )< / span > ,
< span class = "fu" > < a href = "../reference/as.mo.html" > as.mo< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "staaur"< / span > < span class = "op" > )< / span > ,
< span class = "fu" > < a href = "../reference/as.mo.html" > as.mo< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "STAAUR"< / span > < span class = "op" > )< / span > ,
< span class = "fu" > < a href = "../reference/as.mo.html" > as.mo< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "S. aureus"< / span > < span class = "op" > )< / span > ,
< span class = "fu" > < a href = "../reference/as.mo.html" > as.mo< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "S aureus"< / span > < span class = "op" > )< / span > ,
< span class = "fu" > < a href = "../reference/as.mo.html" > as.mo< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "Staphylococcus aureus"< / span > < span class = "op" > )< / span > , < span class = "co" > # official taxonomic name< / span >
< span class = "fu" > < a href = "../reference/as.mo.html" > as.mo< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "Staphylococcus aureus (MRSA)"< / span > < span class = "op" > )< / span > , < span class = "co" > # additional text< / span >
< span class = "fu" > < a href = "../reference/as.mo.html" > as.mo< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "Sthafilokkockus aaureuz"< / span > < span class = "op" > )< / span > , < span class = "co" > # incorrect spelling< / span >
< span class = "fu" > < a href = "../reference/as.mo.html" > as.mo< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "MRSA"< / span > < span class = "op" > )< / span > , < span class = "co" > # Methicillin Resistant S. aureus< / span >
< span class = "fu" > < a href = "../reference/as.mo.html" > as.mo< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "VISA"< / span > < span class = "op" > )< / span > , < span class = "co" > # Vancomycin Intermediate S. aureus< / span >
2021-02-22 20:21:33 +01:00
times < span class = "op" > =< / span > < span class = "fl" > 25< / span > < span class = "op" > )< / span >
2022-03-14 16:43:15 +01:00
< span class = "fu" > < a href = "https://docs.ropensci.org/skimr/reference/print.html" class = "external-link" > print< / a > < / span > < span class = "op" > (< / span > < span class = "va" > S.aureus< / span > , unit < span class = "op" > =< / span > < span class = "st" > "ms"< / span > , signif < span class = "op" > =< / span > < span class = "fl" > 2< / span > < span class = "op" > )< / span >
2020-04-17 19:16:30 +02:00
< span class = "co" > # Unit: milliseconds< / span >
2022-03-14 16:43:15 +01:00
< span class = "co" > # expr min lq mean median uq max neval< / span >
< span class = "co" > # as.mo("sau") 12.0 13.0 17.0 14.0 15 53 25< / span >
< span class = "co" > # as.mo("stau") 51.0 59.0 74.0 71.0 90 97 25< / span >
< span class = "co" > # as.mo("STAU") 53.0 60.0 77.0 87.0 91 96 25< / span >
< span class = "co" > # as.mo("staaur") 11.0 13.0 16.0 14.0 15 48 25< / span >
< span class = "co" > # as.mo("STAAUR") 13.0 14.0 19.0 15.0 16 48 25< / span >
< span class = "co" > # as.mo("S. aureus") 28.0 31.0 48.0 59.0 63 70 25< / span >
< span class = "co" > # as.mo("S aureus") 28.0 29.0 42.0 33.0 58 83 25< / span >
< span class = "co" > # as.mo("Staphylococcus aureus") 3.9 4.1 6.1 4.4 5 43 25< / span >
< span class = "co" > # as.mo("Staphylococcus aureus (MRSA)") 250.0 260.0 270.0 270.0 270 390 25< / span >
< span class = "co" > # as.mo("Sthafilokkockus aaureuz") 160.0 190.0 200.0 200.0 220 240 25< / span >
< span class = "co" > # as.mo("MRSA") 13.0 13.0 19.0 14.0 15 50 25< / span >
< span class = "co" > # as.mo("VISA") 21.0 22.0 29.0 24.0 27 61 25< / span > < / code > < / pre > < / div >
2021-02-22 20:21:33 +01:00
< p > < img src = "benchmarks_files/figure-html/unnamed-chunk-4-1.png" width = "750" > < / p >
2022-03-14 16:36:10 +01:00
< p > In the table above, all measurements are shown in milliseconds
(thousandths of a second). A value of 5 milliseconds means it can determine
200 input values per second. In case of 200 milliseconds, this is only 5
input values per second. It is clear that accepted taxonomic names are
2022-03-14 16:43:15 +01:00
extremely fast, but some variations are up to 61 times slower to
2022-03-14 16:36:10 +01:00
determine.< / p >
< p > To improve performance, we implemented two important algorithms to
save unnecessary calculations: < strong > repetitive results< / strong > and
< strong > already precalculated results< / strong > .< / p >
2021-12-06 11:12:30 +01:00
< div class = "section level3" >
< h3 id = "repetitive-results" > Repetitive results< a class = "anchor" aria-label = "anchor" href = "#repetitive-results" > < / a >
< / h3 >
2022-03-14 16:36:10 +01:00
< p > Repetitive results are values that are present more than once in a
vector. Unique values will only be calculated once by
< code > < a href = "../reference/as.mo.html" > as.mo()< / a > < / code > . So running
< code > as.mo(c("E. coli", "E. coli"))< / code > will check the value
< code > "E. coli"< / code > only once.< / p >
< p > To prove this, we will use < code > < a href = "../reference/mo_property.html" > mo_name()< / a > < / code > for testing - a
helper function that returns the full microbial name (genus, species and
possibly subspecies) which uses < code > < a href = "../reference/as.mo.html" > as.mo()< / a > < / code > internally.< / p >
2021-05-03 10:47:32 +02:00
< div class = "sourceCode" id = "cb3" > < pre class = "downlit sourceCode r" >
< code class = "sourceCode R" > < span class = "co" > # start with the example_isolates data set< / span >
2021-12-06 11:12:30 +01:00
< span class = "va" > x< / span > < span class = "op" > < -< / span > < span class = "va" > example_isolates< / span > < span class = "op" > < a href = "https://magrittr.tidyverse.org/reference/pipe.html" class = "external-link" > %> %< / a > < / span >
2021-02-22 20:21:33 +01:00
< span class = "co" > # take all MO codes from the 'mo' column< / span >
2021-12-06 11:12:30 +01:00
< span class = "fu" > < a href = "https://dplyr.tidyverse.org/reference/pull.html" class = "external-link" > pull< / a > < / span > < span class = "op" > (< / span > < span class = "va" > mo< / span > < span class = "op" > )< / span > < span class = "op" > < a href = "https://magrittr.tidyverse.org/reference/pipe.html" class = "external-link" > %> %< / a > < / span >
2020-09-03 20:59:21 +02:00
< span class = "co" > # and copy them a thousand times< / span >
2021-12-06 11:12:30 +01:00
< span class = "fu" > < a href = "https://rdrr.io/r/base/rep.html" class = "external-link" > rep< / a > < / span > < span class = "op" > (< / span > < span class = "fl" > 1000< / span > < span class = "op" > )< / span > < span class = "op" > < a href = "https://magrittr.tidyverse.org/reference/pipe.html" class = "external-link" > %> %< / a > < / span >
2020-09-03 20:59:21 +02:00
< span class = "co" > # then scramble them< / span >
2021-07-23 21:42:11 +02:00
< span class = "fu" > < a href = "https://rdrr.io/r/base/sample.html" class = "external-link" > sample< / a > < / span > < span class = "op" > (< / span > < span class = "op" > )< / span >
2021-02-22 20:21:33 +01:00
< span class = "co" > # what do these values look like? They are of class < mo> :< / span >
2021-07-23 21:42:11 +02:00
< span class = "fu" > < a href = "https://rdrr.io/r/utils/head.html" class = "external-link" > head< / a > < / span > < span class = "op" > (< / span > < span class = "va" > x< / span > < span class = "op" > )< / span >
2021-02-22 20:21:33 +01:00
< span class = "co" > # Class < mo> < / span >
2022-03-14 16:43:15 +01:00
< span class = "co" > # [1] B_ACNTB B_ESCHR_COLI B_STRPT_GRPC B_STPHY_HMNS B_STPHY_CONS< / span >
2022-03-14 16:36:10 +01:00
< span class = "co" > # [6] B_ESCHR_COLI< / span >
2020-08-10 12:46:03 +02:00
2021-02-22 20:21:33 +01:00
< span class = "co" > # as the example_isolates data set has 2,000 rows, we should have 2 million items< / span >
2021-07-23 21:42:11 +02:00
< span class = "fu" > < a href = "https://rdrr.io/r/base/length.html" class = "external-link" > length< / a > < / span > < span class = "op" > (< / span > < span class = "va" > x< / span > < span class = "op" > )< / span >
2020-09-03 20:59:21 +02:00
< span class = "co" > # [1] 2000000< / span >
2020-04-17 19:16:30 +02:00
< span class = "co" > # and how many unique values do we have?< / span >
2021-07-23 21:42:11 +02:00
< span class = "fu" > < a href = "https://dplyr.tidyverse.org/reference/n_distinct.html" class = "external-link" > n_distinct< / a > < / span > < span class = "op" > (< / span > < span class = "va" > x< / span > < span class = "op" > )< / span >
2020-09-03 20:59:21 +02:00
< span class = "co" > # [1] 90< / span >
2020-04-17 19:16:30 +02:00
< span class = "co" > # now let's see:< / span >
2021-07-23 21:42:11 +02:00
< span class = "va" > run_it< / span > < span class = "op" > < -< / span > < span class = "fu" > < a href = "https://rdrr.io/pkg/microbenchmark/man/microbenchmark.html" class = "external-link" > microbenchmark< / a > < / span > < span class = "op" > (< / span > < span class = "fu" > < a href = "../reference/mo_property.html" > mo_name< / a > < / span > < span class = "op" > (< / span > < span class = "va" > x< / span > < span class = "op" > )< / span > ,
2020-10-15 09:46:41 +02:00
times < span class = "op" > =< / span > < span class = "fl" > 10< / span > < span class = "op" > )< / span >
2022-03-14 16:43:15 +01:00
< span class = "fu" > < a href = "https://docs.ropensci.org/skimr/reference/print.html" class = "external-link" > print< / a > < / span > < span class = "op" > (< / span > < span class = "va" > run_it< / span > , unit < span class = "op" > =< / span > < span class = "st" > "ms"< / span > , signif < span class = "op" > =< / span > < span class = "fl" > 3< / span > < span class = "op" > )< / span >
2020-04-17 19:16:30 +02:00
< span class = "co" > # Unit: milliseconds< / span >
2020-10-08 11:16:03 +02:00
< span class = "co" > # expr min lq mean median uq max neval< / span >
2022-03-14 16:43:15 +01:00
< span class = "co" > # mo_name(x) 200 204 265 225 320 392 10< / span > < / code > < / pre > < / div >
2022-03-14 16:36:10 +01:00
< p > So getting official taxonomic names of 2,000,000 (!!) items
2022-03-14 16:43:15 +01:00
consisting of 90 unique values only takes 0.225 seconds. That is 112
2022-03-14 16:36:10 +01:00
nanoseconds per item on average. You only lose time on your unique input
values.< / p >
2019-01-11 20:37:23 +01:00
< / div >
2021-12-06 11:12:30 +01:00
< div class = "section level3" >
< h3 id = "precalculated-results" > Precalculated results< a class = "anchor" aria-label = "anchor" href = "#precalculated-results" > < / a >
< / h3 >
2022-03-14 16:36:10 +01:00
< p > What about precalculated results? If the input is an already
precalculated result of a helper function such as
< code > < a href = "../reference/mo_property.html" > mo_name()< / a > < / code > , it almost doesn’t take any time at all. In other
words, if you run < code > < a href = "../reference/mo_property.html" > mo_name()< / a > < / code > on a valid taxonomic name, it
will return the results immediately (see ‘C’ below):< / p >
2021-05-03 10:47:32 +02:00
< div class = "sourceCode" id = "cb4" > < pre class = "downlit sourceCode r" >
2021-07-23 21:42:11 +02:00
< code class = "sourceCode R" > < span class = "va" > run_it< / span > < span class = "op" > < -< / span > < span class = "fu" > < a href = "https://rdrr.io/pkg/microbenchmark/man/microbenchmark.html" class = "external-link" > microbenchmark< / a > < / span > < span class = "op" > (< / span > A < span class = "op" > =< / span > < span class = "fu" > < a href = "../reference/mo_property.html" > mo_name< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "STAAUR"< / span > < span class = "op" > )< / span > ,
2020-10-15 09:46:41 +02:00
B < span class = "op" > =< / span > < span class = "fu" > < a href = "../reference/mo_property.html" > mo_name< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "S. aureus"< / span > < span class = "op" > )< / span > ,
C < span class = "op" > =< / span > < span class = "fu" > < a href = "../reference/mo_property.html" > mo_name< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "Staphylococcus aureus"< / span > < span class = "op" > )< / span > ,
times < span class = "op" > =< / span > < span class = "fl" > 10< / span > < span class = "op" > )< / span >
2022-03-14 16:43:15 +01:00
< span class = "fu" > < a href = "https://docs.ropensci.org/skimr/reference/print.html" class = "external-link" > print< / a > < / span > < span class = "op" > (< / span > < span class = "va" > run_it< / span > , unit < span class = "op" > =< / span > < span class = "st" > "ms"< / span > , signif < span class = "op" > =< / span > < span class = "fl" > 3< / span > < span class = "op" > )< / span >
2020-04-17 19:16:30 +02:00
< span class = "co" > # Unit: milliseconds< / span >
2022-03-14 16:43:15 +01:00
< span class = "co" > # expr min lq mean median uq max neval< / span >
< span class = "co" > # A 8.35 8.84 9.10 9.01 9.32 10.20 10< / span >
< span class = "co" > # B 23.00 24.70 30.30 25.00 26.90 72.70 10< / span >
< span class = "co" > # C 2.05 2.07 2.44 2.41 2.83 3.05 10< / span > < / code > < / pre > < / div >
2022-03-14 16:36:10 +01:00
< p > So going from < code > mo_name("Staphylococcus aureus")< / code > to
2022-03-14 16:43:15 +01:00
< code > "Staphylococcus aureus"< / code > takes 0.0024 seconds - it doesn’t
2022-03-14 16:36:10 +01:00
even start calculating < em > if the result would be the same as the
expected resulting value< / em > . That goes for all helper functions:< / p >
2021-05-03 10:47:32 +02:00
< div class = "sourceCode" id = "cb5" > < pre class = "downlit sourceCode r" >
2021-07-23 21:42:11 +02:00
< code class = "sourceCode R" > < span class = "va" > run_it< / span > < span class = "op" > < -< / span > < span class = "fu" > < a href = "https://rdrr.io/pkg/microbenchmark/man/microbenchmark.html" class = "external-link" > microbenchmark< / a > < / span > < span class = "op" > (< / span > A < span class = "op" > =< / span > < span class = "fu" > < a href = "../reference/mo_property.html" > mo_species< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "aureus"< / span > < span class = "op" > )< / span > ,
2020-10-15 09:46:41 +02:00
B < span class = "op" > =< / span > < span class = "fu" > < a href = "../reference/mo_property.html" > mo_genus< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "Staphylococcus"< / span > < span class = "op" > )< / span > ,
C < span class = "op" > =< / span > < span class = "fu" > < a href = "../reference/mo_property.html" > mo_name< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "Staphylococcus aureus"< / span > < span class = "op" > )< / span > ,
D < span class = "op" > =< / span > < span class = "fu" > < a href = "../reference/mo_property.html" > mo_family< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "Staphylococcaceae"< / span > < span class = "op" > )< / span > ,
E < span class = "op" > =< / span > < span class = "fu" > < a href = "../reference/mo_property.html" > mo_order< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "Bacillales"< / span > < span class = "op" > )< / span > ,
F < span class = "op" > =< / span > < span class = "fu" > < a href = "../reference/mo_property.html" > mo_class< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "Bacilli"< / span > < span class = "op" > )< / span > ,
G < span class = "op" > =< / span > < span class = "fu" > < a href = "../reference/mo_property.html" > mo_phylum< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "Firmicutes"< / span > < span class = "op" > )< / span > ,
H < span class = "op" > =< / span > < span class = "fu" > < a href = "../reference/mo_property.html" > mo_kingdom< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "Bacteria"< / span > < span class = "op" > )< / span > ,
times < span class = "op" > =< / span > < span class = "fl" > 10< / span > < span class = "op" > )< / span >
2022-03-14 16:43:15 +01:00
< span class = "fu" > < a href = "https://docs.ropensci.org/skimr/reference/print.html" class = "external-link" > print< / a > < / span > < span class = "op" > (< / span > < span class = "va" > run_it< / span > , unit < span class = "op" > =< / span > < span class = "st" > "ms"< / span > , signif < span class = "op" > =< / span > < span class = "fl" > 3< / span > < span class = "op" > )< / span >
2020-04-17 19:16:30 +02:00
< span class = "co" > # Unit: milliseconds< / span >
2021-07-23 21:42:11 +02:00
< span class = "co" > # expr min lq mean median uq max neval< / span >
2022-03-14 16:43:15 +01:00
< span class = "co" > # A 1.89 1.93 2.09 2.05 2.17 2.40 10< / span >
< span class = "co" > # B 1.89 1.93 2.08 2.00 2.19 2.63 10< / span >
< span class = "co" > # C 1.91 1.92 2.10 1.97 2.30 2.43 10< / span >
< span class = "co" > # D 1.90 1.94 2.21 2.02 2.53 2.88 10< / span >
< span class = "co" > # E 1.87 1.95 2.09 2.04 2.22 2.33 10< / span >
< span class = "co" > # F 1.84 1.91 1.97 1.92 2.04 2.14 10< / span >
< span class = "co" > # G 1.87 1.92 2.10 1.96 2.12 2.96 10< / span >
< span class = "co" > # H 1.90 1.96 2.12 2.06 2.21 2.47 10< / span > < / code > < / pre > < / div >
2022-03-14 16:36:10 +01:00
< p > Of course, when running < code > mo_phylum("Firmicutes")< / code > the
function has zero knowledge about the actual microorganism, namely
< em > S. aureus< / em > . But since the result would be
< code > "Firmicutes"< / code > anyway, there is no point in calculating the
result. And because this package contains all phyla of all known
bacteria, it can just return the initial value immediately.< / p >
2019-01-11 20:37:23 +01:00
< / div >
2021-12-06 11:12:30 +01:00
< div class = "section level3" >
< h3 id = "results-in-other-languages" > Results in other languages< a class = "anchor" aria-label = "anchor" href = "#results-in-other-languages" > < / a >
< / h3 >
2022-03-14 16:36:10 +01:00
< p > When the system language is non-English and supported by this
< code > AMR< / code > package, some functions will have a translated result.
This takes almost no extra time (compare “en” from the table below
with the other languages):< / p >
2021-05-03 10:47:32 +02:00
< div class = "sourceCode" id = "cb6" > < pre class = "downlit sourceCode r" >
2021-12-13 10:18:28 +01:00
< code class = "sourceCode R" > < span class = "va" > CoNS< / span > < span class = "op" > < -< / span > < span class = "fu" > < a href = "../reference/as.mo.html" > as.mo< / a > < / span > < span class = "op" > (< / span > < span class = "st" > "CoNS"< / span > < span class = "op" > )< / span >
< span class = "va" > CoNS< / span >
< span class = "co" > # Class < mo> < / span >
< span class = "co" > # [1] B_STPHY_CONS< / span >
< span class = "fu" > < a href = "../reference/mo_property.html" > mo_name< / a > < / span > < span class = "op" > (< / span > < span class = "va" > CoNS< / span > , language < span class = "op" > =< / span > < span class = "st" > "en"< / span > < span class = "op" > )< / span > < span class = "co" > # or just mo_name(CoNS) on an English system< / span >
2020-04-17 19:16:30 +02:00
< span class = "co" > # [1] "Coagulase-negative Staphylococcus (CoNS)"< / span >
2021-12-13 10:18:28 +01:00
< span class = "fu" > < a href = "../reference/mo_property.html" > mo_name< / a > < / span > < span class = "op" > (< / span > < span class = "va" > CoNS< / span > , language < span class = "op" > =< / span > < span class = "st" > "es"< / span > < span class = "op" > )< / span > < span class = "co" > # or just mo_name(CoNS) on a Spanish system< / span >
2020-04-17 19:16:30 +02:00
< span class = "co" > # [1] "Staphylococcus coagulasa negativo (SCN)"< / span >
2021-12-13 10:18:28 +01:00
< span class = "fu" > < a href = "../reference/mo_property.html" > mo_name< / a > < / span > < span class = "op" > (< / span > < span class = "va" > CoNS< / span > , language < span class = "op" > =< / span > < span class = "st" > "nl"< / span > < span class = "op" > )< / span > < span class = "co" > # or just mo_name(CoNS) on a Dutch system< / span >
2020-04-17 19:16:30 +02:00
< span class = "co" > # [1] "Coagulase-negatieve Staphylococcus (CNS)"< / span >
2021-12-13 10:18:28 +01:00
< span class = "va" > run_it< / span > < span class = "op" > < -< / span > < span class = "fu" > < a href = "https://rdrr.io/pkg/microbenchmark/man/microbenchmark.html" class = "external-link" > microbenchmark< / a > < / span > < span class = "op" > (< / span > da < span class = "op" > =< / span > < span class = "fu" > < a href = "../reference/mo_property.html" > mo_name< / a > < / span > < span class = "op" > (< / span > < span class = "va" > CoNS< / span > , language < span class = "op" > =< / span > < span class = "st" > "da"< / span > < span class = "op" > )< / span > ,
de < span class = "op" > =< / span > < span class = "fu" > < a href = "../reference/mo_property.html" > mo_name< / a > < / span > < span class = "op" > (< / span > < span class = "va" > CoNS< / span > , language < span class = "op" > =< / span > < span class = "st" > "de"< / span > < span class = "op" > )< / span > ,
en < span class = "op" > =< / span > < span class = "fu" > < a href = "../reference/mo_property.html" > mo_name< / a > < / span > < span class = "op" > (< / span > < span class = "va" > CoNS< / span > , language < span class = "op" > =< / span > < span class = "st" > "en"< / span > < span class = "op" > )< / span > ,
es < span class = "op" > =< / span > < span class = "fu" > < a href = "../reference/mo_property.html" > mo_name< / a > < / span > < span class = "op" > (< / span > < span class = "va" > CoNS< / span > , language < span class = "op" > =< / span > < span class = "st" > "es"< / span > < span class = "op" > )< / span > ,
fr < span class = "op" > =< / span > < span class = "fu" > < a href = "../reference/mo_property.html" > mo_name< / a > < / span > < span class = "op" > (< / span > < span class = "va" > CoNS< / span > , language < span class = "op" > =< / span > < span class = "st" > "fr"< / span > < span class = "op" > )< / span > ,
it < span class = "op" > =< / span > < span class = "fu" > < a href = "../reference/mo_property.html" > mo_name< / a > < / span > < span class = "op" > (< / span > < span class = "va" > CoNS< / span > , language < span class = "op" > =< / span > < span class = "st" > "it"< / span > < span class = "op" > )< / span > ,
nl < span class = "op" > =< / span > < span class = "fu" > < a href = "../reference/mo_property.html" > mo_name< / a > < / span > < span class = "op" > (< / span > < span class = "va" > CoNS< / span > , language < span class = "op" > =< / span > < span class = "st" > "nl"< / span > < span class = "op" > )< / span > ,
pt < span class = "op" > =< / span > < span class = "fu" > < a href = "../reference/mo_property.html" > mo_name< / a > < / span > < span class = "op" > (< / span > < span class = "va" > CoNS< / span > , language < span class = "op" > =< / span > < span class = "st" > "pt"< / span > < span class = "op" > )< / span > ,
ru < span class = "op" > =< / span > < span class = "fu" > < a href = "../reference/mo_property.html" > mo_name< / a > < / span > < span class = "op" > (< / span > < span class = "va" > CoNS< / span > , language < span class = "op" > =< / span > < span class = "st" > "ru"< / span > < span class = "op" > )< / span > ,
sv < span class = "op" > =< / span > < span class = "fu" > < a href = "../reference/mo_property.html" > mo_name< / a > < / span > < span class = "op" > (< / span > < span class = "va" > CoNS< / span > , language < span class = "op" > =< / span > < span class = "st" > "sv"< / span > < span class = "op" > )< / span > ,
2020-10-15 09:46:41 +02:00
times < span class = "op" > =< / span > < span class = "fl" > 100< / span > < span class = "op" > )< / span >
2022-03-14 16:43:15 +01:00
< span class = "fu" > < a href = "https://docs.ropensci.org/skimr/reference/print.html" class = "external-link" > print< / a > < / span > < span class = "op" > (< / span > < span class = "va" > run_it< / span > , unit < span class = "op" > =< / span > < span class = "st" > "ms"< / span > , signif < span class = "op" > =< / span > < span class = "fl" > 4< / span > < span class = "op" > )< / span >
2020-04-17 19:16:30 +02:00
< span class = "co" > # Unit: milliseconds< / span >
2022-03-14 16:43:15 +01:00
< span class = "co" > # expr min lq mean median uq max neval< / span >
< span class = "co" > # da 2.133 2.304 3.442 2.494 2.816 46.020 100< / span >
< span class = "co" > # de 2.128 2.312 3.068 2.520 2.699 53.220 100< / span >
< span class = "co" > # en 1.014 1.115 1.262 1.227 1.362 2.424 100< / span >
< span class = "co" > # es 2.133 2.338 2.981 2.570 2.737 43.770 100< / span >
< span class = "co" > # fr 1.986 2.149 3.139 2.377 2.567 41.610 100< / span >
< span class = "co" > # it 2.072 2.268 2.911 2.468 2.656 44.560 100< / span >
< span class = "co" > # nl 2.115 2.286 2.962 2.521 2.723 43.240 100< / span >
< span class = "co" > # pt 2.055 2.205 2.912 2.520 2.687 39.520 100< / span >
< span class = "co" > # ru 1.998 2.210 2.866 2.474 2.631 39.820 100< / span >
< span class = "co" > # sv 2.022 2.187 2.759 2.357 2.536 38.560 100< / span > < / code > < / pre > < / div >
2022-03-14 16:36:10 +01:00
< p > Currently supported languages are Danish, Dutch, English, French,
German, Italian, Portuguese, Russian, Spanish and Swedish.< / p >
2019-01-11 20:37:23 +01:00
< / div >
< / div >
2020-04-13 21:09:56 +02:00
< div class = "col-md-3 hidden-xs hidden-sm" id = "pkgdown-sidebar" >
2019-10-13 09:31:58 +02:00
2019-01-11 20:37:23 +01:00
< / div >
< / div >
2019-10-13 09:31:58 +02:00
< footer > < div class = "copyright" >
2021-07-23 21:42:11 +02:00
< p > < / p >
2022-03-14 16:36:10 +01:00
< p > Developed by Matthijs S. Berends, Christian F. Luz, Dennis Souverein,
Erwin E. A. Hassing.< / p >
2019-01-11 20:37:23 +01:00
< / div >
< div class = "pkgdown" >
2021-07-23 21:42:11 +02:00
< p > < / p >
2022-03-14 16:36:10 +01:00
< p > Site built with < a href = "https://pkgdown.r-lib.org/" class = "external-link" > pkgdown< / a >
2.0.2.< / p >
2019-01-11 20:37:23 +01:00
< / div >
2019-10-13 09:31:58 +02:00
2019-01-11 20:37:23 +01:00
< / footer >
2019-10-13 09:31:58 +02:00
< / div >
2019-01-11 20:37:23 +01:00
2020-02-23 20:56:11 +01:00
2021-07-23 21:42:11 +02:00
2020-02-23 20:56:11 +01:00
< / body >
2019-01-11 20:37:23 +01:00
< / html >