From 85917f0c17f88ac3a5634b1e27ebc53eb38d5036 Mon Sep 17 00:00:00 2001 From: Sebastian Fischer Date: Wed, 11 Dec 2024 16:16:04 +0000 Subject: [PATCH] ... --- paper/paper.bib | 12 ++++++++++++ paper/paper.md | 4 +++- 2 files changed, 15 insertions(+), 1 deletion(-) diff --git a/paper/paper.bib b/paper/paper.bib index a31678a73..c9228bf3c 100644 --- a/paper/paper.bib +++ b/paper/paper.bib @@ -184,3 +184,15 @@ @incollection{benchlargescale editor = "Bernd Bischl and Raphael Sonabend and Lars Kotthoff and Michel Lang", url = "https://mlr3book.mlr-org.com/large-scale_benchmarking.html" } + +@article{wilkinson2016fair, + title={The FAIR Guiding Principles for scientific data management and stewardship}, + author={Wilkinson, Mark D and Dumontier, Michel and Aalbersberg, IJsbrand Jan and Appleton, Gabrielle and Axton, Myles and Baak, Arie and Blomberg, Niklas and Boiten, Jan-Willem and da Silva Santos, Luiz Bonino and Bourne, Philip E and others}, + journal={Scientific data}, + volume={3}, + number={1}, + pages={1--9}, + year={2016}, + publisher={Nature Publishing Group} +} + diff --git a/paper/paper.md b/paper/paper.md index 5a71c1f64..cfe02b5a8 100644 --- a/paper/paper.md +++ b/paper/paper.md @@ -119,6 +119,7 @@ Beyond accessibility, `mlr3extralearners` also allows `mlr3` users and package d This **enriches each learner with extensive metadata** about its parameter space, prediction types, and other key attributes. Furthermore, `mlr3extralearners` includes robust mechanisms for **quality assurance**, such as regular sanity checks and verification tests that ensure learner parameters are consistent and up-to-date with the latest versions of their underlying R packages. In order to allow the integration of learners that are not available on `CRAN`, the package is hosted on the [`mlr` R-universe](https://mlr-org.r-universe.dev/). +By providing a standardized interface and comprehensive metadata for each learner, mlr3extralearners enhances the FAIRness (findability, accessibility, interoperability, and reusability) of machine learning algorithms within the R ecosystem [#wilkinson2016fair]). # Statement of Need @@ -162,7 +163,8 @@ Integrating learners from diverse R packages poses challenges, particularly due - **Interface Consistency**: The package regularly verifies that each learner adheres to the expected interface of its upstream function. When new parameters are introduced or existing ones change, the tests fail until the parameter sets are updated accordingly. - **Automated Testing**: To ensure correctness, `mlr3extralearners` performs regular automated tests on all learners. -These tests include sanity checks and validate metadata annotations, such as verifying that a learner claiming to handle missing values works as expected. +These tests include sanity checks that, e.g., verify that the learners produce sensible predictions for simple tasks. +Furthermore, the tests also validate the learners' metadata annotations, such as whether a learner can actually handle missing values or is able to produce importance scores. ## Simplified Integration of New Learners