├── .Rbuildignore
├── .editorconfig
├── .github
└── workflows
│ ├── pkgdown.yml
│ └── r-cmd-check.yml
├── .gitignore
├── .ignore
├── .lintr
├── DESCRIPTION
├── LICENSE
├── NAMESPACE
├── NEWS.md
├── R
├── DataBackendDplyr.R
├── DataBackendDuckDB.R
├── DataBackendPolars.R
├── as_duckdb_backend.R
├── as_polars_backend.R
├── as_sqlite_backend.R
├── helper.R
└── zzz.R
├── README.Rmd
├── README.md
├── inst
└── extdata
│ ├── spam.parquet
│ ├── userdata1.parquet
│ ├── userdata2.parquet
│ ├── userdata3.parquet
│ ├── userdata4.parquet
│ └── userdata5.parquet
├── man-roxygen
├── field_connector.R
├── field_levels.R
├── param_connector.R
├── param_path.R
├── param_primary_key.R
└── param_strings_as_factors.R
├── man
├── DataBackendDplyr.Rd
├── DataBackendDuckDB.Rd
├── DataBackendPolars.Rd
├── as_duckdb_backend.Rd
├── as_polars_backend.Rd
├── as_sqlite_backend.Rd
├── figures
│ └── logo_navbar.png
└── mlr3db-package.Rd
├── mlr3db.Rproj
├── pkgdown
├── _pkgdown.yml
└── favicon
│ ├── apple-touch-icon-120x120.png
│ ├── apple-touch-icon-152x152.png
│ ├── apple-touch-icon-180x180.png
│ ├── apple-touch-icon-60x60.png
│ ├── apple-touch-icon-76x76.png
│ ├── apple-touch-icon.png
│ ├── favicon-16x16.png
│ ├── favicon-32x32.png
│ └── favicon.ico
└── tests
├── testthat.R
└── testthat
├── helper.R
├── setup.R
├── teardown.R
├── test_as_duckdb_backend.R
├── test_as_polars_backend.R
├── test_as_sqlite_backend.R
├── test_dplyr.R
├── test_duckdb.R
├── test_polars.R
├── test_reconnect.R
├── test_train_predict_dplyr.R
├── test_train_predict_duckdb.R
└── test_train_predict_polars.R
/.Rbuildignore:
--------------------------------------------------------------------------------
1 | ^LICENSE$
2 | .ignore
3 | .editorconfig
4 | .gitignore
5 | ^.git$
6 | ^.github$
7 | ^.*\.Rproj$
8 | ^\.Rproj\.user$
9 | ^man-roxygen$
10 | ^docs$
11 | ^pkgdown$
12 | ^\.ccache$
13 | ^\.github$
14 | ^.lintr$
15 | ^README\.Rmd$
16 |
--------------------------------------------------------------------------------
/.editorconfig:
--------------------------------------------------------------------------------
1 | # See http://editorconfig.org
2 | root = true
3 |
4 | [*]
5 | charset = utf-8
6 | end_of_line = lf
7 | insert_final_newline = true
8 | indent_style = space
9 | trim_trailing_whitespace = true
10 |
11 | [*.{r,R,md,Rmd}]
12 | indent_size = 2
13 |
14 | [*.{c,h}]
15 | indent_size = 4
16 |
17 | [*.{cpp,hpp}]
18 | indent_size = 4
19 |
20 | [{NEWS.md,DESCRIPTION,LICENSE}]
21 | max_line_length = 80
22 |
--------------------------------------------------------------------------------
/.github/workflows/pkgdown.yml:
--------------------------------------------------------------------------------
1 | # pkgdown workflow of the mlr3 ecosystem v0.1.0
2 | # https://github.com/mlr-org/actions
3 | on:
4 | push:
5 | branches:
6 | - main
7 | pull_request:
8 | branches:
9 | - main
10 | release:
11 | types:
12 | - published
13 | workflow_dispatch:
14 |
15 | name: pkgdown
16 |
17 | jobs:
18 | pkgdown:
19 | runs-on: ubuntu-latest
20 |
21 | concurrency:
22 | group: pkgdown-${{ github.event_name != 'pull_request' || github.run_id }}
23 | env:
24 | GITHUB_PAT: ${{ secrets.GITHUB_TOKEN }}
25 | steps:
26 | - uses: actions/checkout@v3
27 |
28 | - uses: r-lib/actions/setup-pandoc@v2
29 |
30 | - uses: r-lib/actions/setup-r@v2
31 | with:
32 | extra-repositories: 'https://community.r-multiverse.org'
33 |
34 | - uses: r-lib/actions/setup-r-dependencies@v2
35 | with:
36 | extra-packages: any::pkgdown, local::.
37 | needs: website
38 |
39 | - name: Install template
40 | run: pak::pkg_install("mlr-org/mlr3pkgdowntemplate")
41 | shell: Rscript {0}
42 |
43 | - name: Build site
44 | run: pkgdown::build_site_github_pages(new_process = FALSE, install = FALSE)
45 | shell: Rscript {0}
46 |
47 | - name: Deploy
48 | if: github.event_name != 'pull_request'
49 | uses: JamesIves/github-pages-deploy-action@v4.4.1
50 | with:
51 | clean: false
52 | branch: gh-pages
53 | folder: docs
54 |
--------------------------------------------------------------------------------
/.github/workflows/r-cmd-check.yml:
--------------------------------------------------------------------------------
1 | # r cmd check workflow of the mlr3 ecosystem v0.1.0
2 | # https://github.com/mlr-org/actions
3 | on:
4 | workflow_dispatch:
5 | push:
6 | branches:
7 | - main
8 | pull_request:
9 | branches:
10 | - main
11 |
12 | name: r-cmd-check
13 |
14 | jobs:
15 | r-cmd-check:
16 | runs-on: ${{ matrix.config.os }}
17 |
18 | name: ${{ matrix.config.os }} (${{ matrix.config.r }})
19 |
20 | env:
21 | GITHUB_PAT: ${{ secrets.GITHUB_TOKEN }}
22 |
23 | strategy:
24 | fail-fast: false
25 | matrix:
26 | config:
27 | - {os: ubuntu-latest, r: 'devel'}
28 | - {os: ubuntu-latest, r: 'release'}
29 |
30 | steps:
31 | - uses: actions/checkout@v3
32 |
33 | - uses: r-lib/actions/setup-r@v2
34 | with:
35 | r-version: ${{ matrix.config.r }}
36 | extra-repositories: 'https://community.r-multiverse.org'
37 |
38 | - uses: r-lib/actions/setup-r-dependencies@v2
39 | with:
40 | extra-packages: any::rcmdcheck
41 | needs: check
42 |
43 | - uses: r-lib/actions/check-r-package@v2
44 |
--------------------------------------------------------------------------------
/.gitignore:
--------------------------------------------------------------------------------
1 | .Rproj.user
2 | .Rhistory
3 | .RData
4 | .Ruserdata
5 | docs/
6 | .DS_Store
7 |
--------------------------------------------------------------------------------
/.ignore:
--------------------------------------------------------------------------------
1 | man/
2 | docs/
3 | pkgdown/
4 |
--------------------------------------------------------------------------------
/.lintr:
--------------------------------------------------------------------------------
1 | linters: linters_with_defaults(
2 | # lintr defaults: https://github.com/jimhester/lintr#available-linters
3 | # the following setup changes/removes certain linters
4 | assignment_linter = NULL, # do not force using <- for assignments
5 | object_name_linter = object_name_linter(c("snake_case", "CamelCase")), # only allow snake case and camel case object names
6 | cyclocomp_linter = NULL, # do not check function complexity
7 | commented_code_linter = NULL, # allow code in comments
8 | line_length_linter = line_length_linter(120)
9 | )
10 |
11 |
--------------------------------------------------------------------------------
/DESCRIPTION:
--------------------------------------------------------------------------------
1 | Package: mlr3db
2 | Title: Data Base Backend for 'mlr3'
3 | Version: 0.5.1-9000
4 | Authors@R:
5 | c(
6 | person(given = "Michel",
7 | family = "Lang",
8 | role = c("cre", "aut"),
9 | email = "michellang@gmail.com",
10 | comment = c(ORCID = "0000-0001-9754-0393")),
11 | person(given = "Lona",
12 | family = "Koers",
13 | role = c("aut"),
14 | email = "lona.koers@gmail.com")
15 | )
16 | Description: Extends the 'mlr3' package with a backend to
17 | transparently work with databases such as 'SQLite', 'DuckDB', 'MySQL',
18 | 'MariaDB', or 'PostgreSQL'. The package provides two additional backends:
19 | 'DataBackendDplyr' relies on the abstraction of package 'dbplyr' to
20 | interact with most DBMS. 'DataBackendDuckDB' operates on 'DuckDB' data bases
21 | and also on Apache Parquet files.
22 | License: LGPL-3
23 | URL: https://mlr3db.mlr-org.com,
24 | https://github.com/mlr-org/mlr3db
25 | BugReports: https://github.com/mlr-org/mlr3db/issues
26 | Depends:
27 | mlr3 (>= 0.13.0),
28 | R (>= 3.1.0)
29 | Imports:
30 | R6,
31 | backports,
32 | checkmate,
33 | data.table,
34 | mlr3misc (>= 0.10.0)
35 | Suggests:
36 | DBI,
37 | RSQLite,
38 | dbplyr,
39 | dplyr,
40 | duckdb (>= 0.4.0),
41 | future,
42 | future.apply,
43 | future.callr,
44 | lgr,
45 | polars,
46 | testthat (>= 3.0.0),
47 | tibble
48 | Encoding: UTF-8
49 | Config/testthat/edition: 3
50 | Roxygen: list(markdown = TRUE)
51 | RoxygenNote: 7.3.2
52 |
--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
1 | GNU LESSER GENERAL PUBLIC LICENSE
2 | Version 3, 29 June 2007
3 |
4 | Copyright (C) 2007 Free Software Foundation, Inc.
5 | Everyone is permitted to copy and distribute verbatim copies
6 | of this license document, but changing it is not allowed.
7 |
8 |
9 | This version of the GNU Lesser General Public License incorporates
10 | the terms and conditions of version 3 of the GNU General Public
11 | License, supplemented by the additional permissions listed below.
12 |
13 | 0. Additional Definitions.
14 |
15 | As used herein, "this License" refers to version 3 of the GNU Lesser
16 | General Public License, and the "GNU GPL" refers to version 3 of the GNU
17 | General Public License.
18 |
19 | "The Library" refers to a covered work governed by this License,
20 | other than an Application or a Combined Work as defined below.
21 |
22 | An "Application" is any work that makes use of an interface provided
23 | by the Library, but which is not otherwise based on the Library.
24 | Defining a subclass of a class defined by the Library is deemed a mode
25 | of using an interface provided by the Library.
26 |
27 | A "Combined Work" is a work produced by combining or linking an
28 | Application with the Library. The particular version of the Library
29 | with which the Combined Work was made is also called the "Linked
30 | Version".
31 |
32 | The "Minimal Corresponding Source" for a Combined Work means the
33 | Corresponding Source for the Combined Work, excluding any source code
34 | for portions of the Combined Work that, considered in isolation, are
35 | based on the Application, and not on the Linked Version.
36 |
37 | The "Corresponding Application Code" for a Combined Work means the
38 | object code and/or source code for the Application, including any data
39 | and utility programs needed for reproducing the Combined Work from the
40 | Application, but excluding the System Libraries of the Combined Work.
41 |
42 | 1. Exception to Section 3 of the GNU GPL.
43 |
44 | You may convey a covered work under sections 3 and 4 of this License
45 | without being bound by section 3 of the GNU GPL.
46 |
47 | 2. Conveying Modified Versions.
48 |
49 | If you modify a copy of the Library, and, in your modifications, a
50 | facility refers to a function or data to be supplied by an Application
51 | that uses the facility (other than as an argument passed when the
52 | facility is invoked), then you may convey a copy of the modified
53 | version:
54 |
55 | a) under this License, provided that you make a good faith effort to
56 | ensure that, in the event an Application does not supply the
57 | function or data, the facility still operates, and performs
58 | whatever part of its purpose remains meaningful, or
59 |
60 | b) under the GNU GPL, with none of the additional permissions of
61 | this License applicable to that copy.
62 |
63 | 3. Object Code Incorporating Material from Library Header Files.
64 |
65 | The object code form of an Application may incorporate material from
66 | a header file that is part of the Library. You may convey such object
67 | code under terms of your choice, provided that, if the incorporated
68 | material is not limited to numerical parameters, data structure
69 | layouts and accessors, or small macros, inline functions and templates
70 | (ten or fewer lines in length), you do both of the following:
71 |
72 | a) Give prominent notice with each copy of the object code that the
73 | Library is used in it and that the Library and its use are
74 | covered by this License.
75 |
76 | b) Accompany the object code with a copy of the GNU GPL and this license
77 | document.
78 |
79 | 4. Combined Works.
80 |
81 | You may convey a Combined Work under terms of your choice that,
82 | taken together, effectively do not restrict modification of the
83 | portions of the Library contained in the Combined Work and reverse
84 | engineering for debugging such modifications, if you also do each of
85 | the following:
86 |
87 | a) Give prominent notice with each copy of the Combined Work that
88 | the Library is used in it and that the Library and its use are
89 | covered by this License.
90 |
91 | b) Accompany the Combined Work with a copy of the GNU GPL and this license
92 | document.
93 |
94 | c) For a Combined Work that displays copyright notices during
95 | execution, include the copyright notice for the Library among
96 | these notices, as well as a reference directing the user to the
97 | copies of the GNU GPL and this license document.
98 |
99 | d) Do one of the following:
100 |
101 | 0) Convey the Minimal Corresponding Source under the terms of this
102 | License, and the Corresponding Application Code in a form
103 | suitable for, and under terms that permit, the user to
104 | recombine or relink the Application with a modified version of
105 | the Linked Version to produce a modified Combined Work, in the
106 | manner specified by section 6 of the GNU GPL for conveying
107 | Corresponding Source.
108 |
109 | 1) Use a suitable shared library mechanism for linking with the
110 | Library. A suitable mechanism is one that (a) uses at run time
111 | a copy of the Library already present on the user's computer
112 | system, and (b) will operate properly with a modified version
113 | of the Library that is interface-compatible with the Linked
114 | Version.
115 |
116 | e) Provide Installation Information, but only if you would otherwise
117 | be required to provide such information under section 6 of the
118 | GNU GPL, and only to the extent that such information is
119 | necessary to install and execute a modified version of the
120 | Combined Work produced by recombining or relinking the
121 | Application with a modified version of the Linked Version. (If
122 | you use option 4d0, the Installation Information must accompany
123 | the Minimal Corresponding Source and Corresponding Application
124 | Code. If you use option 4d1, you must provide the Installation
125 | Information in the manner specified by section 6 of the GNU GPL
126 | for conveying Corresponding Source.)
127 |
128 | 5. Combined Libraries.
129 |
130 | You may place library facilities that are a work based on the
131 | Library side by side in a single library together with other library
132 | facilities that are not Applications and are not covered by this
133 | License, and convey such a combined library under terms of your
134 | choice, if you do both of the following:
135 |
136 | a) Accompany the combined library with a copy of the same work based
137 | on the Library, uncombined with any other library facilities,
138 | conveyed under the terms of this License.
139 |
140 | b) Give prominent notice with the combined library that part of it
141 | is a work based on the Library, and explaining where to find the
142 | accompanying uncombined form of the same work.
143 |
144 | 6. Revised Versions of the GNU Lesser General Public License.
145 |
146 | The Free Software Foundation may publish revised and/or new versions
147 | of the GNU Lesser General Public License from time to time. Such new
148 | versions will be similar in spirit to the present version, but may
149 | differ in detail to address new problems or concerns.
150 |
151 | Each version is given a distinguishing version number. If the
152 | Library as you received it specifies that a certain numbered version
153 | of the GNU Lesser General Public License "or any later version"
154 | applies to it, you have the option of following the terms and
155 | conditions either of that published version or of any later version
156 | published by the Free Software Foundation. If the Library as you
157 | received it does not specify a version number of the GNU Lesser
158 | General Public License, you may choose any version of the GNU Lesser
159 | General Public License ever published by the Free Software Foundation.
160 |
161 | If the Library as you received it specifies that a proxy can decide
162 | whether future versions of the GNU Lesser General Public License shall
163 | apply, that proxy's public statement of acceptance of any version is
164 | permanent authorization for you to choose that version for the
165 | Library.
166 |
--------------------------------------------------------------------------------
/NAMESPACE:
--------------------------------------------------------------------------------
1 | # Generated by roxygen2: do not edit by hand
2 |
3 | S3method(as_data_backend,RPolarsDataFrame)
4 | S3method(as_data_backend,RPolarsLazyFrame)
5 | S3method(as_data_backend,tbl_SQLiteConnection)
6 | S3method(as_data_backend,tbl_duckdb_connection)
7 | S3method(as_data_backend,tbl_lazy)
8 | S3method(as_duckdb_backend,DataBackend)
9 | S3method(as_duckdb_backend,character)
10 | S3method(as_duckdb_backend,data.frame)
11 | S3method(as_polars_backend,DataBackend)
12 | S3method(as_polars_backend,data.frame)
13 | S3method(as_sqlite_backend,DataBackend)
14 | S3method(as_sqlite_backend,data.frame)
15 | export(DataBackendDplyr)
16 | export(DataBackendDuckDB)
17 | export(DataBackendPolars)
18 | export(as_duckdb_backend)
19 | export(as_polars_backend)
20 | export(as_sqlite_backend)
21 | if (getRversion() >= "3.6.0") S3method(dplyr::show_query, DataBackendDplyr)
22 | import(checkmate)
23 | import(data.table)
24 | importFrom(R6,R6Class)
25 | importFrom(mlr3,DataBackend)
26 | importFrom(mlr3,as_data_backend)
27 | importFrom(mlr3misc,calculate_hash)
28 | importFrom(mlr3misc,map_lgl)
29 | importFrom(stats,setNames)
30 | importFrom(utils,head)
31 |
--------------------------------------------------------------------------------
/NEWS.md:
--------------------------------------------------------------------------------
1 | # mlr3db 0.5.2
2 |
3 | - Bugfix: `DataBackendDuckDB` calculated missing values incorrectly.
4 | - Compatibility with future versions of `dbplyr` (#35).
5 |
6 | # mlr3db 0.5.1
7 |
8 | - Compatibility with new duckdb version (#36).
9 |
10 | # mlr3db 0.5.0
11 |
12 | - Support for parquet files as Backend via DuckDB.
13 | - New converter `as_duckdb_backend()`.
14 |
15 | # mlr3db 0.4.2
16 |
17 | - Compatibility fixes with new duckdb version.
18 |
19 | # mlr3db 0.4.1
20 |
21 | - Temporarily disabled some tests to overcome some regressions in duckdb.
22 |
23 | # mlr3db 0.4.0
24 |
25 | * Added a `show_query()` method for `DataBackendDplyr` (#4).
26 | * A reconnector is automatically added in `as_data_backend()` for objects of
27 | type `tbl_SQLiteConnection` and `tbl_duckdb_connection`.
28 |
29 | # mlr3db 0.3.0
30 |
31 | * New backend `DataBackendDuckDB`.
32 | * `dplyr` is now optional (moved from imports to suggests).
33 |
34 | # mlr3db 0.2.0
35 |
36 | * Set a primary key for SQLite databases generated from data frames.
37 | * Set a reconnector for SQLite databases generated from data frames.
38 | * Resolved a warning signaled by dplyr-1.0.0.
39 |
40 | # mlr3db 0.1.5
41 |
42 | * `as_data_backend()` method to construct a `DataBackendDplyr` now specialized
43 | to operate on objects of type `"tbl_lazy"` (was `"tbl"` before). This way,
44 | local `"tbl"` objects such as tibbles are converted to a
45 | `DataBackendDataTable` by `mlr3::as_data_backend.data.frame()`.
46 |
47 | # mlr3db 0.1.4
48 |
49 | * Connections can now be automatically re-connected via a user-provided function.
50 | * `DataBackendDplyr` now has a finalizer which automatically disconnects the
51 | database connection during garbage collection.
52 |
53 | # mlr3db 0.1.3
54 |
55 | * During construction of `DataBackendDplyr`, you can now select columns to be
56 | converted from string to factor. This simplifies the work with SQL databases
57 | which do not naturally support factors (or where the level information is
58 | lost in the transaction).
59 |
60 | # mlr3db 0.1.2
61 |
62 | * Fixed `$distinct()` to not return missing values per default.
63 | * Added `na_rm` argument to `$distinct()`.
64 | * Renamed `as_sqlite()` to `as_sqlite_backend()`
65 |
66 | # mlr3db 0.1.1
67 |
68 | * Initial release.
69 |
--------------------------------------------------------------------------------
/R/DataBackendDplyr.R:
--------------------------------------------------------------------------------
1 | #' @title DataBackend for dplyr/dbplyr
2 | #'
3 | #' @description
4 | #' A [mlr3::DataBackend] using [dplyr::tbl()] from packages \CRANpkg{dplyr}/\CRANpkg{dbplyr}.
5 | #' This includes [`tibbles`][tibble::tibble()] and abstract database connections interfaced by \CRANpkg{dbplyr}.
6 | #' The latter allows [mlr3::Task]s to interface an out-of-memory database.
7 | #'
8 | #'
9 | #' @param rows `integer()`\cr
10 | #' Row indices.
11 | #' @param cols `character()`\cr
12 | #' Column names.
13 | #' @param data_format (`character(1)`)\cr
14 | #' Desired data format, e.g. `"data.table"` or `"Matrix"`.
15 | #' @param na_rm `logical(1)`\cr
16 | #' Whether to remove NAs or not.
17 | #'
18 | #' @template param_primary_key
19 | #' @template param_strings_as_factors
20 | #' @template param_connector
21 | #'
22 | #' @importFrom mlr3 DataBackend
23 | #' @export
24 | #' @examples
25 | #' if (mlr3misc::require_namespaces(c("tibble", "RSQLite", "dbplyr"), quietly = TRUE)) {
26 | #' # Backend using a in-memory tibble
27 | #' data = tibble::as_tibble(iris)
28 | #' data$Sepal.Length[1:30] = NA
29 | #' data$row_id = 1:150
30 | #' b = DataBackendDplyr$new(data, primary_key = "row_id")
31 | #'
32 | #' # Object supports all accessors of DataBackend
33 | #' print(b)
34 | #' b$nrow
35 | #' b$ncol
36 | #' b$colnames
37 | #' b$data(rows = 100:101, cols = "Species")
38 | #' b$distinct(b$rownames, "Species")
39 | #'
40 | #' # Classification task using this backend
41 | #' task = mlr3::TaskClassif$new(id = "iris_tibble", backend = b, target = "Species")
42 | #' print(task)
43 | #' head(task)
44 | #'
45 | #' # Create a temporary SQLite database
46 | #' con = DBI::dbConnect(RSQLite::SQLite(), ":memory:")
47 | #' dplyr::copy_to(con, data)
48 | #' tbl = dplyr::tbl(con, "data")
49 | #'
50 | #' # Define a backend on a subset of the database: do not use column "Sepal.Width"
51 | #' tbl = dplyr::select_at(tbl, setdiff(colnames(tbl), "Sepal.Width"))
52 | #' tbl = dplyr::filter(tbl, row_id %in% 1:120) # Use only first 120 rows
53 | #' b = DataBackendDplyr$new(tbl, primary_key = "row_id")
54 | #' print(b)
55 | #'
56 | #' # Query distinct values
57 | #' b$distinct(b$rownames, "Species")
58 | #'
59 | #' # Query number of missing values
60 | #' b$missings(b$rownames, b$colnames)
61 | #'
62 | #' # Note that SQLite does not support factors, column Species has been converted to character
63 | #' lapply(b$head(), class)
64 | #'
65 | #' # Cleanup
66 | #' rm(tbl)
67 | #' DBI::dbDisconnect(con)
68 | #' }
69 | DataBackendDplyr = R6Class("DataBackendDplyr", inherit = DataBackend, cloneable = FALSE,
70 | public = list(
71 | #' @template field_levels
72 | levels = NULL,
73 |
74 | #' @template field_connector
75 | connector = NULL,
76 |
77 | #' @description
78 | #'
79 | #' Creates a backend for a [dplyr::tbl()] object.
80 | #'
81 | #' @param data ([dplyr::tbl()])\cr
82 | #' The data object.
83 | #'
84 | #' Instead of calling the constructor yourself, you can call [mlr3::as_data_backend()]
85 | #' on a [dplyr::tbl()].
86 | #' Note that only objects of class `"tbl_lazy"` will be converted to a [DataBackendDplyr]
87 | #' (this includes all connectors from \CRANpkg{dbplyr}).
88 | #' Local `"tbl"` objects such as [`tibbles`][tibble::tibble()] will be converted to a
89 | #' [DataBackendDataTable][mlr3::DataBackendDataTable].
90 | initialize = function(data, primary_key, strings_as_factors = TRUE, connector = NULL) {
91 | loadNamespace("DBI")
92 | loadNamespace("dbplyr")
93 |
94 | if (!dplyr::is.tbl(data)) {
95 | stop("Argument 'data' must be of class 'tbl'")
96 | }
97 |
98 | if (inherits(data, "tbl_sql")) {
99 | requireNamespace("dbplyr")
100 | }
101 |
102 | super$initialize(data, primary_key)
103 | assert_choice(primary_key, colnames(data))
104 |
105 | if (isFALSE(strings_as_factors)) {
106 | self$levels = list()
107 | } else {
108 | h = self$head(1L)
109 | string_cols = setdiff(names(h)[map_lgl(h, is.character)], self$primary_key)
110 |
111 | if (isTRUE(strings_as_factors)) {
112 | strings_as_factors = string_cols
113 | } else {
114 | assert_subset(strings_as_factors, string_cols)
115 | }
116 |
117 | self$levels = self$distinct(rows = NULL, cols = strings_as_factors)
118 | }
119 |
120 | self$connector = assert_function(connector, args = character(), null.ok = TRUE)
121 | },
122 |
123 | #' @description
124 | #' Finalizer which disconnects from the database.
125 | #' This is called during garbage collection of the instance.
126 | #' @return `logical(1)`, the return value of [DBI::dbDisconnect()].
127 | finalize = function() {
128 | if (isTRUE(self$valid)) {
129 | DBI::dbDisconnect(private$.data$src$con)
130 | }
131 | },
132 |
133 | #' @description
134 | #' Returns a slice of the data.
135 | #' Calls [dplyr::filter()] and [dplyr::select()] on the table and converts it to a [data.table::data.table()].
136 | #'
137 | #' The rows must be addressed as vector of primary key values, columns must be referred to via column names.
138 | #' Queries for rows with no matching row id and queries for columns with no matching
139 | #' column name are silently ignored.
140 | #' Rows are guaranteed to be returned in the same order as `rows`, columns may be returned in an arbitrary order.
141 | #' Duplicated row ids result in duplicated rows, duplicated column names lead to an exception.
142 | data = function(rows, cols, data_format = "data.table") {
143 | private$.reconnect()
144 | rows = assert_integerish(rows, coerce = TRUE)
145 | assert_names(cols, type = "unique")
146 | assert_choice(data_format, self$data_formats)
147 | cols = intersect(cols, colnames(private$.data))
148 |
149 | res = setDT(dplyr::collect(dplyr::select_at(
150 | dplyr::filter_at(private$.data, self$primary_key, dplyr::all_vars(. %in% rows)),
151 | union(cols, self$primary_key))))
152 |
153 | recode(res[list(rows), cols, nomatch = NULL, with = FALSE, on = self$primary_key],
154 | self$levels)
155 | },
156 |
157 | #' @description
158 | #' Retrieve the first `n` rows.
159 | #'
160 | #' @param n (`integer(1)`)\cr
161 | #' Number of rows.
162 | #'
163 | #' @return [data.table::data.table()] of the first `n` rows.
164 | head = function(n = 6L) {
165 | private$.reconnect()
166 | recode(setDT(dplyr::collect(head(private$.data, n))), self$levels)
167 | },
168 |
169 | #' @description
170 | #' Returns a named list of vectors of distinct values for each column
171 | #' specified. If `na_rm` is `TRUE`, missing values are removed from the
172 | #' returned vectors of distinct values. Non-existing rows and columns are
173 | #' silently ignored.
174 | #'
175 | #' @return Named `list()` of distinct values.
176 | distinct = function(rows, cols, na_rm = TRUE) {
177 | private$.reconnect()
178 | # TODO: what does dplyr::distinct return for enums?
179 | assert_names(cols, type = "unique")
180 | cols = intersect(cols, self$colnames)
181 |
182 | tbl = private$.data
183 | if (!is.null(rows)) {
184 | tbl = dplyr::filter_at(tbl, self$primary_key, dplyr::all_vars(. %in% rows))
185 | }
186 |
187 | get_distinct = function(col) {
188 | x = dplyr::collect(dplyr::distinct(dplyr::select_at(tbl, col)))[[1L]]
189 | if (is.factor(x)) {
190 | x = as.character(x)
191 | }
192 | if (na_rm) {
193 | x = x[!is.na(x)]
194 | }
195 | x
196 | }
197 | setNames(lapply(cols, get_distinct), cols)
198 | },
199 |
200 | #' @description
201 | #' Returns the number of missing values per column in the specified slice
202 | #' of data. Non-existing rows and columns are silently ignored.
203 | #'
204 | #' @return Total of missing values per column (named `numeric()`).
205 | missings = function(rows, cols) {
206 | private$.reconnect()
207 | rows = assert_integerish(rows, coerce = TRUE)
208 | assert_names(cols, type = "unique")
209 |
210 | cols = intersect(cols, self$colnames)
211 | if (length(cols) == 0L) {
212 | return(setNames(integer(0L), character(0L)))
213 | }
214 |
215 | res = dplyr::collect(dplyr::summarize_at(
216 | dplyr::filter_at(private$.data, self$primary_key, dplyr::all_vars(. %in% rows)),
217 | cols, list(~ sum(is.na(.), na.rm = TRUE))))
218 |
219 | if (nrow(res) == 0L) {
220 | return(setNames(integer(length(cols)), cols))
221 | }
222 | unlist(res, recursive = FALSE)
223 | }
224 | ),
225 |
226 | active = list(
227 | #' @field rownames (`integer()`)\cr
228 | #' Returns vector of all distinct row identifiers, i.e. the contents of the primary key column.
229 | rownames = function() {
230 | private$.reconnect()
231 | dplyr::collect(dplyr::select_at(private$.data, self$primary_key))[[1L]]
232 | },
233 |
234 | #' @field colnames (`character()`)\cr
235 | #' Returns vector of all column names, including the primary key column.
236 | colnames = function() {
237 | private$.reconnect()
238 | colnames(private$.data)
239 | },
240 |
241 | #' @field nrow (`integer(1)`)\cr
242 | #' Number of rows (observations).
243 | nrow = function() {
244 | private$.reconnect()
245 | dplyr::collect(dplyr::tally(private$.data))[[1L]]
246 | },
247 |
248 | #' @field ncol (`integer(1)`)\cr
249 | #' Number of columns (variables), including the primary key column.
250 | ncol = function() {
251 | private$.reconnect()
252 | ncol(private$.data)
253 | },
254 |
255 | #' @field valid (`logical(1)`)\cr
256 | #' Returns `NA` if the data does not inherit from `"tbl_sql"` (i.e., it is not a real SQL data base).
257 | #' Returns the result of [DBI::dbIsValid()] otherwise.
258 | valid = function() {
259 | if (!inherits(private$.data, "tbl_sql")) {
260 | return(NA)
261 | }
262 |
263 | loadNamespace("DBI")
264 | loadNamespace("dbplyr")
265 |
266 | # workaround for https://github.com/r-dbi/DBI/issues/302
267 | force(names(private$.data$src$con))
268 |
269 | DBI::dbIsValid(private$.data$src$con)
270 | }
271 | ),
272 |
273 | private = list(
274 | .calculate_hash = function() {
275 | private$.reconnect()
276 | calculate_hash(private$.data)
277 | },
278 |
279 | .reconnect = function() {
280 | if (isFALSE(self$valid)) {
281 | if (is.null(self$connector)) {
282 | stop("Invalid connection. Provide a connector during construction to automatically reconnect", call. = FALSE)
283 | }
284 |
285 | con = self$connector()
286 |
287 | if (!all(class(private$.data$src$con) == class(con))) {
288 | stop(sprintf("Reconnecting failed. Expected a connection of class %s, but got %s",
289 | paste0(class(private$.data$src$con), collapse = "/"), paste0(class(con), collapse = "/")), call. = FALSE)
290 | }
291 |
292 | private$.data$src$con = con
293 | }
294 | }
295 | )
296 | )
297 |
298 | #' @importFrom mlr3 as_data_backend
299 | #' @export
300 | as_data_backend.tbl_SQLiteConnection = function(data, primary_key, strings_as_factors = TRUE, ...) { # nolint
301 | b = DataBackendDplyr$new(data, primary_key)
302 | path = data$src$con@dbname
303 | if (!identical(path, ":memory:") && test_string(path) && file.exists(path)) {
304 | b$connector = sqlite_reconnector(path)
305 | }
306 | return(b)
307 | }
308 |
309 | #' @importFrom mlr3 as_data_backend
310 | #' @export
311 | as_data_backend.tbl_lazy = function(data, primary_key, strings_as_factors = TRUE, ...) { # nolint
312 | DataBackendDplyr$new(data, primary_key)
313 | }
314 |
315 | #' @rawNamespace if (getRversion() >= "3.6.0") S3method(dplyr::show_query, DataBackendDplyr)
316 | show_query.DataBackendDplyr = function(x, ...) { # nolint
317 | requireNamespace("dplyr")
318 | requireNamespace("dbplyr")
319 | dplyr::show_query(x$.__enclos_env__$private$.data)
320 | }
321 |
--------------------------------------------------------------------------------
/R/DataBackendDuckDB.R:
--------------------------------------------------------------------------------
1 | #' @title DataBackend for DuckDB
2 | #'
3 | #' @description
4 | #' A [mlr3::DataBackend] for \CRANpkg{duckdb}.
5 | #' Can be easily constructed with [as_duckdb_backend()].
6 | #'
7 | #' @seealso
8 | #' \url{https://duckdb.org/}
9 | #'
10 | #' @param rows `integer()`\cr
11 | #' Row indices.
12 | #' @param cols `character()`\cr
13 | #' Column names.
14 | #' @param data_format (`character(1)`)\cr
15 | #' Desired data format, e.g. `"data.table"` or `"Matrix"`.
16 | #' @param na_rm `logical(1)`\cr
17 | #' Whether to remove NAs or not.
18 | #'
19 | #' @template param_primary_key
20 | #' @template param_strings_as_factors
21 | #' @template param_connector
22 | #'
23 | #' @importFrom mlr3 DataBackend
24 | #' @export
25 | DataBackendDuckDB = R6Class("DataBackendDuckDB", inherit = DataBackend, cloneable = FALSE,
26 | public = list(
27 | #' @template field_levels
28 | levels = NULL,
29 |
30 | #' @template field_connector
31 | connector = NULL,
32 |
33 | #' @field table (`character(1)`)\cr
34 | #' Data base table or view to operate on.
35 | table = NULL,
36 |
37 | #' @description
38 | #'
39 | #' Creates a backend for a [duckdb::duckdb()] database.
40 | #'
41 | #' @param data (connection)\cr
42 | #' A connection created with [DBI::dbConnect()].
43 | #' If constructed manually (and not via the helper function [as_duckdb_backend()],
44 | #' make sure that there exists an (unique) index for the key column.
45 | #' @param table (`character(1)`)\cr
46 | #' Table or view to operate on.
47 | initialize = function(data, table, primary_key, strings_as_factors = TRUE, connector = NULL) {
48 | loadNamespace("duckdb")
49 |
50 | assert_class(data, "duckdb_connection")
51 | super$initialize(data, primary_key)
52 | self$table = assert_string(table)
53 |
54 | info = self$table_info
55 | assert_choice(self$primary_key, info$name)
56 | assert_choice(self$table, DBI::dbGetQuery(private$.data, "PRAGMA show_tables")$name)
57 | self$connector = assert_function(connector, args = character(), null.ok = TRUE)
58 |
59 | if (isFALSE(strings_as_factors)) {
60 | self$levels = list()
61 | } else {
62 | string_cols = info$name[tolower(info$type) %in% c("varchar", "string", "text")]
63 | string_cols = setdiff(string_cols, self$primary_key)
64 |
65 | if (isTRUE(strings_as_factors)) {
66 | strings_as_factors = string_cols
67 | } else {
68 | assert_subset(strings_as_factors, string_cols)
69 | }
70 |
71 | self$levels = self$distinct(rows = NULL, cols = strings_as_factors)
72 | }
73 |
74 | },
75 |
76 | #' @description
77 | #' Finalizer which disconnects from the database.
78 | #' This is called during garbage collection of the instance.
79 | #' @return `logical(1)`, the return value of [DBI::dbDisconnect()].
80 | finalize = function() {
81 | if (isTRUE(self$valid)) {
82 | DBI::dbDisconnect(private$.data, shutdown = TRUE)
83 | }
84 | },
85 |
86 | #' @description
87 | #' Returns a slice of the data.
88 | #'
89 | #' The rows must be addressed as vector of primary key values, columns must be referred to via column names.
90 | #' Queries for rows with no matching row id and queries for columns with no matching
91 | #' column name are silently ignored.
92 | #' Rows are guaranteed to be returned in the same order as `rows`, columns may be returned in an arbitrary order.
93 | #' Duplicated row ids result in duplicated rows, duplicated column names lead to an exception.
94 |     data = function(rows, cols, data_format = "data.table") {
95 |       private$.reconnect()
96 |       rows = assert_integerish(rows, coerce = TRUE)
97 |       assert_names(cols, type = "unique")
98 |       assert_choice(data_format, self$data_formats)
99 |       cols = intersect(cols, self$colnames)  # silently drop unknown columns
100 |       tmp_tbl = write_temp_table(private$.data, rows)  # stage requested row ids as a temp table for the join
101 |       on.exit(DBI::dbRemoveTable(private$.data, tmp_tbl, temporary = TRUE))
102 | 
103 |       query = sprintf('SELECT %1$s FROM "%2$s" INNER JOIN "%3$s" ON "%2$s"."row_id" = "%3$s"."%4$s"',
104 |         paste0(sprintf('"%s"."%s"', self$table, union(cols, self$primary_key)), collapse = ","),
105 |         tmp_tbl, self$table, self$primary_key)
106 | 
107 |       res = setDT(DBI::dbGetQuery(private$.data, query), key = self$primary_key)
108 |       recode(res[list(rows), cols, nomatch = NULL, on = self$primary_key, with = FALSE],
109 |         self$levels)  # join on `rows` restores requested order/duplicates; recode() applies stored factor levels
110 |     },
111 |
112 | #' @description
113 | #' Retrieve the first `n` rows.
114 | #'
115 | #' @param n (`integer(1)`)\cr
116 | #' Number of rows.
117 | #'
118 | #' @return [data.table::data.table()] of the first `n` rows.
119 | head = function(n = 6L) {
120 | private$.reconnect()
121 | res = DBI::dbGetQuery(private$.data,
122 | sprintf('SELECT * FROM "%s" ORDER BY "%s" LIMIT %i', self$table, self$primary_key, n))
123 | recode(setDT(res), self$levels)
124 | },
125 |
126 | #' @description
127 | #' Returns a named list of vectors of distinct values for each column
128 | #' specified. If `na_rm` is `TRUE`, missing values are removed from the
129 | #' returned vectors of distinct values. Non-existing rows and columns are
130 | #' silently ignored.
131 | #'
132 | #' @return Named `list()` of distinct values.
133 | distinct = function(rows, cols, na_rm = TRUE) {
134 | private$.reconnect()
135 | assert_names(cols, type = "unique")
136 | cols = intersect(cols, self$colnames)
137 | order = sprintf('ORDER BY "%s"', self$primary_key)
138 |
139 | if (is.null(rows)) {
140 | get_query = function(col) {
141 | sprintf('SELECT DISTINCT("%s") FROM "%s"', col, self$table)
142 | }
143 | } else {
144 | tmp_tbl = write_temp_table(private$.data, rows)
145 | on.exit(DBI::dbRemoveTable(private$.data, tmp_tbl, temporary = TRUE))
146 |
147 | get_query = function(col) {
148 | sprintf('SELECT DISTINCT("%1$s"."%2$s") FROM "%3$s" LEFT JOIN "%1$s" ON "%3$s"."row_id" = "%1$s"."%4$s"',
149 | self$table, col, tmp_tbl, self$primary_key)
150 | }
151 | }
152 |
153 | res = lapply(cols, function(col) {
154 | query = get_query(col)
155 | if (na_rm) {
156 | query = sprintf('%s WHERE "%s"."%s" IS NOT NULL', query, self$table, col)
157 | }
158 | levels = DBI::dbGetQuery(private$.data, paste(query, order))[[1L]]
159 | if (is.factor(levels)) as.character(levels) else levels
160 | })
161 |
162 | setNames(res, cols)
163 | },
164 |
165 | #' @description
166 | #' Returns the number of missing values per column in the specified slice
167 | #' of data. Non-existing rows and columns are silently ignored.
168 | #'
169 | #' @return Total of missing values per column (named `numeric()`).
170 | missings = function(rows, cols) {
171 | private$.reconnect()
172 | rows = assert_integerish(rows, coerce = TRUE)
173 | assert_names(cols, type = "unique")
174 |
175 | cols = intersect(cols, self$colnames)
176 | if (length(cols) == 0L) {
177 | return(setNames(integer(0L), character(0L)))
178 | }
179 |
180 | tmp_tbl = write_temp_table(private$.data, rows)
181 | on.exit(DBI::dbRemoveTable(private$.data, tmp_tbl, temporary = TRUE))
182 |
183 | query = sprintf('SELECT %1$s FROM (SELECT * FROM "%2$s" INNER JOIN "%3$s" ON "%2$s"."%4$s" = "%3$s"."row_id")',
184 | paste0(sprintf('COUNT("%s")', cols), collapse = ","),
185 | self$table,
186 | tmp_tbl,
187 | self$primary_key
188 | )
189 |
190 | counts = unlist(DBI::dbGetQuery(private$.data, query), recursive = FALSE)
191 | setNames(as.integer(length(rows) - counts), cols)
192 | }
193 | ),
194 |
195 | active = list(
196 | #' @field table_info (`data.frame()`)\cr
197 | #' Data frame as returned by pragma `table_info()`.
198 | table_info = function() {
199 | private$.reconnect()
200 | DBI::dbGetQuery(private$.data, sprintf("PRAGMA table_info('%s')", self$table))
201 | },
202 |
203 | #' @field rownames (`integer()`)\cr
204 | #' Returns vector of all distinct row identifiers, i.e. the contents of the primary key column.
205 | rownames = function() {
206 | private$.reconnect()
207 | res = DBI::dbGetQuery(private$.data,
208 | sprintf('SELECT "%1$s" FROM "%2$s" ORDER BY "%1$s"', self$primary_key, self$table))
209 | res[[1L]]
210 | },
211 |
212 | #' @field colnames (`character()`)\cr
213 | #' Returns vector of all column names, including the primary key column.
214 | colnames = function() {
215 | private$.reconnect()
216 | self$table_info$name
217 | },
218 |
219 | #' @field nrow (`integer(1)`)\cr
220 | #' Number of rows (observations).
221 | nrow = function() {
222 | private$.reconnect()
223 | res = DBI::dbGetQuery(private$.data,
224 | sprintf('SELECT COUNT(*) AS n FROM "%s"', self$table))
225 | as.integer(res$n)
226 | },
227 |
228 | #' @field ncol (`integer(1)`)\cr
229 | #' Number of columns (variables), including the primary key column.
230 | ncol = function() {
231 | private$.reconnect()
232 | nrow(self$table_info)
233 | },
234 |
235 |     #' @field valid (`logical(1)`)\cr
236 |     #' Returns the result of [DBI::dbIsValid()] on the stored duckdb connection.
238 | valid = function() {
239 | loadNamespace("DBI")
240 | loadNamespace("duckdb")
241 | DBI::dbIsValid(private$.data)
242 | }
243 | ),
244 |
245 | private = list(
246 | .calculate_hash = function() {
247 | private$.reconnect()
248 | calculate_hash(private$.data@driver@dbdir)
249 | },
250 |
251 |     .reconnect = function() {
252 |       # Re-establish the duckdb connection via the user-supplied connector if it
253 |       # became invalid (e.g. after serialization to a different R session).
254 |       if (isFALSE(self$valid)) {
255 |         if (is.null(self$connector)) {
256 |           stop("Invalid connection. Provide a connector during construction to automatically reconnect", call. = FALSE)
257 |         }
258 | 
259 |         con = self$connector()
260 | 
261 |         # For this backend, private$.data IS the (S4) duckdb connection. The old
262 |         # code built the error message from private$.data$src$con, which does not
263 |         # exist here ($ on an S4 connection errors) -- that was copied from the
264 |         # dplyr backend. Use class(private$.data), matching the check above.
265 |         if (!all(class(private$.data) == class(con))) {
266 |           stop(sprintf("Reconnecting failed. Expected a connection of class %s, but got %s",
267 |             paste0(class(private$.data), collapse = "/"), paste0(class(con), collapse = "/")), call. = FALSE)
268 |         }
269 | 
270 |         private$.data = con
271 |       }
272 |     }
267 | )
268 | )
269 |
270 | # Writes the requested row ids into a pid-unique temporary table and returns
271 | # its name; the caller is responsible for dropping the table afterwards.
272 | write_temp_table = function(con, rows) {
273 |   tbl_name = sprintf("rows_%i", Sys.getpid())
274 |   row_ids = data.frame(row_id = sort(unique(rows)))
275 |   DBI::dbWriteTable(con, tbl_name, row_ids, temporary = TRUE, overwrite = TRUE, append = FALSE)
276 |   tbl_name
277 | }
276 |
277 | #' @importFrom mlr3 as_data_backend
278 | #' @export
279 | as_data_backend.tbl_duckdb_connection = function(data, primary_key, strings_as_factors = TRUE, ...) { # nolint
280 |   # `data` is a dbplyr lazy table on a duckdb connection (note data$src$con
281 |   # below), not a raw DBI connection, so it must be wrapped in a
282 |   # DataBackendDplyr -- cf. the tbl_SQLiteConnection method. The previous
283 |   # DataBackendDuckDB$new(data, primary_key) call would fail its
284 |   # assert_class(data, "duckdb_connection") and misplace primary_key as `table`.
285 |   b = DataBackendDplyr$new(data, primary_key)
286 |   # for file-backed databases, install a connector so the backend can
287 |   # transparently re-open the database after serialization
288 |   path = data$src$con@driver@dbdir
289 |   if (!identical(path, ":memory:") && test_string(path) && file.exists(path)) {
290 |     b$connector = duckdb_reconnector(path)
291 |   }
292 |   return(b)
293 | }
287 |
--------------------------------------------------------------------------------
/R/DataBackendPolars.R:
--------------------------------------------------------------------------------
1 | #' @title DataBackend for Polars
2 | #'
3 | #' @description
4 | #' A [mlr3::DataBackend] using `RPolarsLazyFrame` from package \CRANpkg{polars}.
5 | #' Can be easily constructed with [as_polars_backend()].
6 | #' [mlr3::Task]s can interface out-of-memory files if the `polars::RPolarsLazyFrame` was imported using a `polars::scan_x` function.
7 | #' Streaming, a \CRANpkg{polars} alpha feature, is always enabled, but only used when applicable.
8 | #' A connector is not required but can be useful e.g. for scanning larger than memory files
9 | #'
10 | #' @seealso
11 | #' \url{https://pola-rs.github.io/r-polars/}
12 | #'
13 | #' @param rows (`integer()`)\cr
14 | #' Row indices.
15 | #' @param cols (`character()`)\cr
16 | #' Column names.
17 | #' @param na_rm (`logical(1)`)\cr
18 | #' Whether to remove NAs or not.
19 | #' @param primary_key (`character(1)`)\cr
20 | #' Name of the primary key column.
21 | #' Because `polars` does not natively support primary keys, uniqueness of the primary key column is expected but not enforced.
22 | #' @param connector (`function()`)\cr
23 | #' Optional function which is called to re-connect to e.g. a source file in case the connection became invalid.
24 | #'
25 | #' @template param_strings_as_factors
26 | #'
27 | #' @importFrom mlr3 DataBackend
28 | #' @export
29 | #' @examples
30 | #' if (mlr3misc::require_namespaces("polars", quietly = TRUE)) {
31 | #' # Backend using a in-memory data set
32 | #' data = iris
33 | #' data$Sepal.Length[1:30] = NA
34 | #' data$row_id = 1:150
35 | #' data = polars::as_polars_lf(data)
36 | #' b = DataBackendPolars$new(data, primary_key = "row_id")
37 | #'
38 | #' # Object supports all accessors of DataBackend
39 | #' print(b)
40 | #' b$nrow
41 | #' b$ncol
42 | #' b$colnames
43 | #' b$data(rows = 100:101, cols = "Species")
44 | #' b$distinct(b$rownames, "Species")
45 | #'
46 | #' # Classification task using this backend
47 | #' task = mlr3::TaskClassif$new(id = "iris_polars", backend = b, target = "Species")
48 | #' print(task)
49 | #' head(task)
50 | #'
51 | #' # Write a parquet file to scan
52 | #' data$collect()$write_parquet("iris.parquet")
53 | #' data = polars::pl$scan_parquet("iris.parquet")
54 | #'
55 | #' # Backend that re-reads the parquet file if the connection fails
56 | #' b = DataBackendPolars$new(data, "row_id",
57 | #' connector = function() polars::pl$scan_parquet("iris.parquet"))
58 | #' print(b)
59 | #'
60 | #' # Define a backend on a subset of the database: do not use column "Sepal.Width"
61 | #' data = data$select(
62 | #' polars::pl$col(setdiff(colnames(data), "Sepal.Width"))
63 | #' )$filter(
64 | #' polars::pl$col("row_id")$is_in(1:120) # Use only first 120 rows
65 | #' )
66 | #'
67 | #' # Backend with only scanned data
68 | #' b = DataBackendPolars$new(data, "row_id", strings_as_factors = TRUE)
69 | #' print(b)
70 | #'
71 | #' # Query distinct values
72 | #' b$distinct(b$rownames, "Species")
73 | #'
74 | #' # Query number of missing values
75 | #' b$missings(b$rownames, b$colnames)
76 | #'
77 | #' # Cleanup
78 | #' if (file.exists("iris.parquet")) {
79 | #' file.remove("iris.parquet")
80 | #' }
81 | #' }
82 | DataBackendPolars = R6Class("DataBackendPolars", inherit = DataBackend, cloneable = FALSE,
83 | public = list(
84 | #' @template field_levels
85 | levels = NULL,
86 |
87 | #' @template field_connector
88 | connector = NULL,
89 |
90 | #' @description
91 | #'
92 | #' Creates a backend for a [polars::RPolarsDataFrame] object.
93 | #'
94 | #' @param data ([polars::RPolarsLazyFrame])\cr
95 | #' The data object.
96 | #'
97 | #' Instead of calling the constructor itself, please call [mlr3::as_data_backend()] on
98 | #' a [polars::RPolarsLazyFrame] or [polars::RPolarsDataFrame].
99 | #' Note that only [polars::RPolarsLazyFrame]s will be converted to a [DataBackendPolars].
100 | #' [polars::RPolarsDataFrame] objects without lazy execution will be converted to a
101 | #' [DataBackendDataTable][mlr3::DataBackendDataTable].
102 |     initialize = function(data, primary_key, strings_as_factors = TRUE, connector = NULL) {
103 |       loadNamespace("polars")
104 |       # assert_class() checks inheritance and tolerates class() returning a
105 |       # vector; assert_choice(class(data), ...) would error on multi-class objects
106 |       assert_class(data, "RPolarsLazyFrame")
107 | 
108 |       super$initialize(data, primary_key)
109 |       assert_choice(primary_key, colnames(data))
110 |       self$connector = assert_function(connector, args = character(), null.ok = TRUE)
111 | 
112 |       if (isFALSE(strings_as_factors)) {
113 |         self$levels = list()  # factor recoding disabled
114 |       } else {
115 |         # detect string-like columns from a one-row sample of the frame
116 |         h = self$head(1L)
117 |         string_cols = setdiff(names(h)[map_lgl(h, function(x) {is.character(x) || is.factor(x)})], self$primary_key)
118 | 
119 |         if (isTRUE(strings_as_factors)) {
120 |           strings_as_factors = string_cols
121 |         } else {
122 |           assert_subset(strings_as_factors, string_cols)
123 |         }
124 | 
125 |         # store complete level sets so recoding is deterministic across slices
126 |         self$levels = self$distinct(rows = NULL, cols = strings_as_factors)
127 |       }
128 |     },
125 |
126 | #' @description
127 | #' Returns a slice of the data.
128 | #'
129 | #' The rows must be addressed as vector of primary key values, columns must be referred to via column names.
130 | #' Queries for rows with no matching row id and queries for columns with no matching
131 | #' column name are silently ignored.
132 | data = function(rows, cols) {
133 | private$.reconnect()
134 | rows = assert_integerish(rows, coerce = TRUE)
135 | assert_names(cols, type = "unique")
136 | cols = intersect(cols, self$colnames)
137 |
138 | data = private$.data
139 | res = data$filter(polars::pl$col(self$primary_key)$is_in(rows))$select(polars::pl$col(union(self$primary_key, cols)))$collect(streaming = TRUE)
140 | res = as.data.table(res)
141 |
142 | recode(res[list(rows), cols, nomatch = NULL, on = self$primary_key, with = FALSE],
143 | self$levels)
144 | },
145 |
146 | #' @description
147 | #' Retrieve the first `n` rows.
148 | #'
149 | #' @param n (`integer(1)`)\cr
150 | #' Number of rows.
151 | #'
152 | #' @return [data.table::data.table()] of the first `n` rows.
153 | head = function(n = 6L) {
154 | private$.reconnect()
155 | recode(as.data.table(private$.data$head(n)$collect(streaming = TRUE)), self$levels)
156 | },
157 |
158 | #' @description
159 | #' Returns a named list of vectors of distinct values for each column
160 | #' specified. If `na_rm` is `TRUE`, missing values are removed from the
161 | #' returned vectors of distinct values. Non-existing rows and columns are
162 | #' silently ignored.
163 | #'
164 | #' @return Named `list()` of distinct values.
165 | distinct = function(rows, cols, na_rm = TRUE) {
166 | private$.reconnect()
167 | assert_names(cols, type = "unique")
168 | cols = intersect(cols, self$colnames)
169 |
170 | dat = private$.data
171 |
172 | if (!is.null(rows)) {
173 | dat = dat$filter(polars::pl$col(self$primary_key)$is_in(rows))
174 | }
175 |
176 | get_distinct = function(col) {
177 | x = as.vector(
178 | dat$select(
179 | polars::pl$col(col)$unique()
180 | )$collect(streaming = TRUE)$get_column(col)
181 | )
182 |
183 | if (is.factor(x)) {
184 | x = as.character(x)
185 | }
186 | if (na_rm) {
187 | x = x[!is.na(x)]
188 | }
189 | x
190 | }
191 | setNames(lapply(cols, get_distinct), cols)
192 | },
193 |
194 | #' @description
195 | #' Returns the number of missing values per column in the specified slice
196 | #' of data. Non-existing rows and columns are silently ignored.
197 | #'
198 | #' @return Total of missing values per column (named `numeric()`).
199 | missings = function(rows, cols) {
200 | private$.reconnect()
201 | rows = assert_integerish(rows, coerce = TRUE)
202 | assert_names(cols, type = "unique")
203 |
204 | cols = intersect(cols, self$colnames)
205 | if (length(cols) == 0L) {
206 | return(setNames(integer(0L), character(0L)))
207 | }
208 |
209 | res = private$.data$filter(
210 | polars::pl$col(self$primary_key)$is_in(rows)
211 | )
212 | res = res$select(
213 | lapply(cols, function(col) {
214 | polars::pl$col(col)$is_null()$sum()$alias(col)
215 | })
216 | )$collect(streaming = TRUE)
217 |
218 | if (res$height == 0L) {
219 | return(setNames(integer(length(cols)), cols))
220 | }
221 |
222 | setNames(mlr3misc::map_int(cols, function(col) as.integer(as.vector(res$get_column(col)))), cols)
223 | }
224 | ),
225 |
226 | active = list(
227 | #' @field rownames (`integer()`)\cr
228 | #' Returns vector of all distinct row identifiers, i.e. the contents of the primary key column.
229 | rownames = function() {
230 | private$.reconnect()
231 |
232 | as.vector(
233 | private$.data$
234 | select(polars::pl$col(self$primary_key))$
235 | collect()$
236 | get_column(self$primary_key)
237 | )
238 | },
239 |
240 | #' @field colnames (`character()`)\cr
241 | #' Returns vector of all column names, including the primary key column.
242 | colnames = function() {
243 | private$.reconnect()
244 | names(private$.data$schema)
245 | },
246 |
247 | #' @field nrow (`integer(1)`)\cr
248 | #' Number of rows (observations).
249 | nrow = function() {
250 | private$.reconnect()
251 | n = private$.data$select(polars::pl$len())$collect(streaming = TRUE)$item()
252 | as.integer(n)
253 | },
254 |
255 | #' @field ncol (`integer(1)`)\cr
256 | #' Number of columns (variables), including the primary key column.
257 | ncol = function() {
258 | private$.reconnect()
259 | length(private$.data$schema)
260 | }
261 | ),
262 |
263 | private = list(
264 | .calculate_hash = function() {
265 | private$.reconnect()
266 | calculate_hash(private$.data)
267 | },
268 |
269 |     .reconnect = function() {  # refresh the lazy frame from the connector; no-op without one
270 |       if (is.null(self$connector)) {
271 |         return(invisible())  # lazy frames have no validity probe, so absence of a connector means "keep as is"
272 |       }
273 | 
274 |       con = self$connector()  # note: runs on every accessor call when a connector is set
275 | 
276 |       if (!all(class(private$.data) == class(con))) {  # replacement must have the same class
277 |         stop(sprintf("Reconnecting failed. Expected a connection of class %s, but got %s",
278 |           paste0(class(private$.data), collapse = "/"), paste0(class(con), collapse = "/")), call. = FALSE)
279 |       }
280 | 
281 |       private$.data = con
282 |     }
283 | )
284 | )
285 |
286 | #' @importFrom mlr3 as_data_backend
287 | #' @export
288 | as_data_backend.RPolarsDataFrame = function(data, primary_key = NULL, ...) { # nolint
289 |   # eager polars frames are materialized and delegated to mlr3's data.frame
290 |   # method, yielding a DataBackendDataTable
291 |   tab = as.data.frame(data)
292 | 
293 |   # mlr3 expects integer row ids; narrow an integerish primary key column
294 |   if (!is.null(primary_key) && test_integerish(tab[[primary_key]])) {
295 |     tab[[primary_key]] = as.integer(tab[[primary_key]])
296 |   }
297 | 
298 |   as_data_backend(tab, primary_key = primary_key)
299 | }
297 |
298 | #' @importFrom mlr3 as_data_backend
299 | #' @export
300 | as_data_backend.RPolarsLazyFrame = function(data, primary_key, strings_as_factors = TRUE, ...) { # nolint
301 |   # lazy frames keep their deferred execution inside a DataBackendPolars
302 |   backend = DataBackendPolars$new(data, primary_key, strings_as_factors)
303 |   backend
304 | }
303 |
--------------------------------------------------------------------------------
/R/as_duckdb_backend.R:
--------------------------------------------------------------------------------
1 | #' @title Convert to DuckDB Backend
2 | #'
3 | #' @description
4 | #' Converts to a [DataBackendDuckDB] using the \CRANpkg{duckdb} database, depending on the input type:
5 | #'
6 | #' * `data.frame`: Creates a new [DataBackendDataTable] first using [as_data_backend()], then proceeds
7 | #' with the conversion from [DataBackendDataTable] to [DataBackendDuckDB].
8 | #' * [mlr3::DataBackend]: Creates a new DuckDB data base in the specified path.
9 | #' The filename is determined by the hash of the [DataBackend].
10 | #' If the file already exists, a connection to the existing database is established and the existing
11 | #' files are reused.
12 | #'
13 | #' The created backend automatically reconnects to the database if the connection was lost, e.g. because
14 | #' the object was serialized to the filesystem and restored in a different R session.
15 | #' The only requirement is that the path does not change and that the path is accessible
16 | #' on all workers.
17 | #'
18 | #' @param data (`data.frame()` | [mlr3::DataBackend])\cr
19 | #' See description.
20 | #' @param ... (`any`)\cr
21 | #' Additional arguments, passed to [DataBackendDuckDB].
22 | #' @template param_path
23 | #'
24 | #' @return [DataBackendDuckDB] or [Task].
25 | #' @export
26 | as_duckdb_backend = function(data, path = getOption("mlr3db.duckdb_dir", ":temp:"), ...) {
27 |   UseMethod("as_duckdb_backend")  # dispatches on class(data): data.frame, character (parquet paths), DataBackend
28 | }
29 |
30 | #' @export
31 | as_duckdb_backend.data.frame = function(data, path = getOption("mlr3db.duckdb_dir", ":temp:"), primary_key = NULL, ...) { # nolint
32 | backend = as_data_backend(data, primary_key = primary_key)
33 | as_duckdb_backend.DataBackend(backend, path = path, ...)
34 | }
35 |
36 | #' @export
37 | as_duckdb_backend.character = function(data, path = getOption("mlr3db.duckdb_dir", ":temp:"), primary_key = NULL, ...) {
38 |   assert_file_exists(data, access = "r", extension = "parquet")  # `data` is one or more readable parquet paths
39 |   con = DBI::dbConnect(duckdb::duckdb())  # in-memory database; the view merely references the parquet files
40 | 
41 |   query = "CREATE OR REPLACE VIEW 'mlr3db_view' AS SELECT *"
42 |   if (is.null(primary_key)) {
43 |     primary_key = "mlr3_row_id"
44 |     query = paste0(query, ", row_number() OVER () AS mlr3_row_id")  # synthesize a row id column
45 |   } else {
46 |     assert_string(primary_key)
47 |   }
48 | 
49 |   query = sprintf("%s FROM parquet_scan(['%s'])", query, paste0(data, collapse = "','"))  # NOTE(review): paths are interpolated into SQL; a path containing a single quote breaks the statement -- consider escaping
50 |   DBI::dbExecute(con, query)
51 | 
52 |   DataBackendDuckDB$new(con, table = "mlr3db_view", primary_key = primary_key)  # backend operates on the view
53 | }
54 |
55 | #' @export
56 | as_duckdb_backend.DataBackend = function(data, path = getOption("mlr3db.duckdb_dir", ":temp:"), ...) { # nolint
57 |   # Materializes the backend into a duckdb file named after its hash; if the
58 |   # file already exists it is reused as-is.
59 |   path = get_db_path(path, hash = data$hash, "duckdb")
60 |   primary_key = data$primary_key
61 | 
62 |   con = NULL
63 |   on.exit({
64 |     if (!is.null(con)) DBI::dbDisconnect(con, shutdown = TRUE)  # close connection on error paths
65 |   }, add = TRUE)
66 | 
67 |   if (!file.exists(path)) {
68 |     on.exit({
69 |       # drop partially written database files on error; the closing paren was
70 |       # previously misplaced so that `recursive = TRUE` was pasted into the
71 |       # filenames (yielding "<path>TRUE" etc.) and nothing was ever removed
72 |       if (file.exists(path)) unlink(paste0(path, c("", ".wal", ".tmp")), recursive = TRUE)
73 |     }, add = TRUE)
74 | 
75 |     con = DBI::dbConnect(duckdb::duckdb(), dbdir = path, read_only = FALSE)
76 |     DBI::dbWriteTable(con, "data", data$head(Inf), row.names = FALSE)  # materialize the full backend
77 |     DBI::dbExecute(con, sprintf('CREATE UNIQUE INDEX primary_key ON "%s" ("%s")', "data", primary_key))
78 |     DBI::dbDisconnect(con, shutdown = TRUE)
79 |     con = NULL  # already closed; prevents a double disconnect in the exit handler
80 |   }
81 | 
82 |   con = DBI::dbConnect(duckdb::duckdb(), dbdir = path, read_only = TRUE)
83 |   backend = DataBackendDuckDB$new(con, table = "data", primary_key = primary_key, ...)
84 |   backend$connector = duckdb_reconnector(path)  # auto-reconnect after serialization
85 | 
86 |   on.exit()  # success: cancel all cleanup handlers
87 |   return(backend)
88 | }
83 |
84 | # Returns a closure that re-opens the duckdb database at `path` read-only.
85 | duckdb_reconnector = function(path) {
86 |   force(path)  # capture by value before the closure escapes
87 |   function() DBI::dbConnect(duckdb::duckdb(), path, read_only = TRUE)
88 | }
90 |
--------------------------------------------------------------------------------
/R/as_polars_backend.R:
--------------------------------------------------------------------------------
1 | #' @title Convert to Polars Backend
2 | #'
3 | #' @description
4 | #' Converts to a [DataBackendPolars] using the \CRANpkg{polars} database, depending on the input type:
5 | #'
6 | #' * `data.frame`: Creates a new [DataBackendDataTable] first using [as_data_backend()], then proceeds
7 | #' with the conversion from [DataBackendDataTable] to [DataBackendPolars].
8 | #' * [mlr3::DataBackend]: Creates a new [DataBackendPolars].
9 | #'
10 | #' There is no automatic connection to the origin file set.
11 | #' If the data is obtained using scanning and the data is streamed, a `connector` can be set manually but is not required.
12 | #'
13 | #' @param data (`data.frame()` | [mlr3::DataBackend])\cr
14 | #' See description.
15 | #' @param streaming (`logical(1)`)\cr
16 | #' Whether the data should be only scanned (recommended for large data sets) and streamed with
17 | #' every [DataBackendPolars] operation or loaded into memory completely.
18 | #'
19 | #' @param ... (`any`)\cr
20 | #' Additional arguments, passed to [DataBackendPolars].
21 | #'
22 | #' @return [DataBackendPolars] or [Task].
23 | #' @export
24 | as_polars_backend = function(data, streaming = FALSE, ...) {
25 |   UseMethod("as_polars_backend")  # dispatches on class(data): data.frame or DataBackend
26 | }
27 |
28 |
29 | #' @export
30 | as_polars_backend.data.frame = function(data, streaming = FALSE, primary_key = NULL, ...) {
31 | backend = as_data_backend(data, primary_key = primary_key, streaming = streaming)
32 | as_polars_backend.DataBackend(backend, ...)
33 | }
34 |
35 |
36 | #' @export
37 | as_polars_backend.DataBackend = function(data, streaming = FALSE, ...) {
38 |   path = get_db_path(tempfile(), data$hash, "polars")  # scratch location below tempdir()
39 | 
40 |   on.exit({
41 |     if (file.exists(path)) file.remove(path)  # NOTE(review): the parquet is written to sprintf("%s.parquet", path), not `path`, so this check never fires; removing the parquet here would also invalidate the lazy scan -- confirm intended temp-file lifetime
42 |   })
43 | 
44 |   primary_key = data$primary_key
45 | 
46 |   if(streaming) {
47 |     polars::as_polars_df(data$head(Inf))$write_parquet(sprintf("%s.parquet", path))  # materialize once, then re-scan lazily
48 |     data = polars::pl$scan_parquet(sprintf("%s.parquet", path))
49 |   } else {
50 |     data = polars::as_polars_lf(data$head(Inf))  # fully in-memory lazy frame
51 |   }
52 | 
53 |   DataBackendPolars$new(data = data, primary_key = primary_key, ...)
54 | }
55 |
--------------------------------------------------------------------------------
/R/as_sqlite_backend.R:
--------------------------------------------------------------------------------
1 | #' @title Convert to SQLite Backend
2 | #'
3 | #' @description
4 | #' Converts to a [DataBackendDplyr] using a \CRANpkg{RSQLite} database, depending on the input type:
5 | #'
6 | #' * `data.frame`: Creates a new [DataBackendDataTable] first using [as_data_backend()], then proceeds
7 | #' with the conversion from [DataBackendDataTable] to [DataBackendDplyr].
8 | #' * [mlr3::DataBackend]: Creates a new SQLite data base in the specified path.
9 | #' The filename is determined by the hash of the [DataBackend].
10 | #' If the file already exists, a connection to the existing database is established and the existing
11 | #' files are reused.
12 | #'
13 | #' The created backend automatically reconnects to the database if the connection was lost, e.g. because
14 | #' the object was serialized to the filesystem and restored in a different R session.
15 | #' The only requirement is that the path does not change and that the path is accessible
16 | #' on all workers.
17 | #'
18 | #' @param data (`data.frame()` | [mlr3::DataBackend]\cr
19 | #' See description.
20 | #' @param ... (`any`)\cr
21 | #' Additional arguments, passed to [DataBackendDplyr].
22 | #' @template param_path
23 | #'
24 | #' @return [DataBackendDplyr] or [Task].
25 | #' @export
26 | as_sqlite_backend = function(data, path = getOption("mlr3db.sqlite_dir", ":temp:"), ...) {
27 |   UseMethod("as_sqlite_backend")  # dispatches on class(data): data.frame or DataBackend
28 | }
29 |
30 | #' @inheritParams as_data_backend
31 | #' @export
32 | as_sqlite_backend.data.frame = function(data, path = getOption("mlr3db.sqlite_dir", ":temp:"), primary_key = NULL, keep_rownames = FALSE, ...) { # nolint
33 |   # build an in-memory backend first, then materialize it as an SQLite file
34 |   b = as_data_backend(data, primary_key = primary_key, keep_rownames = keep_rownames)
35 |   as_sqlite_backend.DataBackend(b, path = path, ...)
36 | }
36 |
37 | #' @export
38 | as_sqlite_backend.DataBackend = function(data, path = getOption("mlr3db.sqlite_dir", ":temp:"), ...) { # nolint
39 |   path = get_db_path(path, data$hash, "sqlite")  # db file is named after the backend's hash; existing files are reused
40 |   primary_key = data$primary_key
41 | 
42 |   if (!file.exists(path)) {
43 |     on.exit({
44 |       if (file.exists(path)) file.remove(path)  # drop a partially written db on error
45 |     })
46 | 
47 |     con = DBI::dbConnect(RSQLite::SQLite(), dbname = path, flags = RSQLite::SQLITE_RWC)  # create read-write
48 |     field_types = setNames("INTEGER NOT NULL PRIMARY KEY", primary_key)  # enforce a unique integer key column
49 |     DBI::dbWriteTable(con, "data", data$head(Inf), row.names = FALSE, field.types = field_types)
50 |     DBI::dbDisconnect(con)
51 |   }
52 | 
53 |   con = DBI::dbConnect(RSQLite::SQLite(), path, flags = RSQLite::SQLITE_RO)  # re-open read-only
54 |   backend = DataBackendDplyr$new(dplyr::tbl(con, "data"), primary_key = primary_key, ...)
55 |   backend$connector = sqlite_reconnector(path)  # auto-reconnect after serialization
56 | 
57 |   on.exit()  # success: cancel the cleanup handler
58 |   return(backend)
59 | }
60 |
61 | # Returns a closure that re-opens the SQLite database at `path` read-only.
62 | sqlite_reconnector = function(path) {
63 |   force(path)  # capture by value before the closure escapes
64 |   function() DBI::dbConnect(RSQLite::SQLite(), path, flags = RSQLite::SQLITE_RO)
65 | }
67 |
--------------------------------------------------------------------------------
/R/helper.R:
--------------------------------------------------------------------------------
1 | # Re-encodes (by reference) those columns of `tab` that have a recorded level
2 | # set in `levels` as factors with exactly those levels; returns the table.
3 | recode = function(tab, levels) {
4 |   for (col in intersect(names(tab), names(levels))) {
5 |     set(tab, i = NULL, j = col, value = factor(tab[[col]], levels = levels[[col]]))
6 |   }
7 | 
8 |   tab[]
9 | }
10 |
11 | # Builds the full path "<parent>/<sanitized hash>.<extension>" for a database
12 | # file, creating the parent directory if necessary. The magic values ":temp:"
13 | # and ":user:" map to tempdir() and the package's user cache directory.
14 | get_db_path = function(path, hash, extension) {
15 |   assert_string(path)
16 |   parent = switch(path,
17 |     ":temp:" = tempdir(),
18 |     ":user:" = R_user_dir("mlr3db", "cache"),
19 |     path
20 |   )
21 |   if (!dir.exists(parent)) {
22 |     dir.create(parent, recursive = TRUE)
23 |   }
24 | 
25 |   filename = sprintf("%s.%s", gsub("[^[:alnum:]._-]", "_", hash), extension)
26 |   file.path(parent, filename)
27 | }
27 |
--------------------------------------------------------------------------------
/R/zzz.R:
--------------------------------------------------------------------------------
1 | #' @import data.table
2 | #' @import checkmate
3 | #' @importFrom stats setNames
4 | #' @importFrom utils head
5 | #' @importFrom R6 R6Class
6 | #' @importFrom mlr3misc map_lgl calculate_hash
7 | #' @section Options:
8 | #' * `mlr3db.sqlite_dir`: Default directory to store SQLite databases constructed
9 | #'   with [as_sqlite_backend()].
10 | #' * `mlr3db.duckdb_dir`: Default directory to store DuckDB databases constructed
11 | #'   with [as_duckdb_backend()].
12 | "_PACKAGE"
13 |
14 | .onLoad = function(libname, pkgname) { # nolint
15 |   # nocov start
16 |   backports::import(pkgname)  # backfill base functions missing in older R versions
17 |   backports::import(pkgname, "R_user_dir", force = TRUE)  # R_user_dir is used by get_db_path() for ":user:" paths
18 | } # nocov end
19 |
20 | mlr3misc::leanify_package()
21 | utils::globalVariables(".", "mlr3db", add = TRUE)
22 |
--------------------------------------------------------------------------------
/README.Rmd:
--------------------------------------------------------------------------------
1 | ---
2 | output: github_document
3 | ---
4 |
5 | ```{r, include = FALSE}
6 | knitr::opts_chunk$set(
7 | collapse = TRUE,
8 | comment = "#>",
9 | fig.path = "man/figures/README-",
10 | out.width = "100%"
11 | )
12 | lgr::get_logger("mlr3")$set_threshold("warn")
13 | ```
14 |
15 | # mlr3db
16 |
17 |
18 | [](https://github.com/mlr-org/mlr3db/actions/workflows/r-cmd-check.yml)
19 | [](https://cran.r-project.org/package=mlr3db)
20 | [](https://stackoverflow.com/questions/tagged/mlr3)
21 | [](https://lmmisld-lmu-stats-slds.srv.mwn.de/mlr_invite/)
22 |
23 |
24 | Package website: [release](https://mlr3db.mlr-org.com/) | [dev](https://mlr3db.mlr-org.com/dev/)
25 |
26 | Extends the [mlr3](https://mlr3.mlr-org.com/) package with a DataBackend to transparently work with databases.
27 | Two additional backends are currently implemented:
28 |
29 | * `DataBackendDplyr`: Relies internally on the abstraction of [dplyr](https://dplyr.tidyverse.org/) and [dbplyr](https://dbplyr.tidyverse.org/).
30 | This allows working on a broad range of DBMS, such as SQLite, MySQL, MariaDB, or PostgreSQL.
31 | * `DataBackendDuckDB`: Connector to [duckdb](https://cran.r-project.org/package=duckdb).
32 | This includes support for Parquet files (see example below).
33 |
34 | To construct the backends, you have to establish a connection to the DBMS yourself with the [DBI](https://cran.r-project.org/package=DBI) package.
35 | For the serverless SQLite and DuckDB, we provide the converters `as_sqlite_backend()` and `as_duckdb_backend()`.
36 |
37 |
38 | ## Installation
39 |
40 | You can install the released version of mlr3db from [CRAN](https://CRAN.R-project.org) with:
41 |
42 | ```{r, eval = FALSE}
43 | install.packages("mlr3db")
44 | ```
45 |
46 | And the development version from [GitHub](https://github.com/) with:
47 |
48 | ```{r, eval = FALSE}
49 | # install.packages("devtools")
50 | devtools::install_github("mlr-org/mlr3db")
51 | ```
52 |
53 | ## Example
54 |
55 | ### DataBackendDplyr
56 |
57 | ```{r}
58 | library("mlr3db")
59 |
60 | # Create a classification task:
61 | task = tsk("spam")
62 |
63 | # Convert the task backend from an in-memory backend (DataBackendDataTable)
64 | # to an out-of-memory SQLite backend via DataBackendDplyr.
65 | # A temporary directory is used here to store the database files.
66 | task$backend = as_sqlite_backend(task$backend, path = tempfile())
67 |
68 | # Resample a classification tree using a 3-fold CV.
69 | # The requested data will be queried and fetched from the database in the background.
70 | resample(task, lrn("classif.rpart"), rsmp("cv", folds = 3))
71 | ```
72 |
73 | ### DataBackendDuckDB
74 |
75 | ```{r}
76 | library("mlr3db")
77 |
78 | # Get an example parquet file from the package install directory:
79 | # spam dataset (tsk("spam")) stored as parquet file
80 | file = system.file(file.path("extdata", "spam.parquet"), package = "mlr3db")
81 |
82 | # Create a backend on the file
83 | backend = as_duckdb_backend(file)
84 |
85 | # Construct classification task on the constructed backend
86 | task = as_task_classif(backend, target = "type")
87 |
88 | # Resample a classification tree using a 3-fold CV.
89 | # The requested data will be queried and fetched from the database in the background.
90 | resample(task, lrn("classif.rpart"), rsmp("cv", folds = 3))
91 | ```
92 |
--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
1 |
2 | # mlr3db
3 |
4 |
5 |
6 | [](https://github.com/mlr-org/mlr3db/actions/workflows/r-cmd-check.yml)
7 | [](https://cran.r-project.org/package=mlr3db)
9 | [](https://stackoverflow.com/questions/tagged/mlr3)
10 | [](https://lmmisld-lmu-stats-slds.srv.mwn.de/mlr_invite/)
11 |
12 |
13 | Package website: [release](https://mlr3db.mlr-org.com/) \|
14 | [dev](https://mlr3db.mlr-org.com/dev/)
15 |
16 | Extends the [mlr3](https://mlr3.mlr-org.com/) package with a DataBackend
17 | to transparently work with databases. Two additional backends are
18 | currently implemented:
19 |
20 | - `DataBackendDplyr`: Relies internally on the abstraction of
21 | [dplyr](https://dplyr.tidyverse.org/) and
22 | [dbplyr](https://dbplyr.tidyverse.org/). This allows working on a
23 | broad range of DBMS, such as SQLite, MySQL, MariaDB, or PostgreSQL.
24 | - `DataBackendDuckDB`: Connector to
25 | [duckdb](https://cran.r-project.org/package=duckdb). This includes
26 | support for Parquet files (see example below).
27 |
28 | To construct the backends, you have to establish a connection to the
29 | DBMS yourself with the [DBI](https://cran.r-project.org/package=DBI)
30 | package. For the serverless SQLite and DuckDB, we provide the converters
31 | `as_sqlite_backend()` and `as_duckdb_backend()`.
32 |
33 | ## Installation
34 |
35 | You can install the released version of mlr3db from
36 | [CRAN](https://CRAN.R-project.org) with:
37 |
38 | ``` r
39 | install.packages("mlr3db")
40 | ```
41 |
42 | And the development version from [GitHub](https://github.com/) with:
43 |
44 | ``` r
45 | # install.packages("devtools")
46 | devtools::install_github("mlr-org/mlr3db")
47 | ```
48 |
49 | ## Example
50 |
51 | ### DataBackendDplyr
52 |
53 | ``` r
54 | library("mlr3db")
55 | #> Loading required package: mlr3
56 |
57 | # Create a classification task:
58 | task = tsk("spam")
59 |
60 | # Convert the task backend from an in-memory backend (DataBackendDataTable)
61 | # to an out-of-memory SQLite backend via DataBackendDplyr.
62 | # A temporary directory is used here to store the database files.
63 | task$backend = as_sqlite_backend(task$backend, path = tempfile())
64 |
65 | # Resample a classification tree using a 3-fold CV.
66 | # The requested data will be queried and fetched from the database in the background.
67 | resample(task, lrn("classif.rpart"), rsmp("cv", folds = 3))
68 | #> of 3 iterations
69 | #> * Task: spam
70 | #> * Learner: classif.rpart
71 | #> * Warnings: 0 in 0 iterations
72 | #> * Errors: 0 in 0 iterations
73 | ```
74 |
75 | ### DataBackendDuckDB
76 |
77 | ``` r
78 | library("mlr3db")
79 |
80 | # Get an example parquet file from the package install directory:
81 | # spam dataset (tsk("spam")) stored as parquet file
82 | file = system.file(file.path("extdata", "spam.parquet"), package = "mlr3db")
83 |
84 | # Create a backend on the file
85 | backend = as_duckdb_backend(file)
86 |
87 | # Construct classification task on the constructed backend
88 | task = as_task_classif(backend, target = "type")
89 |
90 | # Resample a classification tree using a 3-fold CV.
91 | # The requested data will be queried and fetched from the database in the background.
92 | resample(task, lrn("classif.rpart"), rsmp("cv", folds = 3))
93 | #> of 3 iterations
94 | #> * Task: backend
95 | #> * Learner: classif.rpart
96 | #> * Warnings: 0 in 0 iterations
97 | #> * Errors: 0 in 0 iterations
98 | ```
99 |
--------------------------------------------------------------------------------
/inst/extdata/spam.parquet:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/mlr-org/mlr3db/b0b90a9968d5f86fc07629367c3a7ed1f8c00e5f/inst/extdata/spam.parquet
--------------------------------------------------------------------------------
/inst/extdata/userdata1.parquet:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/mlr-org/mlr3db/b0b90a9968d5f86fc07629367c3a7ed1f8c00e5f/inst/extdata/userdata1.parquet
--------------------------------------------------------------------------------
/inst/extdata/userdata2.parquet:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/mlr-org/mlr3db/b0b90a9968d5f86fc07629367c3a7ed1f8c00e5f/inst/extdata/userdata2.parquet
--------------------------------------------------------------------------------
/inst/extdata/userdata3.parquet:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/mlr-org/mlr3db/b0b90a9968d5f86fc07629367c3a7ed1f8c00e5f/inst/extdata/userdata3.parquet
--------------------------------------------------------------------------------
/inst/extdata/userdata4.parquet:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/mlr-org/mlr3db/b0b90a9968d5f86fc07629367c3a7ed1f8c00e5f/inst/extdata/userdata4.parquet
--------------------------------------------------------------------------------
/inst/extdata/userdata5.parquet:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/mlr-org/mlr3db/b0b90a9968d5f86fc07629367c3a7ed1f8c00e5f/inst/extdata/userdata5.parquet
--------------------------------------------------------------------------------
/man-roxygen/field_connector.R:
--------------------------------------------------------------------------------
1 | #' @field connector (`function()`)\cr
2 | #' Function which is called to re-connect in case the connection became invalid.
3 |
--------------------------------------------------------------------------------
/man-roxygen/field_levels.R:
--------------------------------------------------------------------------------
1 | #' @field levels (named `list()`)\cr
2 | #' List (named with column names) of factor levels as `character()`.
3 | #' Used to auto-convert character columns to factor variables.
4 |
--------------------------------------------------------------------------------
/man-roxygen/param_connector.R:
--------------------------------------------------------------------------------
1 | #' @param connector (`function()`)\cr
2 | #' If not `NULL`, a function which re-connects to the database in case the connection has become invalid.
3 | #' Database connections can become invalid due to timeouts or if the backend is serialized
4 | #' to the file system and then de-serialized again.
5 | #' This round trip is often performed for parallelization, e.g. to send the objects to remote workers.
6 | #' [DBI::dbIsValid()] is called to validate the connection.
7 | #' The function must return just the connection, not a [dplyr::tbl()] object!
8 | #' Note that this function is serialized together with the backend, including
9 | #' possible sensitive information such as login credentials.
10 | #' These can be retrieved from the stored [mlr3::DataBackend]/[mlr3::Task].
11 | #' To protect your credentials, it is recommended to use the \CRANpkg{secret} package.
12 |
--------------------------------------------------------------------------------
/man-roxygen/param_path.R:
--------------------------------------------------------------------------------
1 | #' @param path (`character(1)`)\cr
2 | #' Path for the DuckDB databases.
3 | #' Either a valid path to a directory which will be created if it does not exist, or one of the special strings:
4 | #'
5 | #' * `":temp:"` (default): Temporary directory of the R session is used, see [tempdir()].
6 | #' Note that this directory will be removed during the shutdown of the R session.
7 | #' Also note that this usually does not work for parallelization on remote workers.
8 | #'   Set to a custom path or use the special string `":user:"` instead.
9 | #' * `":user:"`: User cache directory as returned by [R_user_dir()] is used.
10 | #'
11 | #'
12 | #' The default for this argument can be configured via option `"mlr3db.sqlite_dir"` or `"mlr3db.duckdb_dir"`,
13 | #' respectively. The database files will use the hash of the [DataBackend] as filename with
14 | #' file extension `".duckdb"` or `".sqlite"`.
15 | #' If the database already exists on the file system, the converters will just establish a new read-only
16 | #' connection.
17 |
--------------------------------------------------------------------------------
/man-roxygen/param_primary_key.R:
--------------------------------------------------------------------------------
1 | #' @param primary_key (`character(1)`)\cr
2 | #' Name of the primary key column.
3 |
--------------------------------------------------------------------------------
/man-roxygen/param_strings_as_factors.R:
--------------------------------------------------------------------------------
1 | #' @param strings_as_factors (`logical(1)` || `character()`)\cr
2 | #' Either a character vector of column names to convert to factors, or a single logical flag:
3 | #' if `FALSE`, no column will be converted; if `TRUE`, all string columns (except the primary key) are converted.
4 | #' For conversion, the backend is queried for distinct values of the respective columns
5 | #' on construction and their levels are stored in `$levels`.
6 |
--------------------------------------------------------------------------------
/man/DataBackendDplyr.Rd:
--------------------------------------------------------------------------------
1 | % Generated by roxygen2: do not edit by hand
2 | % Please edit documentation in R/DataBackendDplyr.R
3 | \name{DataBackendDplyr}
4 | \alias{DataBackendDplyr}
5 | \title{DataBackend for dplyr/dbplyr}
6 | \description{
7 | A \link[mlr3:DataBackend]{mlr3::DataBackend} using \code{\link[dplyr:tbl]{dplyr::tbl()}} from packages \CRANpkg{dplyr}/\CRANpkg{dbplyr}.
8 | This includes \code{\link[tibble:tibble]{tibbles}} and abstract database connections interfaced by \CRANpkg{dbplyr}.
9 | The latter allows \link[mlr3:Task]{mlr3::Task}s to interface an out-of-memory database.
10 | }
11 | \examples{
12 | if (mlr3misc::require_namespaces(c("tibble", "RSQLite", "dbplyr"), quietly = TRUE)) {
13 | # Backend using a in-memory tibble
14 | data = tibble::as_tibble(iris)
15 | data$Sepal.Length[1:30] = NA
16 | data$row_id = 1:150
17 | b = DataBackendDplyr$new(data, primary_key = "row_id")
18 |
19 | # Object supports all accessors of DataBackend
20 | print(b)
21 | b$nrow
22 | b$ncol
23 | b$colnames
24 | b$data(rows = 100:101, cols = "Species")
25 | b$distinct(b$rownames, "Species")
26 |
27 | # Classification task using this backend
28 | task = mlr3::TaskClassif$new(id = "iris_tibble", backend = b, target = "Species")
29 | print(task)
30 | head(task)
31 |
32 | # Create a temporary SQLite database
33 | con = DBI::dbConnect(RSQLite::SQLite(), ":memory:")
34 | dplyr::copy_to(con, data)
35 | tbl = dplyr::tbl(con, "data")
36 |
37 | # Define a backend on a subset of the database: do not use column "Sepal.Width"
38 | tbl = dplyr::select_at(tbl, setdiff(colnames(tbl), "Sepal.Width"))
39 | tbl = dplyr::filter(tbl, row_id \%in\% 1:120) # Use only first 120 rows
40 | b = DataBackendDplyr$new(tbl, primary_key = "row_id")
41 | print(b)
42 |
43 | # Query distinct values
44 | b$distinct(b$rownames, "Species")
45 |
46 | # Query number of missing values
47 | b$missings(b$rownames, b$colnames)
48 |
49 | # Note that SQLite does not support factors, column Species has been converted to character
50 | lapply(b$head(), class)
51 |
52 | # Cleanup
53 | rm(tbl)
54 | DBI::dbDisconnect(con)
55 | }
56 | }
57 | \section{Super class}{
58 | \code{\link[mlr3:DataBackend]{mlr3::DataBackend}} -> \code{DataBackendDplyr}
59 | }
60 | \section{Public fields}{
61 | \if{html}{\out{
}}
62 | \describe{
63 | \item{\code{levels}}{(named \code{list()})\cr
64 | List (named with column names) of factor levels as \code{character()}.
65 | Used to auto-convert character columns to factor variables.}
66 |
67 | \item{\code{connector}}{(\verb{function()})\cr
68 | Function which is called to re-connect in case the connection became invalid.}
69 | }
70 | \if{html}{\out{
}}
74 | \describe{
75 | \item{\code{rownames}}{(\code{integer()})\cr
76 | Returns vector of all distinct row identifiers, i.e. the contents of the primary key column.}
77 |
78 | \item{\code{colnames}}{(\code{character()})\cr
79 | Returns vector of all column names, including the primary key column.}
80 |
81 | \item{\code{nrow}}{(\code{integer(1)})\cr
82 | Number of rows (observations).}
83 |
84 | \item{\code{ncol}}{(\code{integer(1)})\cr
85 | Number of columns (variables), including the primary key column.}
86 |
87 | \item{\code{valid}}{(\code{logical(1)})\cr
88 | Returns \code{NA} if the data does not inherit from \code{"tbl_sql"} (i.e., it is not a real SQL data base).
89 | Returns the result of \code{\link[DBI:dbIsValid]{DBI::dbIsValid()}} otherwise.}
90 | }
91 | \if{html}{\out{
}}
128 | \describe{
129 | \item{\code{data}}{(\code{\link[dplyr:tbl]{dplyr::tbl()}})\cr
130 | The data object.
131 |
132 | Instead of calling the constructor yourself, you can call \code{\link[mlr3:as_data_backend]{mlr3::as_data_backend()}}
133 | on a \code{\link[dplyr:tbl]{dplyr::tbl()}}.
134 | Note that only objects of class \code{"tbl_lazy"} will be converted to a \link{DataBackendDplyr}
135 | (this includes all connectors from \CRANpkg{dbplyr}).
136 | Local \code{"tbl"} objects such as \code{\link[tibble:tibble]{tibbles}} will converted to a
137 | \link[mlr3:DataBackendDataTable]{DataBackendDataTable}.}
138 |
139 | \item{\code{primary_key}}{(\code{character(1)})\cr
140 | Name of the primary key column.}
141 |
142 | \item{\code{strings_as_factors}}{(\code{logical(1)} || \code{character()})\cr
143 | Either a character vector of column names to convert to factors, or a single logical flag:
144 | if \code{FALSE}, no column will be converted, if \code{TRUE} all string columns (except the primary key).
145 | For conversion, the backend is queried for distinct values of the respective columns
146 | on construction and their levels are stored in \verb{$levels}.}
147 |
148 | \item{\code{connector}}{(\verb{function()})\cr
149 | If not \code{NULL}, a function which re-connects to the database in case the connection has become invalid.
150 | Database connections can become invalid due to timeouts or if the backend is serialized
151 | to the file system and then de-serialized again.
152 | This round trip is often performed for parallelization, e.g. to send the objects to remote workers.
153 | \code{\link[DBI:dbIsValid]{DBI::dbIsValid()}} is called to validate the connection.
154 | The function must return just the connection, not a \code{\link[dplyr:tbl]{dplyr::tbl()}} object!
155 | Note that this function is serialized together with the backend, including possible sensitive information such as login credentials.
156 | These can be retrieved from the stored \link[mlr3:DataBackend]{mlr3::DataBackend}/\link[mlr3:Task]{mlr3::Task}.
157 | To protect your credentials, it is recommended to use the \CRANpkg{secret} package.}
158 | }
159 | \if{html}{\out{
}}
160 | }
161 | }
162 | \if{html}{\out{}}
163 | \if{html}{\out{}}
164 | \if{latex}{\out{\hypertarget{method-DataBackendDplyr-finalize}{}}}
165 | \subsection{Method \code{finalize()}}{
166 | Finalizer which disconnects from the database.
167 | This is called during garbage collection of the instance.
168 | \subsection{Usage}{
169 | \if{html}{\out{
}}
170 | }
171 |
172 | \subsection{Returns}{
173 | \code{logical(1)}, the return value of \code{\link[DBI:dbDisconnect]{DBI::dbDisconnect()}}.
174 | }
175 | }
176 | \if{html}{\out{}}
177 | \if{html}{\out{}}
178 | \if{latex}{\out{\hypertarget{method-DataBackendDplyr-data}{}}}
179 | \subsection{Method \code{data()}}{
180 | Returns a slice of the data.
181 | Calls \code{\link[dplyr:filter]{dplyr::filter()}} and \code{\link[dplyr:select]{dplyr::select()}} on the table and converts it to a \code{\link[data.table:data.table]{data.table::data.table()}}.
182 |
183 | The rows must be addressed as vector of primary key values, columns must be referred to via column names.
184 | Queries for rows with no matching row id and queries for columns with no matching
185 | column name are silently ignored.
186 | Rows are guaranteed to be returned in the same order as \code{rows}, columns may be returned in an arbitrary order.
187 | Duplicated row ids result in duplicated rows, duplicated column names lead to an exception.
188 | \subsection{Usage}{
189 | \if{html}{\out{
}}
218 | \describe{
219 | \item{\code{n}}{(\code{integer(1)})\cr
220 | Number of rows.}
221 | }
222 | \if{html}{\out{
}}
223 | }
224 | \subsection{Returns}{
225 | \code{\link[data.table:data.table]{data.table::data.table()}} of the first \code{n} rows.
226 | }
227 | }
228 | \if{html}{\out{}}
229 | \if{html}{\out{}}
230 | \if{latex}{\out{\hypertarget{method-DataBackendDplyr-distinct}{}}}
231 | \subsection{Method \code{distinct()}}{
232 | Returns a named list of vectors of distinct values for each column
233 | specified. If \code{na_rm} is \code{TRUE}, missing values are removed from the
234 | returned vectors of distinct values. Non-existing rows and columns are
235 | silently ignored.
236 | \subsection{Usage}{
237 | \if{html}{\out{
}}
278 | }
279 | \subsection{Returns}{
280 | Total of missing values per column (named \code{numeric()}).
281 | }
282 | }
283 | }
284 |
--------------------------------------------------------------------------------
/man/DataBackendDuckDB.Rd:
--------------------------------------------------------------------------------
1 | % Generated by roxygen2: do not edit by hand
2 | % Please edit documentation in R/DataBackendDuckDB.R
3 | \name{DataBackendDuckDB}
4 | \alias{DataBackendDuckDB}
5 | \title{DataBackend for DuckDB}
6 | \description{
7 | A \link[mlr3:DataBackend]{mlr3::DataBackend} for \CRANpkg{duckdb}.
8 | Can be easily constructed with \code{\link[=as_duckdb_backend]{as_duckdb_backend()}}.
9 | }
10 | \seealso{
11 | \url{https://duckdb.org/}
12 | }
13 | \section{Super class}{
14 | \code{\link[mlr3:DataBackend]{mlr3::DataBackend}} -> \code{DataBackendDuckDB}
15 | }
16 | \section{Public fields}{
17 | \if{html}{\out{
}}
18 | \describe{
19 | \item{\code{levels}}{(named \code{list()})\cr
20 | List (named with column names) of factor levels as \code{character()}.
21 | Used to auto-convert character columns to factor variables.}
22 |
23 | \item{\code{connector}}{(\verb{function()})\cr
24 | Function which is called to re-connect in case the connection became invalid.}
25 |
26 | \item{\code{table}}{(\code{character(1)})\cr
27 | Data base table or view to operate on.}
28 | }
29 | \if{html}{\out{
}}
33 | \describe{
34 | \item{\code{table_info}}{(\code{data.frame()})\cr
35 | Data frame as returned by pragma \code{table_info()}.}
36 |
37 | \item{\code{rownames}}{(\code{integer()})\cr
38 | Returns vector of all distinct row identifiers, i.e. the contents of the primary key column.}
39 |
40 | \item{\code{colnames}}{(\code{character()})\cr
41 | Returns vector of all column names, including the primary key column.}
42 |
43 | \item{\code{nrow}}{(\code{integer(1)})\cr
44 | Number of rows (observations).}
45 |
46 | \item{\code{ncol}}{(\code{integer(1)})\cr
47 | Number of columns (variables), including the primary key column.}
48 |
49 | \item{\code{valid}}{(\code{logical(1)})\cr
50 | Returns \code{NA} if the data does not inherit from \code{"tbl_sql"} (i.e., it is not a real SQL data base).
51 | Returns the result of \code{\link[DBI:dbIsValid]{DBI::dbIsValid()}} otherwise.}
52 | }
53 | \if{html}{\out{
}}
91 | \describe{
92 | \item{\code{data}}{(connection)\cr
93 | A connection created with \code{\link[DBI:dbConnect]{DBI::dbConnect()}}.
94 | If constructed manually (and not via the helper function \code{\link[=as_duckdb_backend]{as_duckdb_backend()}},
95 | make sure that there exists an (unique) index for the key column.}
96 |
97 | \item{\code{table}}{(\code{character(1)})\cr
98 | Table or view to operate on.}
99 |
100 | \item{\code{primary_key}}{(\code{character(1)})\cr
101 | Name of the primary key column.}
102 |
103 | \item{\code{strings_as_factors}}{(\code{logical(1)} || \code{character()})\cr
104 | Either a character vector of column names to convert to factors, or a single logical flag:
105 | if \code{FALSE}, no column will be converted, if \code{TRUE} all string columns (except the primary key).
106 | For conversion, the backend is queried for distinct values of the respective columns
107 | on construction and their levels are stored in \verb{$levels}.}
108 |
109 | \item{\code{connector}}{(\verb{function()})\cr
110 | If not \code{NULL}, a function which re-connects to the database in case the connection has become invalid.
111 | Database connections can become invalid due to timeouts or if the backend is serialized
112 | to the file system and then de-serialized again.
113 | This round trip is often performed for parallelization, e.g. to send the objects to remote workers.
114 | \code{\link[DBI:dbIsValid]{DBI::dbIsValid()}} is called to validate the connection.
115 | The function must return just the connection, not a \code{\link[dplyr:tbl]{dplyr::tbl()}} object!
116 | Note that this function is serialized together with the backend, including possible sensitive information such as login credentials.
117 | These can be retrieved from the stored \link[mlr3:DataBackend]{mlr3::DataBackend}/\link[mlr3:Task]{mlr3::Task}.
118 | To protect your credentials, it is recommended to use the \CRANpkg{secret} package.}
119 | }
120 | \if{html}{\out{
}}
121 | }
122 | }
123 | \if{html}{\out{}}
124 | \if{html}{\out{}}
125 | \if{latex}{\out{\hypertarget{method-DataBackendDuckDB-finalize}{}}}
126 | \subsection{Method \code{finalize()}}{
127 | Finalizer which disconnects from the database.
128 | This is called during garbage collection of the instance.
129 | \subsection{Usage}{
130 | \if{html}{\out{
}}
131 | }
132 |
133 | \subsection{Returns}{
134 | \code{logical(1)}, the return value of \code{\link[DBI:dbDisconnect]{DBI::dbDisconnect()}}.
135 | }
136 | }
137 | \if{html}{\out{}}
138 | \if{html}{\out{}}
139 | \if{latex}{\out{\hypertarget{method-DataBackendDuckDB-data}{}}}
140 | \subsection{Method \code{data()}}{
141 | Returns a slice of the data.
142 |
143 | The rows must be addressed as vector of primary key values, columns must be referred to via column names.
144 | Queries for rows with no matching row id and queries for columns with no matching
145 | column name are silently ignored.
146 | Rows are guaranteed to be returned in the same order as \code{rows}, columns may be returned in an arbitrary order.
147 | Duplicated row ids result in duplicated rows, duplicated column names lead to an exception.
148 | \subsection{Usage}{
149 | \if{html}{\out{
}}
178 | \describe{
179 | \item{\code{n}}{(\code{integer(1)})\cr
180 | Number of rows.}
181 | }
182 | \if{html}{\out{
}}
183 | }
184 | \subsection{Returns}{
185 | \code{\link[data.table:data.table]{data.table::data.table()}} of the first \code{n} rows.
186 | }
187 | }
188 | \if{html}{\out{}}
189 | \if{html}{\out{}}
190 | \if{latex}{\out{\hypertarget{method-DataBackendDuckDB-distinct}{}}}
191 | \subsection{Method \code{distinct()}}{
192 | Returns a named list of vectors of distinct values for each column
193 | specified. If \code{na_rm} is \code{TRUE}, missing values are removed from the
194 | returned vectors of distinct values. Non-existing rows and columns are
195 | silently ignored.
196 | \subsection{Usage}{
197 | \if{html}{\out{
}}
238 | }
239 | \subsection{Returns}{
240 | Total of missing values per column (named \code{numeric()}).
241 | }
242 | }
243 | }
244 |
--------------------------------------------------------------------------------
/man/DataBackendPolars.Rd:
--------------------------------------------------------------------------------
1 | % Generated by roxygen2: do not edit by hand
2 | % Please edit documentation in R/DataBackendPolars.R
3 | \name{DataBackendPolars}
4 | \alias{DataBackendPolars}
5 | \title{DataBackend for Polars}
6 | \description{
7 | A \link[mlr3:DataBackend]{mlr3::DataBackend} using \code{RPolarsLazyFrame} from package \CRANpkg{polars}.
8 | Can be easily constructed with \code{\link[=as_polars_backend]{as_polars_backend()}}.
9 | \link[mlr3:Task]{mlr3::Task}s can interface out-of-memory files if the \code{polars::RPolarsLazyFrame} was imported using a \code{polars::scan_x} function.
10 | Streaming, a \CRANpkg{polars} alpha feature, is always enabled, but only used when applicable.
11 | A connector is not required but can be useful, e.g. for scanning larger-than-memory files.
12 | }
13 | \examples{
14 | if (mlr3misc::require_namespaces("polars", quietly = TRUE)) {
15 | # Backend using a in-memory data set
16 | data = iris
17 | data$Sepal.Length[1:30] = NA
18 | data$row_id = 1:150
19 | data = polars::as_polars_lf(data)
20 | b = DataBackendPolars$new(data, primary_key = "row_id")
21 |
22 | # Object supports all accessors of DataBackend
23 | print(b)
24 | b$nrow
25 | b$ncol
26 | b$colnames
27 | b$data(rows = 100:101, cols = "Species")
28 | b$distinct(b$rownames, "Species")
29 |
30 | # Classification task using this backend
31 | task = mlr3::TaskClassif$new(id = "iris_polars", backend = b, target = "Species")
32 | print(task)
33 | head(task)
34 |
35 | # Write a parquet file to scan
36 | data$collect()$write_parquet("iris.parquet")
37 | data = polars::pl$scan_parquet("iris.parquet")
38 |
39 | # Backend that re-reads the parquet file if the connection fails
40 | b = DataBackendPolars$new(data, "row_id",
41 | connector = function() polars::pl$scan_parquet("iris.parquet"))
42 | print(b)
43 |
44 | # Define a backend on a subset of the database: do not use column "Sepal.Width"
45 | data = data$select(
46 | polars::pl$col(setdiff(colnames(data), "Sepal.Width"))
47 | )$filter(
48 | polars::pl$col("row_id")$is_in(1:120) # Use only first 120 rows
49 | )
50 |
51 | # Backend with only scanned data
52 | b = DataBackendPolars$new(data, "row_id", strings_as_factors = TRUE)
53 | print(b)
54 |
55 | # Query distinct values
56 | b$distinct(b$rownames, "Species")
57 |
58 | # Query number of missing values
59 | b$missings(b$rownames, b$colnames)
60 |
61 | # Cleanup
62 | if (file.exists("iris.parquet")) {
63 | file.remove("iris.parquet")
64 | }
65 | }
66 | }
67 | \seealso{
68 | \url{https://pola-rs.github.io/r-polars/}
69 | }
70 | \section{Super class}{
71 | \code{\link[mlr3:DataBackend]{mlr3::DataBackend}} -> \code{DataBackendPolars}
72 | }
73 | \section{Public fields}{
74 | \if{html}{\out{
}}
75 | \describe{
76 | \item{\code{levels}}{(named \code{list()})\cr
77 | List (named with column names) of factor levels as \code{character()}.
78 | Used to auto-convert character columns to factor variables.}
79 |
80 | \item{\code{connector}}{(\verb{function()})\cr
81 | Function which is called to re-connect in case the connection became invalid.}
82 | }
83 | \if{html}{\out{
}}
87 | \describe{
88 | \item{\code{rownames}}{(\code{integer()})\cr
89 | Returns vector of all distinct row identifiers, i.e. the contents of the primary key column.}
90 |
91 | \item{\code{colnames}}{(\code{character()})\cr
92 | Returns vector of all column names, including the primary key column.}
93 |
94 | \item{\code{nrow}}{(\code{integer(1)})\cr
95 | Number of rows (observations).}
96 |
97 | \item{\code{ncol}}{(\code{integer(1)})\cr
98 | Number of columns (variables), including the primary key column.}
99 | }
100 | \if{html}{\out{
}}
136 | \describe{
137 | \item{\code{data}}{(\link[polars:RPolarsLazyFrame]{polars::RPolarsLazyFrame})\cr
138 | The data object.
139 |
140 | Instead of calling the constructor itself, please call \code{\link[mlr3:as_data_backend]{mlr3::as_data_backend()}} on
141 | a \link[polars:RPolarsLazyFrame]{polars::RPolarsLazyFrame} or \link[polars:RPolarsDataFrame]{polars::RPolarsDataFrame}.
142 | Note that only \link[polars:RPolarsLazyFrame]{polars::RPolarsLazyFrame}s will be converted to a \link{DataBackendPolars}.
143 | \link[polars:RPolarsDataFrame]{polars::RPolarsDataFrame} objects without lazy execution will be converted to a
144 | \link[mlr3:DataBackendDataTable]{DataBackendDataTable}.}
145 |
146 | \item{\code{primary_key}}{(\code{character(1)})\cr
147 | Name of the primary key column.
148 | Because \code{polars} does not natively support primary keys, uniqueness of the primary key column is expected but not enforced.}
149 |
150 | \item{\code{strings_as_factors}}{(\code{logical(1)} || \code{character()})\cr
151 | Either a character vector of column names to convert to factors, or a single logical flag:
152 | if \code{FALSE}, no columns are converted; if \code{TRUE}, all string columns (except the primary key) are.
153 | For conversion, the backend is queried for distinct values of the respective columns
154 | on construction and their levels are stored in \verb{$levels}.}
155 |
156 | \item{\code{connector}}{(\verb{function()})\cr
157 | Optional function which is called to re-connect to e.g. a source file in case the connection became invalid.}
158 | }
159 | \if{html}{\out{
}}
160 | }
161 | }
162 | \if{html}{\out{}}
163 | \if{html}{\out{}}
164 | \if{latex}{\out{\hypertarget{method-DataBackendPolars-data}{}}}
165 | \subsection{Method \code{data()}}{
166 | Returns a slice of the data.
167 |
168 | The rows must be addressed as vector of primary key values, columns must be referred to via column names.
169 | Queries for rows with no matching row id and queries for columns with no matching
170 | column name are silently ignored.
171 | \subsection{Usage}{
172 | \if{html}{\out{
}}
198 | \describe{
199 | \item{\code{n}}{(\code{integer(1)})\cr
200 | Number of rows.}
201 | }
202 | \if{html}{\out{
}}
203 | }
204 | \subsection{Returns}{
205 | \code{\link[data.table:data.table]{data.table::data.table()}} of the first \code{n} rows.
206 | }
207 | }
208 | \if{html}{\out{}}
209 | \if{html}{\out{}}
210 | \if{latex}{\out{\hypertarget{method-DataBackendPolars-distinct}{}}}
211 | \subsection{Method \code{distinct()}}{
212 | Returns a named list of vectors of distinct values for each column
213 | specified. If \code{na_rm} is \code{TRUE}, missing values are removed from the
214 | returned vectors of distinct values. Non-existing rows and columns are
215 | silently ignored.
216 | \subsection{Usage}{
217 | \if{html}{\out{
}}
258 | }
259 | \subsection{Returns}{
260 | Total of missing values per column (named \code{numeric()}).
261 | }
262 | }
263 | }
264 |
--------------------------------------------------------------------------------
/man/as_duckdb_backend.Rd:
--------------------------------------------------------------------------------
1 | % Generated by roxygen2: do not edit by hand
2 | % Please edit documentation in R/as_duckdb_backend.R
3 | \name{as_duckdb_backend}
4 | \alias{as_duckdb_backend}
5 | \title{Convert to DuckDB Backend}
6 | \usage{
7 | as_duckdb_backend(data, path = getOption("mlr3db.duckdb_dir", ":temp:"), ...)
8 | }
9 | \arguments{
10 | \item{data}{(\code{data.frame()} | \link[mlr3:DataBackend]{mlr3::DataBackend})\cr
11 | See description.}
12 |
13 | \item{path}{(\code{character(1)})\cr
14 | Path for the DuckDB databases.
15 | Either a valid path to a directory which will be created if it does not exist, or one of the special strings:
16 | \itemize{
17 | \item \code{":temp:"} (default): Temporary directory of the R session is used, see \code{\link[=tempdir]{tempdir()}}.
18 | Note that this directory will be removed during the shutdown of the R session.
19 | Also note that this usually does not work for parallelization on remote workers.
20 | Set to a custom path or use the special string \code{":user:"} instead.
21 | \item \code{":user:"}: User cache directory as returned by \code{\link[=R_user_dir]{R_user_dir()}} is used.
22 | }
23 |
24 | The default for this argument can be configured via option \code{"mlr3db.sqlite_dir"} or \code{"mlr3db.duckdb_dir"},
25 | respectively. The database files will use the hash of the \link{DataBackend} as filename with
26 | file extension \code{".duckdb"} or \code{".sqlite"}.
27 | If the database already exists on the file system, the converters will just establish a new read-only
28 | connection.}
29 |
30 | \item{...}{(\code{any})\cr
31 | Additional arguments, passed to \link{DataBackendDuckDB}.}
32 | }
33 | \value{
34 | \link{DataBackendDuckDB} or \link{Task}.
35 | }
36 | \description{
37 | Converts to a \link{DataBackendDuckDB} using the \CRANpkg{duckdb} database, depending on the input type:
38 | \itemize{
39 | \item \code{data.frame}: Creates a new \link{DataBackendDataTable} first using \code{\link[=as_data_backend]{as_data_backend()}}, then proceeds
40 | with the conversion from \link{DataBackendDataTable} to \link{DataBackendDuckDB}.
41 | \item \link[mlr3:DataBackend]{mlr3::DataBackend}: Creates a new DuckDB database in the specified path.
42 | The filename is determined by the hash of the \link{DataBackend}.
43 | If the file already exists, a connection to the existing database is established and the existing
44 | files are reused.
45 | }
46 |
47 | The created backend automatically reconnects to the database if the connection was lost, e.g. because
48 | the object was serialized to the filesystem and restored in a different R session.
49 | The only requirement is that the path does not change and that the path is accessible
50 | on all workers.
51 | }
52 |
--------------------------------------------------------------------------------
/man/as_polars_backend.Rd:
--------------------------------------------------------------------------------
1 | % Generated by roxygen2: do not edit by hand
2 | % Please edit documentation in R/as_polars_backend.R
3 | \name{as_polars_backend}
4 | \alias{as_polars_backend}
5 | \title{Convert to Polars Backend}
6 | \usage{
7 | as_polars_backend(data, streaming = FALSE, ...)
8 | }
9 | \arguments{
10 | \item{data}{(\code{data.frame()} | \link[mlr3:DataBackend]{mlr3::DataBackend})\cr
11 | See description.}
12 |
13 | \item{streaming}{(\code{logical(1)})\cr
14 | Whether the data should be only scanned (recommended for large data sets) and streamed with
15 | every \link{DataBackendPolars} operation or loaded into memory completely.}
16 |
17 | \item{...}{(\code{any})\cr
18 | Additional arguments, passed to \link{DataBackendPolars}.}
19 | }
20 | \value{
21 | \link{DataBackendPolars} or \link{Task}.
22 | }
23 | \description{
24 | Converts to a \link{DataBackendPolars} using the \CRANpkg{polars} package, depending on the input type:
25 | \itemize{
26 | \item \code{data.frame}: Creates a new \link{DataBackendDataTable} first using \code{\link[=as_data_backend]{as_data_backend()}}, then proceeds
27 | with the conversion from \link{DataBackendDataTable} to \link{DataBackendPolars}.
28 | \item \link[mlr3:DataBackend]{mlr3::DataBackend}: Creates a new \link{DataBackendPolars}.
29 | }
30 |
31 | There is no automatic connection to the origin file set.
32 | If the data is obtained using scanning and the data is streamed, a \code{connector} can be set manually but is not required.
33 | }
34 |
--------------------------------------------------------------------------------
/man/as_sqlite_backend.Rd:
--------------------------------------------------------------------------------
1 | % Generated by roxygen2: do not edit by hand
2 | % Please edit documentation in R/as_sqlite_backend.R
3 | \name{as_sqlite_backend}
4 | \alias{as_sqlite_backend}
5 | \title{Convert to SQLite Backend}
6 | \usage{
7 | as_sqlite_backend(data, path = getOption("mlr3db.sqlite_dir", ":temp:"), ...)
8 | }
9 | \arguments{
10 | \item{data}{(\code{data.frame()} | \link[mlr3:DataBackend]{mlr3::DataBackend})\cr
11 | See description.}
12 |
13 | \item{path}{(\code{character(1)})\cr
14 | Path for the SQLite databases.
15 | Either a valid path to a directory which will be created if it does not exist, or one of the special strings:
16 | \itemize{
17 | \item \code{":temp:"} (default): Temporary directory of the R session is used, see \code{\link[=tempdir]{tempdir()}}.
18 | Note that this directory will be removed during the shutdown of the R session.
19 | Also note that this usually does not work for parallelization on remote workers.
20 | Set to a custom path or use the special string \code{":user:"} instead.
21 | \item \code{":user:"}: User cache directory as returned by \code{\link[=R_user_dir]{R_user_dir()}} is used.
22 | }
23 |
24 | The default for this argument can be configured via option \code{"mlr3db.sqlite_dir"} or \code{"mlr3db.duckdb_dir"},
25 | respectively. The database files will use the hash of the \link{DataBackend} as filename with
26 | file extension \code{".duckdb"} or \code{".sqlite"}.
27 | If the database already exists on the file system, the converters will just establish a new read-only
28 | connection.}
29 |
30 | \item{...}{(\code{any})\cr
31 | Additional arguments, passed to \link{DataBackendDplyr}.}
32 | }
33 | \value{
34 | \link{DataBackendDplyr} or \link{Task}.
35 | }
36 | \description{
37 | Converts to a \link{DataBackendDplyr} using an \CRANpkg{RSQLite} database, depending on the input type:
38 | \itemize{
39 | \item \code{data.frame}: Creates a new \link{DataBackendDataTable} first using \code{\link[=as_data_backend]{as_data_backend()}}, then proceeds
40 | with the conversion from \link{DataBackendDataTable} to \link{DataBackendDplyr}.
41 | \item \link[mlr3:DataBackend]{mlr3::DataBackend}: Creates a new SQLite database in the specified path.
42 | The filename is determined by the hash of the \link{DataBackend}.
43 | If the file already exists, a connection to the existing database is established and the existing
44 | files are reused.
45 | }
46 |
47 | The created backend automatically reconnects to the database if the connection was lost, e.g. because
48 | the object was serialized to the filesystem and restored in a different R session.
49 | The only requirement is that the path does not change and that the path is accessible
50 | on all workers.
51 | }
52 |
--------------------------------------------------------------------------------
/man/figures/logo_navbar.png:
--------------------------------------------------------------------------------
1 |
2 |
3 |
4 |
5 |
6 |
7 |
8 |
9 |
10 |
11 |
12 |
13 |
14 |
15 |
16 |
17 |
18 |
19 |
20 |
21 |
22 |
23 |
24 |
25 |
26 |
27 |
28 |
29 |
30 |
31 | mlr3/logo_navbar.png at master · mlr-org/mlr3
32 |
33 |
34 |
35 |
36 |
37 |
38 |
39 |
40 |
41 |
42 |
43 |
44 |
45 |
46 |
47 |
48 |
49 |
50 |
51 |
52 |
53 |
54 |
55 |
56 |
57 |
58 |
59 |
60 |
61 |
62 |
63 |
64 |
65 |
66 |
67 |
68 |
69 |
70 |
71 |
72 |
73 |
74 |
75 |
76 |
77 |
78 |
79 |
80 |
81 |
82 |
83 |
84 |
85 |
86 |
87 |
88 |
89 |
90 |
91 |
92 |
93 |
94 |
95 |
96 |
97 |
98 |
99 |
100 |
101 |
102 |
103 |
104 |
105 |
106 |
107 |
108 |
109 |
110 |
111 |
112 |
113 |
929 |
930 | You signed in with another tab or window. Reload to refresh your session.
931 | You signed out in another tab or window. Reload to refresh your session.
932 |