├── .gitignore
├── .gitattributes
├── _pkgdown.yml
├── data
    ├── HR_data.rda
    └── titanic_data.rda
├── docs
    ├── MI2logo.jpg
    ├── reference
    │   ├── lollipop-1.png
    │   ├── lollipop-2.png
    │   ├── lollipop-3.png
    │   ├── lollipop-4.png
    │   ├── lollipop-5.png
    │   ├── waterfall-1.png
    │   ├── importance-1.png
    │   ├── importance-2.png
    │   ├── importance-3.png
    │   ├── importance-4.png
    │   ├── importance-5.png
    │   ├── importance-6.png
    │   ├── EIX_lollipop-1.png
    │   ├── EIX_waterfall-1.png
    │   ├── interactions-1.png
    │   ├── interactions-2.png
    │   ├── interactions-3.png
    │   ├── interactions-4.png
    │   ├── plot.lollipop-1.png
    │   ├── plot.lollipop-2.png
    │   ├── importanceTable-1.png
    │   ├── importanceTable-2.png
    │   ├── importanceTable-3.png
    │   ├── importanceTable-4.png
    │   ├── plot.importance-1.png
    │   ├── plot.importance-2.png
    │   ├── plot.importance-3.png
    │   ├── plot.importance-4.png
    │   ├── plot.importance-5.png
    │   ├── plot.importance-6.png
    │   ├── interactionsTable-1.png
    │   ├── interactionsTable-2.png
    │   ├── plot.interactions-1.png
    │   ├── plot.interactions-2.png
    │   ├── plot.interactions-3.png
    │   ├── plot.interactions-4.png
    │   ├── plot.importanceTable-1.png
    │   ├── plot.importanceTable-2.png
    │   ├── plot.importanceTable-3.png
    │   ├── plot.importanceTable-4.png
    │   ├── plot.interactionsTable-1.png
    │   ├── plot.interactionsTable-2.png
    │   ├── tableOfTrees.html
    │   ├── calculateGain.html
    │   ├── HR_data.html
    │   ├── index.html
    │   ├── titanic.html
    │   ├── titanic_data.html
    │   ├── countPairs.html
    │   ├── lollipop.html
    │   ├── EIX_lollipop.html
    │   ├── plot.lollipop.html
    │   └── waterfall.html
    ├── pkgdown.yml
    ├── articles
    │   ├── EIX_files
    │   │   └── figure-html
    │   │   │   ├── unnamed-chunk-6-1.png
    │   │   │   ├── unnamed-chunk-7-1.png
    │   │   │   ├── unnamed-chunk-8-1.png
    │   │   │   ├── unnamed-chunk-9-1.png
    │   │   │   ├── unnamed-chunk-10-1.png
    │   │   │   ├── unnamed-chunk-11-1.png
    │   │   │   └── unnamed-chunk-11-2.png
    │   ├── titanic_data_files
    │   │   └── figure-html
    │   │   │   ├── unnamed-chunk-4-1.png
    │   │   │   ├── unnamed-chunk-5-1.png
    │   │   │   ├── unnamed-chunk-6-1.png
    │   │   │   ├── unnamed-chunk-7-1.png
    │   │   │   └── unnamed-chunk-8-1.png
    │   ├── vignette_titanic_files
    │   │   └── figure-html
    │   │   │   ├── unnamed-chunk-4-1.png
    │   │   │   ├── unnamed-chunk-5-1.png
    │   │   │   ├── unnamed-chunk-6-1.png
    │   │   │   ├── unnamed-chunk-7-1.png
    │   │   │   └── unnamed-chunk-8-1.png
    │   └── index.html
    ├── pkgdown.js
    ├── link.svg
    ├── docsearch.js
    ├── jquery.sticky-kit.min.js
    ├── authors.html
    ├── pkgdown.css
    └── index.html
├── cheatsheets
    ├── EIX.pdf
    ├── EIX.png
    └── EIX.pptx
├── .Rbuildignore
├── README.md
├── .travis.yml
├── EIX.Rproj
├── man
    ├── tableOfTrees.Rd
    ├── calculateGain.Rd
    ├── EIX-package.Rd
    ├── HR_data.Rd
    ├── lollipop.Rd
    ├── plot.interactions.Rd
    ├── plot.lollipop.Rd
    ├── waterfall.Rd
    ├── interactions.Rd
    ├── importance.Rd
    ├── titanic_data.Rd
    └── plot.importance.Rd
├── R
    ├── package.R
    ├── HR_data.R
    ├── lollipop.R
    ├── plot_interactions.R
    ├── titanic_data.R
    ├── plot_lollipop.R
    ├── interactions.R
    ├── calculateGain.R
    ├── plot_importance.R
    └── importance.R
├── NAMESPACE
├── DESCRIPTION
└── vignettes
    ├── titanic_data.Rmd
    └── EIX.Rmd


/.gitignore:
--------------------------------------------------------------------------------
1 | .Rproj.user
2 | .Rhistory
3 | .RData
4 | inst/doc
5 | 


--------------------------------------------------------------------------------
/.gitattributes:
--------------------------------------------------------------------------------
1 | # Auto detect text files and perform LF normalization
2 | * text=auto
3 | 


--------------------------------------------------------------------------------
/_pkgdown.yml:
--------------------------------------------------------------------------------
1 | template:
2 |   package: MI2template
3 |   default_assets: false
4 | 
5 | 


--------------------------------------------------------------------------------
/data/HR_data.rda:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/data/HR_data.rda


--------------------------------------------------------------------------------
/docs/MI2logo.jpg:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/MI2logo.jpg


--------------------------------------------------------------------------------
/cheatsheets/EIX.pdf:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/cheatsheets/EIX.pdf


--------------------------------------------------------------------------------
/cheatsheets/EIX.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/cheatsheets/EIX.png


--------------------------------------------------------------------------------
/cheatsheets/EIX.pptx:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/cheatsheets/EIX.pptx


--------------------------------------------------------------------------------
/data/titanic_data.rda:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/data/titanic_data.rda


--------------------------------------------------------------------------------
/docs/reference/lollipop-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/lollipop-1.png


--------------------------------------------------------------------------------
/docs/reference/lollipop-2.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/lollipop-2.png


--------------------------------------------------------------------------------
/docs/reference/lollipop-3.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/lollipop-3.png


--------------------------------------------------------------------------------
/docs/reference/lollipop-4.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/lollipop-4.png


--------------------------------------------------------------------------------
/docs/reference/lollipop-5.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/lollipop-5.png


--------------------------------------------------------------------------------
/docs/reference/waterfall-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/waterfall-1.png


--------------------------------------------------------------------------------
/docs/reference/importance-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/importance-1.png


--------------------------------------------------------------------------------
/docs/reference/importance-2.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/importance-2.png


--------------------------------------------------------------------------------
/docs/reference/importance-3.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/importance-3.png


--------------------------------------------------------------------------------
/docs/reference/importance-4.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/importance-4.png


--------------------------------------------------------------------------------
/docs/reference/importance-5.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/importance-5.png


--------------------------------------------------------------------------------
/docs/reference/importance-6.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/importance-6.png


--------------------------------------------------------------------------------
/docs/reference/EIX_lollipop-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/EIX_lollipop-1.png


--------------------------------------------------------------------------------
/docs/reference/EIX_waterfall-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/EIX_waterfall-1.png


--------------------------------------------------------------------------------
/docs/reference/interactions-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/interactions-1.png


--------------------------------------------------------------------------------
/docs/reference/interactions-2.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/interactions-2.png


--------------------------------------------------------------------------------
/docs/reference/interactions-3.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/interactions-3.png


--------------------------------------------------------------------------------
/docs/reference/interactions-4.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/interactions-4.png


--------------------------------------------------------------------------------
/docs/reference/plot.lollipop-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/plot.lollipop-1.png


--------------------------------------------------------------------------------
/docs/reference/plot.lollipop-2.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/plot.lollipop-2.png


--------------------------------------------------------------------------------
/docs/reference/importanceTable-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/importanceTable-1.png


--------------------------------------------------------------------------------
/docs/reference/importanceTable-2.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/importanceTable-2.png


--------------------------------------------------------------------------------
/docs/reference/importanceTable-3.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/importanceTable-3.png


--------------------------------------------------------------------------------
/docs/reference/importanceTable-4.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/importanceTable-4.png


--------------------------------------------------------------------------------
/docs/reference/plot.importance-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/plot.importance-1.png


--------------------------------------------------------------------------------
/docs/reference/plot.importance-2.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/plot.importance-2.png


--------------------------------------------------------------------------------
/docs/reference/plot.importance-3.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/plot.importance-3.png


--------------------------------------------------------------------------------
/docs/reference/plot.importance-4.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/plot.importance-4.png


--------------------------------------------------------------------------------
/docs/reference/plot.importance-5.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/plot.importance-5.png


--------------------------------------------------------------------------------
/docs/reference/plot.importance-6.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/plot.importance-6.png


--------------------------------------------------------------------------------
/.Rbuildignore:
--------------------------------------------------------------------------------
1 | ^.*\.Rproj$
2 | ^\.Rproj\.user$
3 | ^cheatsheets$
4 | ^.*README.*$
5 | ^.travis.yml$
6 | ^_pkgdown\.yml$
7 | ^docs$
8 | 


--------------------------------------------------------------------------------
/docs/reference/interactionsTable-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/interactionsTable-1.png


--------------------------------------------------------------------------------
/docs/reference/interactionsTable-2.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/interactionsTable-2.png


--------------------------------------------------------------------------------
/docs/reference/plot.interactions-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/plot.interactions-1.png


--------------------------------------------------------------------------------
/docs/reference/plot.interactions-2.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/plot.interactions-2.png


--------------------------------------------------------------------------------
/docs/reference/plot.interactions-3.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/plot.interactions-3.png


--------------------------------------------------------------------------------
/docs/reference/plot.interactions-4.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/plot.interactions-4.png


--------------------------------------------------------------------------------
/docs/reference/plot.importanceTable-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/plot.importanceTable-1.png


--------------------------------------------------------------------------------
/docs/reference/plot.importanceTable-2.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/plot.importanceTable-2.png


--------------------------------------------------------------------------------
/docs/reference/plot.importanceTable-3.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/plot.importanceTable-3.png


--------------------------------------------------------------------------------
/docs/reference/plot.importanceTable-4.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/plot.importanceTable-4.png


--------------------------------------------------------------------------------
/docs/reference/plot.interactionsTable-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/plot.interactionsTable-1.png


--------------------------------------------------------------------------------
/docs/reference/plot.interactionsTable-2.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/reference/plot.interactionsTable-2.png


--------------------------------------------------------------------------------
/docs/pkgdown.yml:
--------------------------------------------------------------------------------
1 | pandoc: 1.19.2.1
2 | pkgdown: 1.3.0
3 | pkgdown_sha: ~
4 | articles:
5 |   EIX: EIX.html
6 |   titanic_data: titanic_data.html
7 | 
8 | 


--------------------------------------------------------------------------------
/docs/articles/EIX_files/figure-html/unnamed-chunk-6-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/articles/EIX_files/figure-html/unnamed-chunk-6-1.png


--------------------------------------------------------------------------------
/docs/articles/EIX_files/figure-html/unnamed-chunk-7-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/articles/EIX_files/figure-html/unnamed-chunk-7-1.png


--------------------------------------------------------------------------------
/docs/articles/EIX_files/figure-html/unnamed-chunk-8-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/articles/EIX_files/figure-html/unnamed-chunk-8-1.png


--------------------------------------------------------------------------------
/docs/articles/EIX_files/figure-html/unnamed-chunk-9-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/articles/EIX_files/figure-html/unnamed-chunk-9-1.png


--------------------------------------------------------------------------------
/docs/articles/EIX_files/figure-html/unnamed-chunk-10-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/articles/EIX_files/figure-html/unnamed-chunk-10-1.png


--------------------------------------------------------------------------------
/docs/articles/EIX_files/figure-html/unnamed-chunk-11-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/articles/EIX_files/figure-html/unnamed-chunk-11-1.png


--------------------------------------------------------------------------------
/docs/articles/EIX_files/figure-html/unnamed-chunk-11-2.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/articles/EIX_files/figure-html/unnamed-chunk-11-2.png


--------------------------------------------------------------------------------
/docs/articles/titanic_data_files/figure-html/unnamed-chunk-4-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/articles/titanic_data_files/figure-html/unnamed-chunk-4-1.png


--------------------------------------------------------------------------------
/docs/articles/titanic_data_files/figure-html/unnamed-chunk-5-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/articles/titanic_data_files/figure-html/unnamed-chunk-5-1.png


--------------------------------------------------------------------------------
/docs/articles/titanic_data_files/figure-html/unnamed-chunk-6-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/articles/titanic_data_files/figure-html/unnamed-chunk-6-1.png


--------------------------------------------------------------------------------
/docs/articles/titanic_data_files/figure-html/unnamed-chunk-7-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/articles/titanic_data_files/figure-html/unnamed-chunk-7-1.png


--------------------------------------------------------------------------------
/docs/articles/titanic_data_files/figure-html/unnamed-chunk-8-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/articles/titanic_data_files/figure-html/unnamed-chunk-8-1.png


--------------------------------------------------------------------------------
/docs/articles/vignette_titanic_files/figure-html/unnamed-chunk-4-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/articles/vignette_titanic_files/figure-html/unnamed-chunk-4-1.png


--------------------------------------------------------------------------------
/docs/articles/vignette_titanic_files/figure-html/unnamed-chunk-5-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/articles/vignette_titanic_files/figure-html/unnamed-chunk-5-1.png


--------------------------------------------------------------------------------
/docs/articles/vignette_titanic_files/figure-html/unnamed-chunk-6-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/articles/vignette_titanic_files/figure-html/unnamed-chunk-6-1.png


--------------------------------------------------------------------------------
/docs/articles/vignette_titanic_files/figure-html/unnamed-chunk-7-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/articles/vignette_titanic_files/figure-html/unnamed-chunk-7-1.png


--------------------------------------------------------------------------------
/docs/articles/vignette_titanic_files/figure-html/unnamed-chunk-8-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/ModelOriented/EIX/HEAD/docs/articles/vignette_titanic_files/figure-html/unnamed-chunk-8-1.png


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
 1 | ## EIX - Explain Interactions in XGBoost
 2 | A set of tools to explain XGBoost and LightGBM models.
 3 | 
 4 | ## Installation
 5 | 
 6 | Install from GitHub
 7 | ```{r}
 8 | devtools::install_github("ModelOriented/EIX")
 9 | ```
10 | 
11 | ## Cheatsheets
12 | <img src="https://raw.githubusercontent.com/ModelOriented/EIX/master/cheatsheets/EIX.png"/>
13 | 
14 | 


--------------------------------------------------------------------------------
/.travis.yml:
--------------------------------------------------------------------------------
 1 | language: R
 2 | sudo: required  # before_install below calls `sudo apt-get`, so the build needs a sudo-enabled environment
 3 | cache: packages
 4 | dist: trusty
 5 | 
 6 | before_install:  # system libraries installed before the R dependencies
 7 |     - sudo apt-get install --yes udunits-bin libproj-dev libgeos-dev libgdal-dev libgdal1-dev libudunits2-dev
 8 | 
 9 | env:
10 |   global:
11 |   - R_CHECK_ARGS="--timings"
12 | 
13 | notifications:
14 |   email: false
15 | 
16 | r_packages:  # extra R packages installed in addition to those resolved from DESCRIPTION
17 |   - archivist
18 |   - DALEX
19 |   - ggplot2
20 |   - covr
21 | 
22 | after_success:  # upload test coverage once the build has passed
23 |   - Rscript -e 'library(covr); codecov()'
24 | 


--------------------------------------------------------------------------------
/EIX.Rproj:
--------------------------------------------------------------------------------
 1 | Version: 1.0
 2 | 
 3 | RestoreWorkspace: No
 4 | SaveWorkspace: No
 5 | AlwaysSaveHistory: Default
 6 | 
 7 | EnableCodeIndexing: Yes
 8 | UseSpacesForTab: Yes
 9 | NumSpacesForTab: 2
10 | Encoding: UTF-8
11 | 
12 | RnwWeave: Sweave
13 | LaTeX: pdfLaTeX
14 | 
15 | AutoAppendNewline: Yes
16 | StripTrailingWhitespace: Yes
17 | 
18 | BuildType: Package
19 | PackageUseDevtools: Yes
20 | PackageInstallArgs: --no-multiarch --with-keep.source
21 | PackageRoxygenize: rd,collate,namespace
22 | 


--------------------------------------------------------------------------------
/man/tableOfTrees.Rd:
--------------------------------------------------------------------------------
 1 | % Generated by roxygen2: do not edit by hand
 2 | % Please edit documentation in R/calculateGain.R
 3 | \name{tableOfTrees}
 4 | \alias{tableOfTrees}
 5 | \title{tableOfTrees}
 6 | \usage{
 7 | tableOfTrees(model, data)
 8 | }
 9 | \arguments{
10 | \item{model}{a xgboost or lightgbm model}
11 | 
12 | \item{data}{a data table with data used to train the model}
13 | }
14 | \value{
15 | a data table
16 | }
17 | \description{
18 | tableOfTrees
19 | }
20 | \keyword{internal}
21 | 


--------------------------------------------------------------------------------
/man/calculateGain.Rd:
--------------------------------------------------------------------------------
 1 | % Generated by roxygen2: do not edit by hand
 2 | % Please edit documentation in R/calculateGain.R
 3 | \name{calculateGain}
 4 | \alias{calculateGain}
 5 | \title{calculateGain}
 6 | \usage{
 7 | calculateGain(xgb.model, data)
 8 | }
 9 | \arguments{
10 | \item{xgb.model}{a xgboost or lightgbm model}
11 | 
12 | \item{data}{a data table with data used to train the model}
13 | }
14 | \value{
15 | a list
16 | }
17 | \description{
18 | List of trees with pairs of variable and other needed fields
19 | }
20 | \keyword{internal}
21 | 


--------------------------------------------------------------------------------
/R/package.R:
--------------------------------------------------------------------------------
 1 | #' EIX package
 2 | #'
 3 | #' Structure mining from 'XGBoost' and 'LightGBM' models.
 4 | #' Key functionalities of this package cover: visualisation of tree-based ensemble models,
 5 | #' identification of interactions, measuring of variable importance,
 6 | #' measuring of interaction importance, explanation of single prediction
 7 | #' with break down plots (based on 'xgboostExplainer' and 'iBreakDown' packages).
 8 | #' To download the 'LightGBM' use the following link: <https://github.com/Microsoft/LightGBM>.
 9 | #' 'EIX' is a part of the 'DrWhy.AI' universe.
10 | #' @import MASS
11 | #' @import tidyr
12 | #'
13 | #' @name EIX-package
14 | NULL
15 | 


--------------------------------------------------------------------------------
/docs/pkgdown.js:
--------------------------------------------------------------------------------
 1 | $(function() {
 2 |   $("#sidebar").stick_in_parent({offset_top: 40});
 3 |   $('body').scrollspy({
 4 |     target: '#sidebar',
 5 |     offset: 60
 6 |   });
 7 |   // Mark the navbar entry whose link equals the current page URL as "active".
 8 |   var cur_path = location.href;
 9 |   $("#navbar ul li a").each(function(index, value) {
10 |     if (value.text == "Home")
11 |       return;
12 |     if (value.getAttribute("href") === "#")
13 |       return;
14 |     // Links labelled "Home" and bare "#" placeholder links were skipped above; compare the rest by resolved href.
15 | 	var path = value.href;
16 |     if (cur_path == path) {
17 |       // Exact URL match: add the "active" class to the parent <li>, and to the enclosing <li class="dropdown"> if the link sits inside a dropdown
18 |       var menu_anchor = $(value);
19 |       menu_anchor.parent().addClass("active");
20 |       menu_anchor.closest("li.dropdown").addClass("active");
21 |     }
22 |   });
23 | });
24 | 


--------------------------------------------------------------------------------
/man/EIX-package.Rd:
--------------------------------------------------------------------------------
 1 | % Generated by roxygen2: do not edit by hand
 2 | % Please edit documentation in R/package.R
 3 | \name{EIX-package}
 4 | \alias{EIX-package}
 5 | \title{EIX package}
 6 | \description{
 7 | Structure mining from 'XGBoost' and 'LightGBM' models.
 8 | Key functionalities of this package cover: visualisation of tree-based ensembles models,
 9 | identification of interactions, measuring of variable importance,
10 | measuring of interaction importance, explanation of single prediction
11 | with break down plots (based on 'xgboostExplainer' and 'iBreakDown' packages).
12 | To download the 'LightGBM' use the following link: <https://github.com/Microsoft/LightGBM>.
13 | EIX' is a part of the 'DrWhy.AI' universe.
14 | }
15 | 


--------------------------------------------------------------------------------
/NAMESPACE:
--------------------------------------------------------------------------------
 1 | # Generated by roxygen2: do not edit by hand
 2 | 
 3 | S3method(plot,importance)
 4 | S3method(plot,interactions)
 5 | S3method(plot,lollipop)
 6 | export(importance)
 7 | export(interactions)
 8 | export(lollipop)
 9 | export(waterfall)
10 | import(MASS)
11 | import(data.table)
12 | import(ggplot2)
13 | import(iBreakDown)
14 | import(tidyr)
15 | importFrom(DALEX,theme_drwhy)
16 | importFrom(ggiraphExtra,coord_radar)
17 | importFrom(ggrepel,geom_label_repel)
18 | importFrom(ggrepel,geom_text_repel)
19 | importFrom(purrr,map)
20 | importFrom(scales,pseudo_log_trans)
21 | importFrom(stats,frequency)
22 | importFrom(stats,predict)
23 | importFrom(stats,weighted.mean)
24 | importFrom(xgboost,slice)
25 | importFrom(xgboost,xgb.DMatrix)
26 | importFrom(xgboost,xgb.model.dt.tree)
27 | 


--------------------------------------------------------------------------------
/docs/link.svg:
--------------------------------------------------------------------------------
 1 | <?xml version="1.0" encoding="utf-8"?>
 2 | <!-- Generator: Adobe Illustrator 19.2.1, SVG Export Plug-In . SVG Version: 6.00 Build 0)  -->
 3 | <svg version="1.1" id="Layer_1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" x="0px" y="0px"
 4 | 	 viewBox="0 0 20 20" style="enable-background:new 0 0 20 20;" xml:space="preserve">
 5 | <style type="text/css">
 6 | 	.st0{fill:#75AADB;}
 7 | </style>
 8 | <path class="st0" d="M4,11.3h1.3v1.3H4c-2,0-4-2.3-4-4.7s2.1-4.7,4-4.7h5.3c1.9,0,4,2.3,4,4.7c0,1.9-1.2,3.6-2.7,4.3v-1.5
 9 | 	C11.4,10.2,12,9.1,12,8c0-1.7-1.4-3.3-2.7-3.3H4C2.7,4.7,1.3,6.3,1.3,8S2.7,11.3,4,11.3z M16,7.3h-1.3v1.3H16c1.3,0,2.7,1.6,2.7,3.3
10 | 	s-1.4,3.3-2.7,3.3h-5.3C9.4,15.3,8,13.7,8,12c0-1.1,0.6-2.2,1.3-2.8V7.7C7.9,8.4,6.7,10.1,6.7,12c0,2.4,2.1,4.7,4,4.7H16
11 | 	c1.9,0,4-2.3,4-4.7S18,7.3,16,7.3z"/>
12 | </svg>
13 | 


--------------------------------------------------------------------------------
/R/HR_data.R:
--------------------------------------------------------------------------------
 1 | #' Why are our best and most experienced employees leaving prematurely?
 2 | #'
 3 | #' A dataset from Kaggle competition Human Resources Analytics.
 4 | #' https://www.kaggle.com/ludobenistant/hr-analytics/data
 5 | #'
 6 | #' The description of the dataset was copied from the \code{breakDown} package.
 7 | #'
 8 | #' \itemize{
 9 | #'    \item  satisfaction_level Level of satisfaction (0-1)
10 | #'    \item  last_evaluation Time since last performance evaluation (in Years)
11 | #'    \item  number_project  Number of projects completed while at work
12 | #'    \item  average_montly_hours  Average monthly hours at workplace
13 | #'    \item  time_spend_company  Number of years spent in the company
14 | #'    \item  Work_accident  Whether the employee had a workplace accident
15 | #'    \item  left  Whether the employee left the workplace or not (1 or 0) Factor
16 | #'    \item  promotion_last_5years  Whether the employee was promoted in the last five years
17 | #'    \item  sales  Department in which they work
18 | #'    \item  salary  Relative level of salary (high)
19 | #' }
20 | #'
21 | #' @name HR_data
22 | #' @format A data table with 14999 rows and 10 variables
23 | #' @source https://www.kaggle.com/ludobenistant/hr-analytics/data, \url{https://cran.r-project.org/package=breakDown}
24 |  NULL
25 | 


--------------------------------------------------------------------------------
/DESCRIPTION:
--------------------------------------------------------------------------------
 1 | Package: EIX
 2 | Title: Explain Interactions in 'XGBoost'
 3 | Version: 1.1
 4 | Authors@R: c(
 5 |   person("Ewelina", "Karbowiak", email = "ewelina.karbowiak12@gmail.com", role = c("aut", "cre")),
 6 |   person("Przemyslaw", "Biecek", email = "przemyslaw.biecek@gmail.com", role = c("aut","ths"))
 7 |   )
 8 | Description: Structure mining from 'XGBoost' and 'LightGBM' models.
 9 |     Key functionalities of this package cover: visualisation of tree-based ensembles models,
10 |     identification of interactions, measuring of variable importance,
11 |     measuring of interaction importance, explanation of single prediction 
12 |     with break down plots (based on 'xgboostExplainer' and 'iBreakDown' packages). 
13 |     To download the 'LightGBM' use the following link: <https://github.com/Microsoft/LightGBM>.
14 |     'EIX' is a part of the 'DrWhy.AI' universe.
15 | Depends: R (>= 3.4.0)
16 | License: GPL-2
17 | Encoding: UTF-8
18 | LazyData: true
19 | Imports:
20 |     MASS,
21 |     ggplot2,
22 |     data.table,
23 |     purrr,
24 |     xgboost,
25 |     DALEX,
26 |     ggrepel,
27 |     ggiraphExtra,
28 |     iBreakDown,
29 |     tidyr,
30 |     scales
31 | RoxygenNote: 7.1.1
32 | Suggests:
33 |     Matrix,
34 |     knitr,
35 |     rmarkdown,
36 |     lightgbm
37 | VignetteBuilder: knitr
38 | URL: https://github.com/ModelOriented/EIX
39 | BugReports: https://github.com/ModelOriented/EIX/issues
40 | 


--------------------------------------------------------------------------------
/man/HR_data.Rd:
--------------------------------------------------------------------------------
 1 | % Generated by roxygen2: do not edit by hand
 2 | % Please edit documentation in R/HR_data.R
 3 | \name{HR_data}
 4 | \alias{HR_data}
 5 | \title{Why are our best and most experienced employees leaving prematurely?}
 6 | \format{
 7 | A data table with 14999 rows and 10 variables
 8 | }
 9 | \source{
10 | https://www.kaggle.com/ludobenistant/hr-analytics/data, \url{https://cran.r-project.org/package=breakDown}
11 | }
12 | \description{
13 | A dataset from Kaggle competition Human Resources Analytics.
14 | https://www.kaggle.com/ludobenistant/hr-analytics/data
15 | }
16 | \details{
17 | The description of the dataset was copied from the \code{breakDown} package.
18 | 
19 | \itemize{
20 |    \item  satisfaction_level Level of satisfaction (0-1)
21 |    \item  last_evaluation Time since last performance evaluation (in Years)
22 |    \item  number_project  Number of projects completed while at work
23 |    \item  average_montly_hours  Average monthly hours at workplace
24 |    \item  time_spend_company  Number of years spent in the company
25 |    \item  Work_accident  Whether the employee had a workplace accident
26 |    \item  left  Whether the employee left the workplace or not (1 or 0) Factor
27 |    \item  promotion_last_5years  Whether the employee was promoted in the last five years
28 |    \item  sales  Department in which they work
29 |    \item  salary  Relative level of salary (high)
30 | }
31 | }
32 | 


--------------------------------------------------------------------------------
/man/lollipop.Rd:
--------------------------------------------------------------------------------
 1 | % Generated by roxygen2: do not edit by hand
 2 | % Please edit documentation in R/lollipop.R
 3 | \name{lollipop}
 4 | \alias{lollipop}
 5 | \title{Tables needed for lollipop plot}
 6 | \usage{
 7 | lollipop(xgb_model, data)
 8 | }
 9 | \arguments{
10 | \item{xgb_model}{a xgboost or lightgbm model.}
11 | 
12 | \item{data}{a data table with data used to train the model.}
13 | }
14 | \value{
15 | an object of the lollipop class
16 | }
17 | \description{
18 | This function calculates two tables needed to generate the lollipop plot, which visualises the model.
19 | The first table contains information about all nodes in the trees forming a model.
20 | It includes the gain value, depth and ID of each node.
21 | The second table contains similar information about the roots of the trees.
22 | }
23 | \examples{
24 | library("EIX")
25 | library("Matrix")
26 | sm <- sparse.model.matrix(left ~ . - 1,  data = HR_data)
27 | 
28 | library("xgboost")
29 | param <- list(objective = "binary:logistic", max_depth = 2)
30 | xgb_model <- xgboost(sm, params = param, label = HR_data[, left] == 1, nrounds = 25, verbose = 0)
31 | 
32 | lolli <- lollipop(xgb_model, sm)
33 | plot(lolli, labels = "topAll", log_scale = TRUE)
34 | 
35 | \donttest{
36 | library(lightgbm)
37 | train_data <- lgb.Dataset(sm, label =  HR_data[, left] == 1)
38 | params <- list(objective = "binary", max_depth = 2)
39 | lgb_model <- lgb.train(params, train_data, 25)
40 | 
41 | lolli <- lollipop(lgb_model, sm)
42 | plot(lolli, labels = "topAll", log_scale = TRUE)
43 | 
44 | }
45 | 
46 | }
47 | 


--------------------------------------------------------------------------------
/man/plot.interactions.Rd:
--------------------------------------------------------------------------------
 1 | % Generated by roxygen2: do not edit by hand
 2 | % Please edit documentation in R/plot_interactions.R
 3 | \name{plot.interactions}
 4 | \alias{plot.interactions}
 5 | \title{Plot importance of interactions or pairs}
 6 | \usage{
 7 | \method{plot}{interactions}(x, ...)
 8 | }
 9 | \arguments{
10 | \item{x}{a result from the \code{interactions} function.}
11 | 
12 | \item{...}{other parameters.}
13 | }
14 | \value{
15 | a ggplot object
16 | }
17 | \description{
18 | This function plots the importance ranking of interactions and pairs in the model.
19 | }
20 | \details{
21 | NOTE: Be careful when using this function with the \code{option="pairs"} parameter,
22 |       because a high gain of a pair can be a result of a high gain of the child variable.
23 |      Only those pairs of variables should be considered strong interactions,
24 |      where the variable on the bottom (child) has a higher gain than the variable on the top (parent).
25 | }
26 | \examples{
27 | library("EIX")
28 | library("Matrix")
29 | sm <- sparse.model.matrix(left ~ . - 1,  data = HR_data)
30 | 
31 | library("xgboost")
32 | param <- list(objective = "binary:logistic", max_depth = 2)
33 | xgb_model <- xgboost(sm, params = param, label = HR_data[, left] == 1, nrounds = 25, verbose=0)
34 | 
35 | inter <- interactions(xgb_model, sm,		option = "interactions")
36 | inter
37 | plot(inter)
38 | 
39 | inter <- interactions(xgb_model, sm,		option = "pairs")
40 | inter
41 | plot(inter)
42 | 
43 | \donttest{
44 | library(lightgbm)
45 | train_data <- lgb.Dataset(sm, label =  HR_data[, left] == 1)
46 | params <- list(objective = "binary", max_depth = 2)
47 | lgb_model <- lgb.train(params, train_data, 25)
48 | 
49 | inter <- interactions(lgb_model, sm,		option = "interactions")
50 | inter
51 | plot(inter)
52 | 
53 | inter <- interactions(lgb_model, sm,		option = "pairs")
54 | inter
55 | plot(inter)
56 | }
57 | 
58 | }
59 | 


--------------------------------------------------------------------------------
/man/plot.lollipop.Rd:
--------------------------------------------------------------------------------
 1 | % Generated by roxygen2: do not edit by hand
 2 | % Please edit documentation in R/plot_lollipop.R
 3 | \name{plot.lollipop}
 4 | \alias{plot.lollipop}
 5 | \title{Visualisation of the model}
 6 | \usage{
 7 | \method{plot}{lollipop}(x, ..., labels = "topAll", log_scale = TRUE, threshold = 0.1)
 8 | }
 9 | \arguments{
10 | \item{x}{a result from the \code{lollipop} function.}
11 | 
12 | \item{...}{other parameters.}
13 | 
14 | \item{labels}{if "topAll" then labels for the most important interactions (vertical label)
15 | and variables in the roots (horizontal label) will be displayed,
16 | if "interactions" then labels for all interactions,
17 | if "roots" then labels for all variables in the root.}
18 | 
19 | \item{log_scale}{TRUE/FALSE logarithmic scale on the plot. Default TRUE.}
20 | 
21 | \item{threshold}{only labels with Gain higher than `threshold` of the max Gain value in the model will appear on the plot.
22 | The lower the threshold, the more labels on the plot. Range from 0 to 1. Default 0.1.}
23 | }
24 | \value{
25 | a ggplot object
26 | }
27 | \description{
28 | The lollipop plots the model with the most important interactions and variables in the roots.
29 | }
30 | \examples{
31 | library("EIX")
32 | library("Matrix")
33 | sm <- sparse.model.matrix(left ~ . - 1,  data = HR_data)
34 | 
35 | library("xgboost")
36 | param <- list(objective = "binary:logistic", max_depth = 2)
37 | xgb_model <- xgboost(sm, params = param, label = HR_data[, left] == 1, nrounds = 25, verbose = 0)
38 | 
39 | lolli <- lollipop(xgb_model, sm)
40 | plot(lolli, labels = "topAll", log_scale = TRUE)
41 | 
42 | \donttest{
43 | library(lightgbm)
44 | train_data <- lgb.Dataset(sm, label =  HR_data[, left] == 1)
45 | params <- list(objective = "binary", max_depth = 3)
46 | lgb_model <- lgb.train(params, train_data, 25)
47 | 
48 | lolli <- lollipop(lgb_model, sm)
49 | plot(lolli, labels = "topAll", log_scale = TRUE)
50 | }
51 | 
52 | }
53 | 


--------------------------------------------------------------------------------
/man/waterfall.Rd:
--------------------------------------------------------------------------------
 1 | % Generated by roxygen2: do not edit by hand
 2 | % Please edit documentation in R/waterfall.R
 3 | \name{waterfall}
 4 | \alias{waterfall}
 5 | \title{Explain prediction of a single observation}
 6 | \usage{
 7 | waterfall(
 8 |   xgb_model,
 9 |   new_observation,
10 |   data,
11 |   type = "binary",
12 |   option = "interactions",
13 |   baseline = 0
14 | )
15 | }
16 | \arguments{
17 | \item{xgb_model}{a xgboost model.}
18 | 
19 | \item{new_observation}{a new observation.}
20 | 
21 | \item{data}{row from the original dataset with the new observation to explain (not one-hot-encoded).
22 | The param above has to be set to merge categorical features.
23 | If you don't want to merge categorical features, set this parameter the same as \code{new_observation}.}
24 | 
25 | \item{type}{the learning task of the model. Available tasks: "binary" for binary classification  or "regression" for linear regression.}
26 | 
27 | \item{option}{if "variables", the plot includes only single variables,
28 | if "interactions", then only interactions.
29 | Default "interactions".}
30 | 
31 | \item{baseline}{a number or a character "Intercept" (for model intercept).
32 | The baseline for the plot, where the rectangles should start.
33 | Default 0.}
34 | }
35 | \value{
36 | an object of the broken class
37 | }
38 | \description{
39 | This function calculates a table with influence of variables and interactions
40 | on the prediction of a given observation. It supports only xgboost models.
41 | }
42 | \details{
43 | The function contains code or pieces of code
44 | from \code{breakDown} code created by Przemysław Biecek
45 | and \code{xgboostExplainer} code created by David Foster.
46 | }
47 | \examples{
48 | 
49 | \donttest{
50 | library("EIX")
51 | library("Matrix")
52 | sm <- sparse.model.matrix(left ~ . - 1,  data = HR_data)
53 | 
54 | library("xgboost")
55 | param <- list(objective = "binary:logistic", max_depth = 2)
56 | xgb_model <- xgboost(sm, params = param, label = HR_data[, left] == 1, nrounds = 25, verbose=0)
57 | 
58 | data <- HR_data[9,-7]
59 | new_observation <- sm[9,]
60 | 
61 | wf <- waterfall(xgb_model, new_observation, data,  option = "interactions")
62 | wf
63 | 
64 | plot(wf)
65 | }
66 | 
67 | }
68 | 


--------------------------------------------------------------------------------
/man/interactions.Rd:
--------------------------------------------------------------------------------
 1 | % Generated by roxygen2: do not edit by hand
 2 | % Please edit documentation in R/interactions.R
 3 | \name{interactions}
 4 | \alias{interactions}
 5 | \title{Importance of interactions and pairs in the model}
 6 | \usage{
 7 | interactions(xgb_model, data, option = "interactions")
 8 | }
 9 | \arguments{
10 | \item{xgb_model}{a xgboost or lightgbm model.}
11 | 
12 | \item{data}{a data table with data used to train the model.}
13 | 
14 | \item{option}{if "interactions", the table contains interactions,
15 | if "pairs", this table contains all the pairs in the model.
16 | Default "interactions".}
17 | }
18 | \value{
19 | a data table
20 | }
21 | \description{
22 | This function calculates a table with two measures of importance for interactions and pairs in the model.
23 | }
24 | \details{
25 | Available measures:
26 | \itemize{
27 | \item "sumGain" - sum of Gain value in all nodes, in which given variable occurs,
28 | \item "frequency" - number of occurrences in the nodes for given variable.
29 | }
30 | 
31 | NOTE: Be careful when using this function with the \code{option="pairs"} parameter,
32 |       because a high gain of a pair can be a result of a high gain of the child variable.
33 |      Only those pairs of variables should be considered strong interactions,
34 |      where the variable on the bottom (child) has a higher gain than the variable on the top (parent).
35 | }
36 | \examples{
37 | library("EIX")
38 | library("Matrix")
39 | sm <- sparse.model.matrix(left ~ . - 1,  data = HR_data)
40 | 
41 | library("xgboost")
42 | param <- list(objective = "binary:logistic", max_depth = 2)
43 | xgb_model <- xgboost(sm, params = param, label = HR_data[, left] == 1, nrounds = 25, verbose=0)
44 | 
45 | inter <- interactions(xgb_model, sm, option = "interactions")
46 | inter
47 | plot(inter)
48 | 
49 | inter <- interactions(xgb_model, sm, option = "pairs")
50 | inter
51 | plot(inter)
52 | 
53 | \donttest{
54 | library(lightgbm)
55 | train_data <- lgb.Dataset(sm, label =  HR_data[, left] == 1)
56 | params <- list(objective = "binary", max_depth = 2)
57 | lgb_model <- lgb.train(params, train_data, 25)
58 | 
59 | inter <- interactions(lgb_model, sm, option = "interactions")
60 | inter
61 | plot(inter)
62 | 
63 | inter <- interactions(lgb_model, sm, option = "pairs")
64 | inter
65 | plot(inter)
66 | }
67 | 
68 | }
69 | 


--------------------------------------------------------------------------------
/R/lollipop.R:
--------------------------------------------------------------------------------
 1 | #' Tables needed for lollipop plot
 2 | #'
 3 | #' This function calculates two tables needed to generate the lollipop plot, which visualises the model.
 4 | #' The first table contains information about all nodes in the trees forming a model.
 5 | #' It includes the gain value, depth and ID of each node.
 6 | #' The second table contains similar information about the roots of the trees.
 7 | #'
 8 | #' @param xgb_model a xgboost or lightgbm model.
 9 | #' @param data a data table with data used to train the model.
10 | #'
11 | #' @return an object of the lollipop class
12 | #'
13 | #' @import data.table
14 | #'
15 | #' @examples
16 | #' library("EIX")
17 | #' library("Matrix")
18 | #' sm <- sparse.model.matrix(left ~ . - 1,  data = HR_data)
19 | #'
20 | #' library("xgboost")
21 | #' param <- list(objective = "binary:logistic", max_depth = 2)
22 | #' xgb_model <- xgboost(sm, params = param, label = HR_data[, left] == 1, nrounds = 25, verbose = 0)
23 | #'
24 | #' lolli <- lollipop(xgb_model, sm)
25 | #' plot(lolli, labels = "topAll", log_scale = TRUE)
26 | #'
27 | #'\donttest{
28 | #'library(lightgbm)
29 | #'train_data <- lgb.Dataset(sm, label =  HR_data[, left] == 1)
30 | #'params <- list(objective = "binary", max_depth = 2)
31 | #'lgb_model <- lgb.train(params, train_data, 25)
32 | #'
33 | #' lolli <- lollipop(lgb_model, sm)
34 | #' plot(lolli, labels = "topAll", log_scale = TRUE)
35 | #'
36 | #'}
37 | #'
38 | #' @export
39 | 
40 | lollipop <- function(xgb_model, data){
41 |   # NULL placeholders for the column names referenced unquoted in the
42 |   # data.table expressions below.
43 |   Feature <- Quality <- Node <- Tree <- ID <- depth <-
44 |     interaction <- . <- parentsName <- name_pair <- NULL
45 | 
46 |   # Stack the list returned by calculateGain() into a single table.
47 |   all_nodes <- rbindlist(calculateGain(xgb_model, data))
48 | 
49 |   # Second element of the result: the rows with Node == 0 (tree roots).
50 |   roots <- all_nodes[Node == 0, .(Quality, Feature, Tree, ID, depth)]
51 | 
52 |   # First element of the result: every row that is not a leaf.
53 |   nodes <- all_nodes[Feature != "Leaf",
54 |                      .(Quality, Feature, Node, Tree, ID,
55 |                        interaction, depth, parentsName, name_pair)]
56 | 
57 |   # For rows flagged as interactions, show the pair name as the feature.
58 |   nodes[interaction == TRUE, Feature := name_pair]
59 | 
60 |   result <- list(nodes, roots)
61 |   structure(result, class = c("lollipop", "list"))
62 | }
63 | 


--------------------------------------------------------------------------------
/docs/docsearch.js:
--------------------------------------------------------------------------------
 1 | $(function() {
 2 | 
 3 |   // register a handler to move the focus to the search bar
 4 |   // upon pressing shift + "/" (i.e. "?")
 5 |   $(document).on('keydown', function(e) {
 6 |     if (e.shiftKey && e.keyCode == 191) {
 7 |       e.preventDefault();
 8 |       $("#search-input").focus();
 9 |     }
10 |   });
11 | 
12 |   $(document).ready(function() {
13 |     // do keyword highlighting
14 |     /* modified from https://jsfiddle.net/julmot/bL6bb5oo/ */
15 |     var mark = function() {
16 |       // Highlights, inside `.contents`, the keyword carried by the `q` query parameter.
17 |       var referrer = document.URL ;
18 |       var paramKey = "q" ;
19 |       // Nothing to do unless the URL contains a query string.
20 |       if (referrer.indexOf("?") !== -1) {
21 |         var qs = referrer.substr(referrer.indexOf('?') + 1);
22 |         var qs_noanchor = qs.split('#')[0];
23 |         var qsa = qs_noanchor.split('&');
24 |         var keyword = "";
25 |         // Scan the key=value pairs; a later `q` pair overwrites an earlier one.
26 |         for (var i = 0; i < qsa.length; i++) {
27 |           var currentParam = qsa[i].split('=');
28 |           // Skip anything that does not split into exactly two parts on "=".
29 |           if (currentParam.length !== 2) {
30 |             continue;
31 |           }
32 |           // "+" is rewritten to "%20" before decoding, so it is read as a space.
33 |           if (currentParam[0] == paramKey) {
34 |             keyword = decodeURIComponent(currentParam[1].replace(/\+/g, "%20"));
35 |           }
36 |         }
37 |         // Remove existing marks first; mark the keyword once that is done.
38 |         if (keyword !== "") {
39 |           $(".contents").unmark({
40 |             done: function() {
41 |               $(".contents").mark(keyword);
42 |             }
43 |           });
44 |         }
45 |       }
46 |     };
47 | 
48 |     mark();
49 |   });
50 | });
51 | 
52 | /* Search term highlighting ------------------------------*/
53 | 
54 | function matchedWords(hit) {
55 |   var words = [];
56 | 
57 |   var hierarchy = hit._highlightResult.hierarchy;
58 |   // loop to fetch from lvl0, lvl1, etc.
59 |   for (var idx in hierarchy) {
60 |     words = words.concat(hierarchy[idx].matchedWords);
61 |   }
62 | 
63 |   var content = hit._highlightResult.content;
64 |   if (content) {
65 |     words = words.concat(content.matchedWords);
66 |   }
67 | 
68 |   // return unique words
69 |   var words_uniq = [...new Set(words)];
70 |   return words_uniq;
71 | }
72 | 
73 | function updateHitURL(hit) {
74 | 
75 |   var words = matchedWords(hit);
76 |   var url = "";
77 | 
78 |   if (hit.anchor) {
79 |     url = hit.url_without_anchor + '?q=' + escape(words.join(" ")) + '#' + hit.anchor;
80 |   } else {
81 |     url = hit.url + '?q=' + escape(words.join(" "));
82 |   }
83 | 
84 |   return url;
85 | }
86 | 


--------------------------------------------------------------------------------
/vignettes/titanic_data.Rmd:
--------------------------------------------------------------------------------
 1 | ---
 2 | title: "EIX: Titanic data "
 3 | author: "Ewelina Karbowiak"
 4 | date: "2018-03-29"
 5 | output: rmarkdown::html_vignette
 6 | vignette: >
 7 |   %\VignetteIndexEntry{EIX for Titanic data}
 8 |   %\VignetteEngine{knitr::rmarkdown}
 9 |   %\VignetteEncoding{UTF-8}
10 | ---
11 | 
12 | ```{r, echo=FALSE}
13 | knitr::opts_chunk$set(fig.height = 6, fig.width = 6, fig.align = "center")
14 | 
15 | ```
16 | 
17 | ## Data Info
18 | This vignette shows the usage of the `EIX` package for the Titanic data. This dataset was copied from the `stablelearner` package. With the `EIX` package we explain an XGBoost classification model concerning the survival problem. More details about the `EIX` package [here](https://modeloriented.github.io/EIX/articles/EIX.html).
19 | 
20 | 
21 | ```{r}
22 | #devtools :: install_github("ModelOriented/EIX")
23 | library("EIX")
24 | library(data.table)
25 | set.seed(4)
26 | titanic_data<-data.table(na.omit(titanic_data))
27 | knitr::kable(head(titanic_data))
28 | 
29 | library("Matrix")
30 | sparse_matrix <- sparse.model.matrix(survived ~ . - 1,  data = titanic_data)
31 | ```
32 | 
33 | 
34 | ## Xgboost model creation
35 | 
36 | 
37 | ```{r, warning=FALSE, message=FALSE}
38 | library("xgboost")
39 | param <- list(objective = "binary:logistic", max_depth = 2)
40 | xgb_model <- xgboost(sparse_matrix, params = param, label = titanic_data[, "survived"] == "yes", nrounds = 50, verbose = FALSE)
41 | ```
42 | 
43 | 
44 | ## Model visualization
45 | 
46 | First let's plot the model.
47 | 
48 | ```{r}
49 | lolli<-lollipop(xgb_model,sparse_matrix)
50 | plot(lolli, threshold=0.02)
51 | ```
52 | 
53 | 
54 | ## Interactions
55 | 
56 | Next we explore interactions using the `interactions()` function and its plot.
57 | 
58 | ```{r}
59 | interactions<-interactions(xgb_model, sparse_matrix, option = "interactions")
60 | head(interactions, 15)
61 | plot(interactions)
62 | ```
63 | 
64 | ## Variables' and interactions’ importance
65 | 
66 | ```{r}
67 | importance<-importance(xgb_model, sparse_matrix, option = "both")
68 | head(importance, 15)
69 | plot(importance, radar=FALSE)
70 | ```
71 | 
72 | ```{r}
73 | plot(importance)
74 | ```
75 | 
76 | ## Explanation of the single prediction including interactions
77 | 
78 | Let's see an explanation of the prediction for an 18-year-old from England who has traveled 3rd class.
79 | 
80 | ```{r}
81 | data <- titanic_data[27,]
82 | new_observation <- sparse_matrix[27,]
83 | wf<-waterfall(xgb_model, new_observation, data, option = "interactions")
84 | wf
85 | plot(wf)
86 | ```
87 | 


--------------------------------------------------------------------------------
/docs/jquery.sticky-kit.min.js:
--------------------------------------------------------------------------------
 1 | /*
 2 |  Sticky-kit v1.1.2 | WTFPL | Leaf Corcoran 2015 | http://leafo.net
 3 | */
 4 | (function(){var b,f;b=this.jQuery||window.jQuery;f=b(window);b.fn.stick_in_parent=function(d){var A,w,J,n,B,K,p,q,k,E,t;null==d&&(d={});t=d.sticky_class;B=d.inner_scrolling;E=d.recalc_every;k=d.parent;q=d.offset_top;p=d.spacer;w=d.bottoming;null==q&&(q=0);null==k&&(k=void 0);null==B&&(B=!0);null==t&&(t="is_stuck");A=b(document);null==w&&(w=!0);J=function(a,d,n,C,F,u,r,G){var v,H,m,D,I,c,g,x,y,z,h,l;if(!a.data("sticky_kit")){a.data("sticky_kit",!0);I=A.height();g=a.parent();null!=k&&(g=g.closest(k));
 5 | if(!g.length)throw"failed to find stick parent";v=m=!1;(h=null!=p?p&&a.closest(p):b("<div />"))&&h.css("position",a.css("position"));x=function(){var c,f,e;if(!G&&(I=A.height(),c=parseInt(g.css("border-top-width"),10),f=parseInt(g.css("padding-top"),10),d=parseInt(g.css("padding-bottom"),10),n=g.offset().top+c+f,C=g.height(),m&&(v=m=!1,null==p&&(a.insertAfter(h),h.detach()),a.css({position:"",top:"",width:"",bottom:""}).removeClass(t),e=!0),F=a.offset().top-(parseInt(a.css("margin-top"),10)||0)-q,
 6 | u=a.outerHeight(!0),r=a.css("float"),h&&h.css({width:a.outerWidth(!0),height:u,display:a.css("display"),"vertical-align":a.css("vertical-align"),"float":r}),e))return l()};x();if(u!==C)return D=void 0,c=q,z=E,l=function(){var b,l,e,k;if(!G&&(e=!1,null!=z&&(--z,0>=z&&(z=E,x(),e=!0)),e||A.height()===I||x(),e=f.scrollTop(),null!=D&&(l=e-D),D=e,m?(w&&(k=e+u+c>C+n,v&&!k&&(v=!1,a.css({position:"fixed",bottom:"",top:c}).trigger("sticky_kit:unbottom"))),e<F&&(m=!1,c=q,null==p&&("left"!==r&&"right"!==r||a.insertAfter(h),
 7 | h.detach()),b={position:"",width:"",top:""},a.css(b).removeClass(t).trigger("sticky_kit:unstick")),B&&(b=f.height(),u+q>b&&!v&&(c-=l,c=Math.max(b-u,c),c=Math.min(q,c),m&&a.css({top:c+"px"})))):e>F&&(m=!0,b={position:"fixed",top:c},b.width="border-box"===a.css("box-sizing")?a.outerWidth()+"px":a.width()+"px",a.css(b).addClass(t),null==p&&(a.after(h),"left"!==r&&"right"!==r||h.append(a)),a.trigger("sticky_kit:stick")),m&&w&&(null==k&&(k=e+u+c>C+n),!v&&k)))return v=!0,"static"===g.css("position")&&g.css({position:"relative"}),
 8 | a.css({position:"absolute",bottom:d,top:"auto"}).trigger("sticky_kit:bottom")},y=function(){x();return l()},H=function(){G=!0;f.off("touchmove",l);f.off("scroll",l);f.off("resize",y);b(document.body).off("sticky_kit:recalc",y);a.off("sticky_kit:detach",H);a.removeData("sticky_kit");a.css({position:"",bottom:"",top:"",width:""});g.position("position","");if(m)return null==p&&("left"!==r&&"right"!==r||a.insertAfter(h),h.remove()),a.removeClass(t)},f.on("touchmove",l),f.on("scroll",l),f.on("resize",
 9 | y),b(document.body).on("sticky_kit:recalc",y),a.on("sticky_kit:detach",H),setTimeout(l,0)}};n=0;for(K=this.length;n<K;n++)d=this[n],J(b(d));return this}}).call(this);
10 | 


--------------------------------------------------------------------------------
/R/plot_interactions.R:
--------------------------------------------------------------------------------
 1 | #' Plot importance of interactions or pairs
 2 | #'
 3 | #' This function plots the importance ranking of interactions and pairs in the model.
 4 | #'
 5 | #' NOTE: Be careful when using this function with the \code{option="pairs"} parameter,
 6 | #'       because a high gain of a pair can be a result of a high gain of the child variable.
 7 | #'      Only those pairs of variables should be considered strong interactions,
 8 | #'      where the variable on the bottom (child) has a higher gain than the variable on the top (parent).
 9 | #'
10 | #' @param x a result from the \code{interactions} function.
11 | #' @param ... other parameters.
12 | #'
13 | #' @return a ggplot object
14 | #'
15 | #' @import data.table
16 | #' @import ggplot2
17 | #' @importFrom DALEX theme_drwhy
18 | #'
19 | #' @examples
20 | #' library("EIX")
21 | #' library("Matrix")
22 | #' sm <- sparse.model.matrix(left ~ . - 1,  data = HR_data)
23 | #'
24 | #' library("xgboost")
25 | #' param <- list(objective = "binary:logistic", max_depth = 2)
26 | #' xgb_model <- xgboost(sm, params = param, label = HR_data[, left] == 1, nrounds = 25, verbose=0)
27 | #'
28 | #' inter <- interactions(xgb_model, sm,		option = "interactions")
29 | #' inter
30 | #' plot(inter)
31 | #'
32 | #' inter <- interactions(xgb_model, sm,		option = "pairs")
33 | #' inter
34 | #' plot(inter)
35 | #'
36 | #' \donttest{
37 | #'library(lightgbm)
38 | #'train_data <- lgb.Dataset(sm, label =  HR_data[, left] == 1)
39 | #'params <- list(objective = "binary", max_depth = 2)
40 | #'lgb_model <- lgb.train(params, train_data, 25)
41 | #'
42 | #' inter <- interactions(lgb_model, sm,		option = "interactions")
43 | #' inter
44 | #' plot(inter)
45 | #'
46 | #' inter <- interactions(lgb_model, sm,		option = "pairs")
47 | #' inter
48 | #' plot(inter)
49 | #'}
50 | #'
51 | #' @export
52 | 
53 | 
54 | plot.interactions <- function(x, ...) {
55 |   # NULL placeholders for the column names referenced unquoted in aes() below.
56 |   Feature <- sumGain <- Child <- Parent <- breaks <- NULL
57 |   sumGain <- x$sumGain
58 |   # Split [min, max] into four equal-width bins. The inner cut points are
59 |   # offset by the minimum so they stay inside the range when min(sumGain) != 0.
60 |   lo <- min(sumGain)
61 |   hi <- max(sumGain)
62 |   if (hi == lo) lo <- hi - max(abs(hi), 1)  # equal gains: keep breaks unique
63 |   breaks <- c(lo, lo + (hi - lo) * c(0.25, 0.5, 0.75), hi)
64 |   x$breaks <- cut(sumGain, breaks = breaks , right = FALSE, dig.lab = 4, include.lowest = TRUE)
65 |   x$Child <- factor(x$Child, levels = unique(x$Child[order(x$sumGain, decreasing = TRUE)]))
66 | 
67 |   ggplot(data.frame(x), aes(Child, Parent, sumGain)) +
68 |     geom_tile(aes(fill = breaks)) +
69 |     theme_drwhy() +
70 |     theme(axis.text.x = element_text(hjust = 1, angle = 90),
71 |           axis.text.y = element_text(hjust = 1, angle = 0)) +
72 |     scale_fill_manual(name = "sumGain",
73 |                       values = c("#f4f5ff", "#ccccff", "#7f7fff", "#3232ff"),
74 |                       drop = FALSE,
75 |                       breaks = levels(x$breaks),
76 |                       labels = c("very low", "low", "medium", "high")) +
77 |     coord_equal()
78 | }
79 | 


--------------------------------------------------------------------------------
/R/titanic_data.R:
--------------------------------------------------------------------------------
 1 | #' Passengers and Crew on the RMS Titanic
 2 | #'
 3 | #' The \code{titanic} data is a complete list of passengers and crew members on  the RMS Titanic.
 4 | #' It includes a variable indicating whether a person did  survive the sinking of the RMS
 5 | #' Titanic on April 15, 1912.
 6 | #'
 7 | #' The description of the dataset was copied from the \code{DALEX} package.
 8 | #'
 9 | #' This dataset was copied from the \code{stablelearner} package and went through a few variable
10 | #' transformations. Levels in \code{embarked} were replaced with full names, \code{sibsp}, \code{parch} and \code{fare}
11 | #' were converted to numerical variables and values for crew were replaced with 0.
12 | #' If you use this dataset please cite the original package.
13 | #'
14 | #' From \code{stablelearner}: The website \url{https://www.encyclopedia-titanica.org} offers detailed  information about passengers and crew
15 | #' members on the RMS Titanic. According to the website 1317 passengers and 890 crew members were aboard.
16 | #' 8 musicians and 9 employees of the shipyard company are listed as passengers, but travelled with a
17 | #' free ticket, which is why they have \code{NA} values in \code{fare}. In addition to that, \code{fare}
18 | #' is truly missing for a few regular passengers.
19 | #'
20 | #' \itemize{
21 | #' \item gender a factor with levels \code{male} and \code{female}.
22 | #' \item age a numeric value with the person's age on the day of the sinking.
23 | #' \item class a factor specifying the class for passengers or the type of service aboard for crew members.
24 | #' \item embarked a factor with the person's place of embarkment (Belfast/Cherbourg/Queenstown/Southampton).
25 | #' \item country a factor with the person's home country.
26 | #' \item fare a numeric value with the ticket price (\code{0} for crew members, musicians and employees of the shipyard company).
27 | #' \item sibsp an ordered factor specifying the number of siblings/spouses aboard; adopted from Vanderbilt data set (see below).
28 | #' \item parch an ordered factor specifying the number of parents/children aboard; adopted from Vanderbilt data set (see below).
29 | #' \item survived a factor with two levels (\code{no} and \code{yes}) specifying whether the person has survived the sinking.
30 | #' }
31 | #'
32 | #' @docType data
33 | #' @keywords titanic_data
34 | #' @name titanic_data
35 | #' @references   \url{https://www.encyclopedia-titanica.org}, \url{http://biostat.mc.vanderbilt.edu/DataSets},
36 | #' \url{https://CRAN.R-project.org/package=stablelearner}, \url{https://cran.r-project.org/package=DALEX}.
37 | #' @source The description of the dataset was copied from the \code{DALEX} package.
38 | #' This dataset was copied from the \code{stablelearner} package and went through a few variable
39 | #' transformations. The complete list of persons on the RMS Titanic was downloaded from
40 | #' \url{https://www.encyclopedia-titanica.org} on April 5, 2016. The information given
41 | #' in \code{sibsp} and \code{parch} was adopted from a data set obtained from \url{http://biostat.mc.vanderbilt.edu/DataSets}.
42 | #' @usage data(titanic_data)
43 | #' @format a data frame with 2207 rows and 11 columns
44 | NULL
45 | 


--------------------------------------------------------------------------------
/man/importance.Rd:
--------------------------------------------------------------------------------
 1 | % Generated by roxygen2: do not edit by hand
 2 | % Please edit documentation in R/importance.R
 3 | \name{importance}
 4 | \alias{importance}
 5 | \title{Importance of variables and interactions in the model}
 6 | \usage{
 7 | importance(xgb_model, data, option = "both", digits = 4)
 8 | }
 9 | \arguments{
10 | \item{xgb_model}{a xgboost or lightgbm model.}
11 | 
12 | \item{data}{a data table with data used to train the model.}
13 | 
14 | \item{option}{if "variables" then table includes only single variables,
15 | if "interactions", then only interactions
16 | if "both", then both single variable and interactions.
17 | Default "both".}
18 | 
19 | \item{digits}{number of significant digits that shall be returned. Will be passed to the signif() functions.}
20 | }
21 | \value{
22 | a data table
23 | }
24 | \description{
25 | This function calculates a table with selected measures of importance
26 | for variables and interactions.
27 | }
28 | \details{
29 | Available measures:
30 | \itemize{
31 | \item "sumGain" - sum of Gain value in all nodes, in which given variable occurs,
32 | \item "sumCover" - sum of Cover value in all nodes, in which given variable occurs; for LightGBM models: number of observation, which pass through the node,
33 | \item "mean5Gain" - mean gain from 5 occurrences of given variable with the highest gain,
34 | \item "meanGain" - mean Gain value in all nodes, in which given variable occurs,
35 | \item "meanCover" - mean Cover value in all nodes, in which given variable occurs; for LightGBM models: mean number of observation, which pass through the node,
36 | \item "frequency" - number of occurrences in the nodes for given variable.
37 | }
38 | 
39 | Additionally for table with single variables:
40 | \itemize{
41 | \item "meanDepth"  - mean depth weighted by gain,
42 | \item "numberOfRoots" - number of occurrences in the root,
43 | \item "weightedRoot" - mean number of occurrences in the root, which is weighted by gain.
44 | }
45 | }
46 | \examples{
47 | library("EIX")
48 | library("Matrix")
49 | sm <- sparse.model.matrix(left ~ . - 1,  data = HR_data)
50 | 
51 | library("xgboost")
52 | param <- list(objective = "binary:logistic", max_depth = 2)
53 | xgb_model <- xgboost(sm, params = param, label = HR_data[, left] == 1, nrounds = 25, verbose=0)
54 | 
55 | imp <- importance(xgb_model, sm, option = "both")
56 | imp
57 | plot(imp,  top = 10)
58 | 
59 | imp <- importance(xgb_model, sm, option = "variables")
60 | imp
61 | plot(imp,  top = nrow(imp))
62 | 
63 |  imp <- importance(xgb_model, sm, option = "interactions")
64 |  imp
65 | plot(imp,  top =  nrow(imp))
66 | 
67 |  imp <- importance(xgb_model, sm, option = "variables")
68 |  imp
69 | plot(imp, top = NULL, radar = FALSE, xmeasure = "sumCover", ymeasure = "sumGain")
70 | 
71 | \donttest{
72 | library(lightgbm)
73 | train_data <- lgb.Dataset(sm, label =  HR_data[, left] == 1)
74 | params <- list(objective = "binary", max_depth = 2)
75 | lgb_model <- lgb.train(params, train_data, 25)
76 | 
77 | imp <- importance(lgb_model, sm, option = "both")
78 | imp
79 | plot(imp,  top = nrow(imp))
80 | 
81 | imp <- importance(lgb_model, sm, option = "variables")
82 | imp
83 | plot(imp, top = NULL, radar = FALSE, xmeasure = "sumCover", ymeasure = "sumGain")
84 | 
85 | }
86 | 
87 | }
88 | 


--------------------------------------------------------------------------------
/man/titanic_data.Rd:
--------------------------------------------------------------------------------
 1 | % Generated by roxygen2: do not edit by hand
 2 | % Please edit documentation in R/titanic_data.R
 3 | \docType{data}
 4 | \name{titanic_data}
 5 | \alias{titanic_data}
 6 | \title{Passengers and Crew on the RMS Titanic}
 7 | \format{
 8 | a data frame with 2207 rows and 11 columns
 9 | }
10 | \source{
11 | The description of the dataset was copied from the \code{DALEX} package.
12 | This dataset was copied from the \code{stablelearner} package and went through a few variable
13 | transformations. The complete list of persons on the RMS Titanic was downloaded from
14 | \url{https://www.encyclopedia-titanica.org} on April 5, 2016. The information given
15 | in \code{sibsp} and \code{parch} was adopted from a data set obtained from \url{http://biostat.mc.vanderbilt.edu/DataSets}.
16 | }
17 | \usage{
18 | data(titanic_data)
19 | }
20 | \description{
21 | The \code{titanic} data is a complete list of passengers and crew members on  the RMS Titanic.
22 | It includes a variable indicating whether a person did  survive the sinking of the RMS
23 | Titanic on April 15, 1912.
24 | }
25 | \details{
26 | The description of the dataset was copied from the \code{DALEX} package.
27 | 
28 | This dataset was copied from the \code{stablelearner} package and went through a few variable
29 | transformations. Levels in \code{embarked} were replaced with full names, \code{sibsp}, \code{parch} and \code{fare}
30 | were converted to numerical variables and values for crew were replaced with 0.
31 | If you use this dataset please cite the original package.
32 | 
33 | From \code{stablelearner}: The website \url{https://www.encyclopedia-titanica.org} offers detailed information about passengers and crew
34 | members on the RMS Titanic. According to the website 1317 passengers and 890 crew members were aboard.
35 | 8 musicians and 9 employees of the shipyard company are listed as passengers, but travelled with a
36 | free ticket, which is why they have \code{NA} values in \code{fare}. In addition to that, \code{fare}
37 | is truly missing for a few regular passengers.
38 | 
39 | \itemize{
40 | \item gender a factor with levels \code{male} and \code{female}.
41 | \item age a numeric value with the person's age on the day of the sinking.
42 | \item class a factor specifying the class for passengers or the type of service aboard for crew members.
43 | \item embarked a factor with the person's place of embarkment (Belfast/Cherbourg/Queenstown/Southampton).
44 | \item country a factor with the person's home country.
45 | \item fare a numeric value with the ticket price (\code{0} for crew members, musicians and employees of the shipyard company).
46 | \item sibsp an ordered factor specifying the number of siblings/spouses aboard; adopted from Vanderbilt data set (see below).
47 | \item parch an ordered factor specifying the number of parents/children aboard; adopted from Vanderbilt data set (see below).
48 | \item survived a factor with two levels (\code{no} and \code{yes}) specifying whether the person has survived the sinking.
49 | }
50 | }
51 | \references{
52 | \url{https://www.encyclopedia-titanica.org}, \url{http://biostat.mc.vanderbilt.edu/DataSets},
53 | \url{https://CRAN.R-project.org/package=stablelearner}, \url{https://cran.r-project.org/package=DALEX}.
54 | }
55 | \keyword{titanic_data}
56 | 


--------------------------------------------------------------------------------
/R/plot_lollipop.R:
--------------------------------------------------------------------------------
 1 | #' Visualisation of the model
 2 | #'
 3 | #' The lollipop plots the model with the most important interactions and variables in the roots.
 4 | #'
 5 | #' @param x a result from the \code{lollipop} function.
 6 | #' @param labels if "topAll" then labels for the most important interactions (vertical label)
 7 | #'               and variables in the roots (horizontal label) will be displayed,
 8 | #'               if "interactions" then labels for all interactions,
 9 | #'               if "roots" then labels for all variables in the root.
10 | #' @param threshold  only labels with Gain higher than `threshold` times the max Gain value in the model are shown on the plot.
11 | #'                   The lower the threshold, the more labels on the plot. Range from 0 to 1. Default 0.1.
12 | #' @param log_scale  TRUE/FALSE logarithmic scale on the plot. Default TRUE.
13 | #' @param ... other parameters.
14 | #'
15 | #' @return a ggplot object
16 | #'
17 | #' @import data.table
18 | #' @import ggplot2
19 | #' @importFrom DALEX theme_drwhy
20 | #' @importFrom ggrepel geom_label_repel
21 | #' @importFrom ggrepel geom_text_repel
22 | #' @importFrom scales pseudo_log_trans
23 | #'
24 | #' @examples
25 | #' library("EIX")
26 | #' library("Matrix")
27 | #' sm <- sparse.model.matrix(left ~ . - 1,  data = HR_data)
28 | #'
29 | #' library("xgboost")
30 | #' param <- list(objective = "binary:logistic", max_depth = 2)
31 | #' xgb_model <- xgboost(sm, params = param, label = HR_data[, left] == 1, nrounds = 25, verbose = 0)
32 | #'
33 | #' lolli <- lollipop(xgb_model, sm)
34 | #' plot(lolli, labels = "topAll", log_scale = TRUE)
35 | #'
36 | #' \donttest{
37 | #'library(lightgbm)
38 | #'train_data <- lgb.Dataset(sm, label =  HR_data[, left] == 1)
39 | #'params <- list(objective = "binary", max_depth = 3)
40 | #'lgb_model <- lgb.train(params, train_data, 25)
41 | #'
42 | #' lolli <- lollipop(lgb_model, sm)
43 | #' plot(lolli, labels = "topAll", log_scale = TRUE)
44 | #'}
45 | #'
46 | #' @export
47 | 
48 | plot.lollipop <- function(x, ..., labels = "topAll", log_scale = TRUE, threshold = 0.1) {
49 |   # Draws one lollipop per node (Gain against tree number), coloured and shaped by depth.
50 |   # x: its first element holds the nodes and its second the roots (used with data.table syntax).
51 |   # labels must be "topAll", "interactions" or "roots"; anything else is rejected up
52 |   # front, because an unmatched switch() would return NULL and discard the plot.
53 |   labels <- match.arg(labels, c("topAll", "interactions", "roots"))
54 |   Tree <- Quality <- depth <- Feature <- NULL  # placeholders for column names used below
55 |   nodes <- x[[1]]
56 |   roots <- x[[2]]
57 | 
58 |   p <- ggplot(data = data.frame(nodes), aes(x = Tree, y = Quality, group = as.factor(depth))) +
59 |     geom_line(data = data.frame(roots), color = "red", size = 1.25, alpha = .5) +
60 |     geom_segment(aes(x = Tree, xend = Tree, y = 0, yend = Quality), size = 1.25) +
61 |     geom_point(aes(shape = as.factor(depth), color = as.factor(depth)), size = 3)
62 | 
63 |   # Only label points whose Gain exceeds `threshold` times the largest node Gain.
64 |   min_gain <- threshold * max(nodes[, Quality])
65 |   nodes_labels <- data.frame(nodes[(interaction == TRUE) & (Quality > min_gain), ])
66 |   roots_labels <- data.frame(roots[Quality > min_gain, ])
67 | 
68 |   # Vertical text for interactions, boxed labels for variables in the roots.
69 |   if (labels %in% c("topAll", "interactions")) {
70 |     p <- p + geom_text_repel(data = nodes_labels, aes(label = Feature), angle = 90,
71 |                              nudge_y = 0.05, direction = "x", vjust = 0, segment.size = 0.2)
72 |   }
73 |   if (labels %in% c("topAll", "roots")) {
74 |     p <- p + geom_label_repel(data = roots_labels, aes(label = Feature))
75 |   }
76 | 
77 |   p <- p + theme_drwhy() + ylab("Gain") +
78 |     scale_shape_discrete("Depth") +
79 |     scale_colour_discrete("Depth")
80 |   if (log_scale) {
81 |     p <- p + scale_x_continuous(trans = "pseudo_log")
82 |   }
83 |   p
84 | }
85 | 
86 | 


--------------------------------------------------------------------------------
/man/plot.importance.Rd:
--------------------------------------------------------------------------------
  1 | % Generated by roxygen2: do not edit by hand
  2 | % Please edit documentation in R/plot_importance.R
  3 | \name{plot.importance}
  4 | \alias{plot.importance}
  5 | \title{Plot importance measures}
  6 | \usage{
  7 | \method{plot}{importance}(
  8 |   x,
  9 |   ...,
 10 |   top = 10,
 11 |   radar = TRUE,
 12 |   text_start_point = 0.5,
 13 |   text_size = 3.5,
 14 |   xmeasure = "sumCover",
 15 |   ymeasure = "sumGain"
 16 | )
 17 | }
 18 | \arguments{
 19 | \item{x}{a result from the \code{importance} function.}
 20 | 
 21 | \item{...}{other parameters.}
 22 | 
 23 | \item{top}{number of positions on the plot or NULL for all variables. Default 10.}
 24 | 
 25 | \item{radar}{TRUE/FALSE. If TRUE the plot shows
 26 | six measures of variables' or interactions' importance in the model.
 27 | If FALSE the plot containing two chosen measures
 28 | of variables' or interactions' importance in the model.}
 29 | 
 30 | \item{text_start_point}{place, where the names of the particular feature start. Available for `radar=TRUE`. Range from 0 to 1. Default 0.5.}
 31 | 
 32 | \item{text_size}{size of the text on the plot. Default 3.5.}
 33 | 
 34 | \item{xmeasure}{measure on the x-axis. Available for `radar=FALSE`. Default "sumCover".}
 35 | 
 36 | \item{ymeasure}{measure on the y-axis. Available for `radar=FALSE`. Default "sumGain".}
 37 | }
 38 | \value{
 39 | a ggplot object
 40 | }
 41 | \description{
 42 | This function plots selected measures of importance for variables and interactions.
 43 | It is possible to visualise importance table in two ways: radar plot with six measures
 44 | and scatter plot with two chosen measures.
 45 | }
 46 | \details{
 47 | Available measures:
 48 | \itemize{
 49 | \item "sumGain" - sum of Gain value in all nodes, in which given variable occurs,
 50 | \item "sumCover" - sum of Cover value in all nodes, in which given variable occurs; for LightGBM models: number of observation, which pass through the node,
 51 | \item "mean5Gain" - mean gain from 5 occurrences of given variable with the highest gain,
 52 | \item "meanGain" - mean Gain value in all nodes, in which given variable occurs,
 53 | \item "meanCover" - mean Cover value in all nodes, in which given variable occurs; for LightGBM models: mean number of observation, which pass through the node,
 54 | \item "frequency" - number of occurrences in the nodes for given variable.
 55 | }
 56 | 
 57 | Additionally for plots with single variables:
 58 | \itemize{
 59 | \item "meanDepth"  - mean depth weighted by gain,
 60 | \item "numberOfRoots" - number of occurrences in the root,
 61 | \item "weightedRoot" - mean number of occurrences in the root, which is weighted by gain.
 62 | }
 63 | }
 64 | \examples{
 65 | library("EIX")
 66 | library("Matrix")
 67 | sm <- sparse.model.matrix(left ~ . - 1,  data = HR_data)
 68 | 
 69 | library("xgboost")
 70 | param <- list(objective = "binary:logistic", max_depth = 2)
 71 | xgb_model <- xgboost(sm, params = param, label = HR_data[, left] == 1, nrounds = 25, verbose=0)
 72 | 
 73 | imp <- importance(xgb_model, sm, option = "both")
 74 | imp
 75 | plot(imp,  top = 10)
 76 | 
 77 | imp <- importance(xgb_model, sm, option = "variables")
 78 | imp
 79 | plot(imp,  top = nrow(imp))
 80 | 
 81 |  imp <- importance(xgb_model, sm, option = "interactions")
 82 |  imp
 83 | plot(imp,  top =  nrow(imp))
 84 | 
 85 |  imp <- importance(xgb_model, sm, option = "variables")
 86 |  imp
 87 | plot(imp, top = NULL, radar = FALSE, xmeasure = "sumCover", ymeasure = "sumGain")
 88 | 
 89 | \donttest{
 90 | library(lightgbm)
 91 | train_data <- lgb.Dataset(sm, label =  HR_data[, left] == 1)
 92 | params <- list(objective = "binary", max_depth = 2)
 93 | lgb_model <- lgb.train(params, train_data, 25)
 94 | 
 95 | imp <- importance(lgb_model, sm, option = "both")
 96 | imp
 97 | plot(imp,  top = nrow(imp))
 98 | 
 99 | imp <- importance(lgb_model, sm, option = "variables")
100 | imp
101 | plot(imp, top = NULL, radar = FALSE, xmeasure = "sumCover", ymeasure = "sumGain")
102 | 
103 | }
104 | 
105 | }
106 | 


--------------------------------------------------------------------------------
/R/interactions.R:
--------------------------------------------------------------------------------
  1 | #' Importance of interactions and pairs in the model
  2 | #'
  3 | #' This function calculates a table with two measures of importance for interactions and pairs in the model.
  4 | #'
  5 | #' Available measures:
  6 | #'\itemize{
  7 | #'\item "sumGain" - sum of Gain value in all nodes, in which given variable occurs,
  8 | #'\item "frequency" - number of occurrences in the nodes for given variable.
  9 | #'}
 10 | #'
 11 | #' NOTE: Be careful when using this function with the \code{option="pairs"} parameter,
 12 | #'       because a high gain of a pair can be a result of a high gain of the child variable.
 13 | #'      Only those pairs of variables should be considered strong interactions
 14 | #'      where the variable on the bottom (child) has higher gain than the variable on the top (parent).
 15 | #'
 16 | #' @param xgb_model a xgboost or lightgbm model.
 17 | #' @param data a data table with data used to train the model.
 18 | #' @param option if "interactions", the table contains interactions,
 19 | #'            if "pairs", this table contains all the pairs in the model.
 20 | #'            Default "interactions".
 21 | #'
 22 | #' @return a data table
 23 | #'
 24 | #' @import data.table
 25 | #' @importFrom purrr map
 26 | #' @importFrom stats frequency
 27 | #'
 28 | #' @examples
 29 | #' library("EIX")
 30 | #' library("Matrix")
 31 | #' sm <- sparse.model.matrix(left ~ . - 1,  data = HR_data)
 32 | #'
 33 | #' library("xgboost")
 34 | #' param <- list(objective = "binary:logistic", max_depth = 2)
 35 | #' xgb_model <- xgboost(sm, params = param, label = HR_data[, left] == 1, nrounds = 25, verbose=0)
 36 | #'
 37 | #' inter <- interactions(xgb_model, sm, option = "interactions")
 38 | #' inter
 39 | #' plot(inter)
 40 | #'
 41 | #' inter <- interactions(xgb_model, sm, option = "pairs")
 42 | #' inter
 43 | #' plot(inter)
 44 | #'
 45 | #' \donttest{
 46 | #'library(lightgbm)
 47 | #'train_data <- lgb.Dataset(sm, label =  HR_data[, left] == 1)
 48 | #'params <- list(objective = "binary", max_depth = 2)
 49 | #'lgb_model <- lgb.train(params, train_data, 25)
 50 | #'
 51 | #' inter <- interactions(lgb_model, sm, option = "interactions")
 52 | #' inter
 53 | #' plot(inter)
 54 | #'
 55 | #' inter <- interactions(lgb_model, sm, option = "pairs")
 56 | #' inter
 57 | #' plot(inter)
 58 | #'}
 59 | #'
 60 | #' @export
 61 | #'
 62 | #'
 63 | 
 64 | interactions <- function(xgb_model, data, option = "interactions") {
 65 |   # Returns a Parent/Child/sumGain/frequency table; unknown `option` values are rejected
 66 |   # up front because they would otherwise leave gainTable undefined.
 67 |   Child <- Parent <- Feature <- sumGain <- . <- NULL
 68 |   option <- match.arg(option, c("interactions", "pairs"))
 69 |   if (option == "interactions") {
 70 |     gainTable <- importanceInteraction(xgb_model, data)[, .(Feature, sumGain, frequency)]
 71 |     parts <- strsplit(gainTable[, Feature], "[:]")  # Feature is "parent:child"; split once
 72 |     gainTable[, `:=`(Parent = as.vector(unlist(map(parts, 1))),
 73 |                      Child = as.vector(unlist(map(parts, 2))))]
 74 |     gainTable <- gainTable[, .(Parent, Child, sumGain, frequency)]
 75 |   } else {
 76 |     gainTable <- calculatePairsGainTable(xgb_model, data)
 77 |   }
 78 |   class(gainTable) <- c("interactions", "data.table")
 79 |   gainTable
 80 | }
 81 | 
 82 | # calculatePairsGainTable: summed gain and occurrence count of every variable pair in the model.
 83 | calculatePairsGainTable <- function(xgb_model, data) {
 84 |   name_pair <- childsGain <- Parent <- Child <- sumGain <- N <- . <- NULL
 85 |   allNodes <- rbindlist(calculateGain(xgb_model, data))
 86 | 
 87 |   # Occurrences per pair (via table) and summed child gain per pair, joined on name_pair.
 88 |   pairCounts <- data.table(table(allNodes[, "name_pair"], dnn = "name_pair"))
 89 |   pairGains <- allNodes[, .(sumGain = sum(childsGain)), by = "name_pair"]
 90 |   pairTable <- merge(pairCounts, pairGains, by = "name_pair")
 91 | 
 92 |   # name_pair is "parent:child"; split it once into its two halves.
 93 |   halves <- strsplit(pairTable[, name_pair], "[:]")
 94 |   pairTable[, `:=`(Parent = as.vector(unlist(map(halves, 1))),
 95 |                    Child = as.vector(unlist(map(halves, 2))))]
 96 |   setorderv(pairTable, "sumGain", -1)
 97 | 
 98 |   pairTable[, .(Parent, Child, sumGain, frequency = N)]
 99 | }
100 | 


--------------------------------------------------------------------------------
/docs/authors.html:
--------------------------------------------------------------------------------
  1 | <!-- Generated by pkgdown: do not edit by hand -->
  2 | <!DOCTYPE html>
  3 | <html>
  4 |   <head>
  5 |   <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | 
  9 | <title>Authors • EIX</title>
 10 | 
 11 | <!-- jquery -->
 12 | <script src="https://code.jquery.com/jquery-3.1.0.min.js" integrity="sha384-nrOSfDHtoPMzJHjVTdCopGqIqeYETSXhZDFyniQ8ZHcVy08QesyHcnOUpMpqnmWq" crossorigin="anonymous"></script>
 13 | <!-- Bootstrap -->
 14 | 
 15 | <link href="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/css/bootstrap.min.css" rel="stylesheet" integrity="sha384-BVYiiSIFeK1dGmJRAkycuHAHRg32OmUcww7on3RYdg4Va+PmSTsz/K68vbdEjh4u" crossorigin="anonymous">
 16 | <script src="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha384-Tc5IQib027qvyjSMfHjOMaLkfuWVxZxUPnCJA7l2mCWNIpG9mGCD8wGNIcPD7Txa" crossorigin="anonymous"></script>
 17 | 
 18 | <!-- Font Awesome icons -->
 19 | <link href="https://maxcdn.bootstrapcdn.com/font-awesome/4.6.3/css/font-awesome.min.css" rel="stylesheet" integrity="sha384-T8Gy5hrqNKT+hzMclPo118YTQO6cYprQmhrYwIiQ/3axmI1hQomh7Ud2hPOy8SP1" crossorigin="anonymous">
 20 | 
 21 | 
 22 | <!-- pkgdown -->
 23 | <link href="pkgdown.css" rel="stylesheet">
 24 | <script src="jquery.sticky-kit.min.js"></script>
 25 | <script src="pkgdown.js"></script>
 26 | <!-- mathjax -->
 27 | <script src='https://mathjax.rstudio.com/latest/MathJax.js?config=TeX-AMS-MML_HTMLorMML'></script>
 28 | 
 29 | <!--[if lt IE 9]>
 30 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 31 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 32 | <![endif]-->
 33 | 
 34 | 
 35 |   </head>
 36 | 
 37 |   <body>
 38 |     <div class="container template-authors">
 39 |       <header>
 40 |       <div class="navbar navbar-default navbar-fixed-top navbar-mi2" role="navigation">
 41 |   <div class="container">
 42 |     <div class="navbar-header">
 43 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar">
 44 |         <span class="icon-bar"></span>
 45 |         <span class="icon-bar"></span>
 46 |         <span class="icon-bar"></span>
 47 |       </button>
 48 | 	  <a class = "navbar-mi2logo" href="http://mi2.mini.pw.edu.pl/">
 49 |         <img src = "https://github.com/mi2-warsaw/MI2template/blob/master/inst/pkgdown/assets/MI2logo.jpg?raw=true" alt = "MI2" height = 46 title = "MI2">
 50 | 	  </a>
 51 |       <a class="navbar-brand navbar-mi2" href="index.html"></a>
 52 |     </div>
 53 |     <div id="navbar" class="navbar-collapse collapse">
 54 |       <ul class="navbar-mi2 nav navbar-nav">
 55 |         <li>
 56 |   <a href="index.html">
 57 |     <span class="fa fa-home fa-lg"></span>
 58 |      
 59 |   </a>
 60 | </li>
 61 | <li>
 62 |   <a href="articles/EIX.html">Get started</a>
 63 | </li>
 64 | <li>
 65 |   <a href="reference/index.html">Reference</a>
 66 | </li>
 67 | <li class="dropdown">
 68 |   <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-expanded="false">
 69 |     Articles
 70 |      
 71 |     <span class="caret"></span>
 72 |   </a>
 73 |   <ul class="dropdown-menu" role="menu">
 74 |     <li>
 75 |       <a href="articles/titanic_data.html">EIX: Titanic data </a>
 76 |     </li>
 77 |   </ul>
 78 | </li>
 79 |       </ul>
 80 |       
 81 |       <ul class="nav navbar-nav navbar-right">
 82 |         <li>
 83 |   <a href="https://github.com/ModelOriented/EIX">
 84 |     <span class="fa fa-github fa-lg"></span>
 85 |      
 86 |   </a>
 87 | </li>
 88 |       </ul>
 89 |     </div><!--/.nav-collapse -->
 90 |   </div><!--/.container -->
 91 | </div><!--/.navbar -->
 92 | 
 93 |       
 94 |       </header>
 95 | 
 96 |       <div class="row">
 97 |   <div class="contents col-md-12">
 98 |     <div class="page-header">
 99 |       <h1>Authors</h1>
100 |     </div>
101 |     <ul class="list-unstyled">
102 |       <li>
103 |         <p><strong>Ewelina Karbowiak</strong>. Author, maintainer.
104 |         </p>
105 |       </li>
106 |       <li>
107 |         <p><strong>Przemyslaw Biecek</strong>. Author, thesis advisor.
108 |         </p>
109 |       </li>
110 |     </ul>
111 | 
112 |   </div>
113 | 
114 | </div>
115 | 
116 | 
117 |       <footer>
118 |       <div class="copyright">
119 |   <p>Developed by Ewelina Karbowiak, Przemyslaw Biecek.</p>
120 | </div>
121 | 
122 | <div class="pkgdown">
123 |   <p>Site built with <a href="http://hadley.github.io/pkgdown/">pkgdown</a>.</p>
124 | </div>
125 | 
126 |       </footer>
127 |    </div>
128 | 
129 |   </body>
130 | </html>
131 | 
132 | 


--------------------------------------------------------------------------------
/docs/articles/index.html:
--------------------------------------------------------------------------------
  1 | <!-- Generated by pkgdown: do not edit by hand -->
  2 | <!DOCTYPE html>
  3 | <html>
  4 |   <head>
  5 |   <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | 
  9 | <title>Articles • EIX</title>
 10 | 
 11 | <!-- jquery -->
 12 | <script src="https://code.jquery.com/jquery-3.1.0.min.js" integrity="sha384-nrOSfDHtoPMzJHjVTdCopGqIqeYETSXhZDFyniQ8ZHcVy08QesyHcnOUpMpqnmWq" crossorigin="anonymous"></script>
 13 | <!-- Bootstrap -->
 14 | 
 15 | <link href="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/css/bootstrap.min.css" rel="stylesheet" integrity="sha384-BVYiiSIFeK1dGmJRAkycuHAHRg32OmUcww7on3RYdg4Va+PmSTsz/K68vbdEjh4u" crossorigin="anonymous">
 16 | <script src="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha384-Tc5IQib027qvyjSMfHjOMaLkfuWVxZxUPnCJA7l2mCWNIpG9mGCD8wGNIcPD7Txa" crossorigin="anonymous"></script>
 17 | 
 18 | <!-- Font Awesome icons -->
 19 | <link href="https://maxcdn.bootstrapcdn.com/font-awesome/4.6.3/css/font-awesome.min.css" rel="stylesheet" integrity="sha384-T8Gy5hrqNKT+hzMclPo118YTQO6cYprQmhrYwIiQ/3axmI1hQomh7Ud2hPOy8SP1" crossorigin="anonymous">
 20 | 
 21 | 
 22 | <!-- pkgdown -->
 23 | <link href="../pkgdown.css" rel="stylesheet">
 24 | <script src="../jquery.sticky-kit.min.js"></script>
 25 | <script src="../pkgdown.js"></script>
 26 | <!-- mathjax -->
 27 | <script src='https://mathjax.rstudio.com/latest/MathJax.js?config=TeX-AMS-MML_HTMLorMML'></script>
 28 | 
 29 | <!--[if lt IE 9]>
 30 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 31 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 32 | <![endif]-->
 33 | 
 34 | 
 35 |   </head>
 36 | 
 37 |   <body>
 38 |     <div class="container template-article-index">
 39 |       <header>
 40 |       <div class="navbar navbar-default navbar-fixed-top navbar-mi2" role="navigation">
 41 |   <div class="container">
 42 |     <div class="navbar-header">
 43 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar">
 44 |         <span class="icon-bar"></span>
 45 |         <span class="icon-bar"></span>
 46 |         <span class="icon-bar"></span>
 47 |       </button>
 48 | 	  <a class = "navbar-mi2logo" href="http://mi2.mini.pw.edu.pl/">
 49 |         <img src = "https://github.com/mi2-warsaw/MI2template/blob/master/inst/pkgdown/assets/MI2logo.jpg?raw=true" alt = "MI2" height = 46 title = "MI2">
 50 | 	  </a>
 51 |       <a class="navbar-brand navbar-mi2" href="../index.html"></a>
 52 |     </div>
 53 |     <div id="navbar" class="navbar-collapse collapse">
 54 |       <ul class="navbar-mi2 nav navbar-nav">
 55 |         <li>
 56 |   <a href="../index.html">
 57 |     <span class="fa fa-home fa-lg"></span>
 58 |      
 59 |   </a>
 60 | </li>
 61 | <li>
 62 |   <a href="../articles/EIX.html">Get started</a>
 63 | </li>
 64 | <li>
 65 |   <a href="../reference/index.html">Reference</a>
 66 | </li>
 67 | <li class="dropdown">
 68 |   <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-expanded="false">
 69 |     Articles
 70 |      
 71 |     <span class="caret"></span>
 72 |   </a>
 73 |   <ul class="dropdown-menu" role="menu">
 74 |     <li>
 75 |       <a href="../articles/titanic_data.html">EIX: Titanic data </a>
 76 |     </li>
 77 |   </ul>
 78 | </li>
 79 |       </ul>
 80 |       
 81 |       <ul class="nav navbar-nav navbar-right">
 82 |         <li>
 83 |   <a href="https://github.com/ModelOriented/EIX">
 84 |     <span class="fa fa-github fa-lg"></span>
 85 |      
 86 |   </a>
 87 | </li>
 88 |       </ul>
 89 |     </div><!--/.nav-collapse -->
 90 |   </div><!--/.container -->
 91 | </div><!--/.navbar -->
 92 | 
 93 |       
 94 |       </header>
 95 | 
 96 |       <div class="row">
 97 |   <div class="col-md-9 contents">
 98 |     <div class="page-header">
 99 |       <h1>Articles</h1>
100 |     </div>
101 | 
102 |     <div class="section ">
103 |       <h3>All vignettes</h3>
104 |       <p class="section-desc"></p>
105 | 
106 |       <ul>
107 |         <li><a href="EIX.html">EIX: Explain Interactions in XGBoost</a></li>
108 |         <li><a href="titanic_data.html">EIX: Titanic data </a></li>
109 |       </ul>
110 |     </div>
111 |   </div>
112 | </div>
113 | 
114 |       <footer>
115 |       <div class="copyright">
116 |   <p>Developed by Ewelina Karbowiak, Przemyslaw Biecek.</p>
117 | </div>
118 | 
119 | <div class="pkgdown">
120 |   <p>Site built with <a href="http://hadley.github.io/pkgdown/">pkgdown</a>.</p>
121 | </div>
122 | 
123 |       </footer>
124 |    </div>
125 | 
126 |   </body>
127 | </html>
128 | 
129 | 


--------------------------------------------------------------------------------
/docs/pkgdown.css:
--------------------------------------------------------------------------------
  1 | /* Sticker footer */
  2 | body > .container {
  3 |   display: flex;
  4 |   padding-top: 60px;
  5 |   min-height: calc(100vh);
  6 |   flex-direction: column;
  7 | }
  8 | 
  9 | body > .container .row {
 10 |   flex: 1;
 11 | }
 12 | 
 13 | footer {
 14 |   margin-top: 45px;
 15 |   padding: 35px 0 36px;
 16 |   border-top: 1px solid #e5e5e5;
 17 |   color: #666;
 18 |   display: flex;
 19 | }
 20 | footer p {
 21 |   margin-bottom: 0;
 22 | }
 23 | footer div {
 24 |   flex: 1;
 25 | }
 26 | footer .pkgdown {
 27 |   text-align: right;
 28 | }
 29 | footer p {
 30 |   margin-bottom: 0;
 31 | }
 32 | 
 33 | img.icon {
 34 |   float: right;
 35 | }
 36 | 
 37 | img {
 38 |   max-width: 100%;
 39 | }
 40 | 
 41 | /* Section anchors ---------------------------------*/
 42 | 
 43 | a.anchor {
 44 |   margin-left: -30px;
 45 |   display:inline-block;
 46 |   width: 30px;
 47 |   height: 30px;
 48 |   visibility: hidden;
 49 | 
 50 |   background-image: url(./link.svg);
 51 |   background-repeat: no-repeat;
 52 |   background-size: 20px 20px;
 53 |   background-position: center center;
 54 | }
 55 | 
 56 | .hasAnchor:hover a.anchor {
 57 |   visibility: visible;
 58 | }
 59 | 
 60 | @media (max-width: 767px) {
 61 |   .hasAnchor:hover a.anchor {
 62 |     visibility: hidden;
 63 |   }
 64 | }
 65 | 
 66 | 
 67 | /* Fixes for fixed navbar --------------------------*/
 68 | 
 69 | .contents h1, .contents h2, .contents h3, .contents h4 {
 70 |   padding-top: 60px;
 71 |   margin-top: -60px;
 72 | }
 73 | 
 74 | /* Static header placement on mobile devices */
 75 | @media (max-width: 767px) {
 76 |   .navbar-fixed-top {
 77 |     position: absolute;
 78 |   }
 79 |   .navbar {
 80 |     padding: 0;
 81 |   }
 82 | }
 83 | 
 84 | 
 85 | /* Sidebar --------------------------*/
 86 | 
 87 | #sidebar {
 88 |   margin-top: 30px;
 89 | }
 90 | #sidebar h2 {
 91 |   font-size: 1.5em;
 92 |   margin-top: 1em;
 93 | }
 94 | 
 95 | #sidebar h2:first-child {
 96 |   margin-top: 0;
 97 | }
 98 | 
 99 | #sidebar .list-unstyled li {
100 |   margin-bottom: 0.5em;
101 | }
102 | 
103 | /* Reference index & topics ----------------------------------------------- */
104 | 
.ref-index th {font-weight: normal;}
.ref-index h2 {font-size: 20px;}

.ref-index td {vertical-align: top;}
/* Two-column layout of the reference index: alias list and topic title. */
.ref-index .alias {width: 40%;}
.ref-index .title {width: 60%;}
114 | 
115 | .ref-arguments th {text-align: right; padding-right: 10px;}
116 | .ref-arguments th, .ref-arguments td {vertical-align: top;}
117 | .ref-arguments .name {width: 20%;}
118 | .ref-arguments .desc {width: 80%;}
119 | 
120 | /* Nice scrolling for wide elements --------------------------------------- */
121 | 
/* Wide tables scroll horizontally inside their container instead of
   overflowing the page; the width is forced so the scroll box spans the
   full content column. */
table {
  display: block;
  overflow: auto;
  width: 100% !important;
}

/* Syntax highlighting ---------------------------------------------------- */

pre {
  word-wrap: normal;
  word-break: normal;
  border: 1px solid #eee;
}

pre, code {
  background-color: #f8f8f8;
  color: #333;
}

pre .img {
  margin: 5px 0;
}

pre .img img {
  background-color: #fff;
  display: block;
  height: auto;
}

code a, pre a {
  color: #375f84;
}
158 | 
159 | .fl      {color: #1514b5;}
160 | .fu      {color: #000000;} /* function */
161 | .ch,.st  {color: #036a07;} /* string */
162 | .kw      {color: #264D66;} /* keyword */
163 | .co      {color: #888888;} /* comment */
164 | 
165 | .message { color: black;   font-weight: bolder;}
166 | .error   { color: orange;  font-weight: bolder;}
167 | .warning { color: #6A0366; font-weight: bolder;}
168 | 
169 | .navbar-mi2logo {
170 |     float: left;
171 | 	margin-right: 15px;
172 | 	margin-top: 2px;
173 | }
174 | .navbar-mi2 {
175 | 	background-color: #4a3c89;
176 |     color: #fff !important;
177 | 	margin-right: 0px;
178 | }
179 | .navbar-mi2 > li > a {
180 |     color: #fff !important;
181 | }
182 | .navbar-mi2 > .active > a{
183 |     background-color: #370f54 !important;
184 | }
185 | .navbar-mi2 > .open > a:focus, .nav-pills> .open > a:focus{
186 |     background-color: #370f54 !important;
187 | }
188 | .dropdown-menu > .active > a, .dropdown-menu > .active > a:focus{
189 |     background-color: #370f54 !important;
190 | }
191 | 
192 |  .contents-mi2 > li > a:focus, .nav-pills > li > a:focus {
193 |     background-color: #4a3c89 !important;
194 | 	color: #fff;
195 | }
196 |  .contents-mi2 > li.active > a, .nav-pills > li.active > a{
197 |     background-color: #370f54 !important;
198 | }
199 |  .contents-mi2 > li > a, .nav-pills > li > a{
200 |     background-color: #4a3c89 !important;
201 | 	color: #fff;
202 | }
203 | 
204 | .sidebar-logo {
205 | 	display:block;
206 | 	margin-left:auto;
207 | 	margin-right:auto;
208 | 	text-align: justify;
209 | }


--------------------------------------------------------------------------------
/docs/reference/tableOfTrees.html:
--------------------------------------------------------------------------------
  1 | <!-- Generated by pkgdown: do not edit by hand -->
  2 | <!DOCTYPE html>
  3 | <html>
  4 |   <head>
  5 |   <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | 
  9 | <title>tableOfTrees — tableOfTrees • EIX</title>
 10 | 
 11 | <!-- jquery -->
 12 | <script src="https://code.jquery.com/jquery-3.1.0.min.js" integrity="sha384-nrOSfDHtoPMzJHjVTdCopGqIqeYETSXhZDFyniQ8ZHcVy08QesyHcnOUpMpqnmWq" crossorigin="anonymous"></script>
 13 | <!-- Bootstrap -->
 14 | 
 15 | <link href="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/css/bootstrap.min.css" rel="stylesheet" integrity="sha384-BVYiiSIFeK1dGmJRAkycuHAHRg32OmUcww7on3RYdg4Va+PmSTsz/K68vbdEjh4u" crossorigin="anonymous">
 16 | <script src="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha384-Tc5IQib027qvyjSMfHjOMaLkfuWVxZxUPnCJA7l2mCWNIpG9mGCD8wGNIcPD7Txa" crossorigin="anonymous"></script>
 17 | 
 18 | <!-- Font Awesome icons -->
 19 | <link href="https://maxcdn.bootstrapcdn.com/font-awesome/4.6.3/css/font-awesome.min.css" rel="stylesheet" integrity="sha384-T8Gy5hrqNKT+hzMclPo118YTQO6cYprQmhrYwIiQ/3axmI1hQomh7Ud2hPOy8SP1" crossorigin="anonymous">
 20 | 
 21 | 
 22 | <!-- pkgdown -->
 23 | <link href="../pkgdown.css" rel="stylesheet">
 24 | <script src="../jquery.sticky-kit.min.js"></script>
 25 | <script src="../pkgdown.js"></script>
 26 | <!-- mathjax -->
 27 | <script src='https://mathjax.rstudio.com/latest/MathJax.js?config=TeX-AMS-MML_HTMLorMML'></script>
 28 | 
 29 | <!--[if lt IE 9]>
 30 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 31 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 32 | <![endif]-->
 33 | 
 34 | 
 35 |   </head>
 36 | 
 37 |   <body>
 38 |     <div class="container template-reference-topic">
 39 |       <header>
 40 |       <div class="navbar navbar-default navbar-fixed-top navbar-mi2" role="navigation">
 41 |   <div class="container">
 42 |     <div class="navbar-header">
 43 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar">
 44 |         <span class="icon-bar"></span>
 45 |         <span class="icon-bar"></span>
 46 |         <span class="icon-bar"></span>
 47 |       </button>
 48 | 	  <a class = "navbar-mi2logo" href="http://mi2.mini.pw.edu.pl/">
 49 |         <img src = "https://github.com/mi2-warsaw/MI2template/blob/master/inst/pkgdown/assets/MI2logo.jpg?raw=true" alt = "MI2" height = 46 title = "MI2">
 50 | 	  </a>
 51 |       <a class="navbar-brand navbar-mi2" href="../index.html">tableOfTrees</a>
 52 |     </div>
 53 |     <div id="navbar" class="navbar-collapse collapse">
 54 |       <ul class="navbar-mi2 nav navbar-nav">
 55 |         <li>
 56 |   <a href="../index.html">
 57 |     <span class="fa fa-home fa-lg"></span>
 58 |      
 59 |   </a>
 60 | </li>
 61 | <li>
 62 |   <a href="../articles/EIX.html">Get started</a>
 63 | </li>
 64 | <li>
 65 |   <a href="../reference/index.html">Reference</a>
 66 | </li>
 67 | <li class="dropdown">
 68 |   <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-expanded="false">
 69 |     Articles
 70 |      
 71 |     <span class="caret"></span>
 72 |   </a>
 73 |   <ul class="dropdown-menu" role="menu">
 74 |     <li>
 75 |       <a href="../articles/titanic_data.html">EIX: Titanic data </a>
 76 |     </li>
 77 |   </ul>
 78 | </li>
 79 |       </ul>
 80 |       
 81 |       <ul class="nav navbar-nav navbar-right">
 82 |         <li>
 83 |   <a href="https://github.com/ModelOriented/EIX">
 84 |     <span class="fa fa-github fa-lg"></span>
 85 |      
 86 |   </a>
 87 | </li>
 88 |       </ul>
 89 |     </div><!--/.nav-collapse -->
 90 |   </div><!--/.container -->
 91 | </div><!--/.navbar -->
 92 | 
 93 |       
 94 |       </header>
 95 | 
 96 |       <div class="row">
 97 |   <div class="col-md-9 contents">
 98 |     <div class="page-header">
 99 |     <h1>tableOfTrees</h1>
100 |     </div>
101 | 
102 |     
103 |     <p>tableOfTrees</p>
104 |     
105 | 
106 |     <pre class="usage"><span class='fu'>tableOfTrees</span>(<span class='no'>model</span>, <span class='no'>data</span>)</pre>
107 |     
108 |     <h2 class="hasAnchor" id="arguments"><a class="anchor" href="#arguments"></a> Arguments</h2>
109 |     <table class="ref-arguments">
110 |     <colgroup><col class="name" /><col class="desc" /></colgroup>
111 |     <tr>
112 |       <th>model</th>
113 |       <td><p>a xgboost or lightgbm model</p></td>
114 |     </tr>
115 |     <tr>
116 |       <th>data</th>
117 |       <td><p>a data table with data used to train the model</p></td>
118 |     </tr>
119 |     </table>
120 |     
121 |     <h2 class="hasAnchor" id="value"><a class="anchor" href="#value"></a>Value</h2>
122 | 
123 |     <p>a data table</p>
124 |     
125 | 
126 |   </div>
127 |   <div class="col-md-3 hidden-xs hidden-sm" id="sidebar">
128 |     <h2>Contents</h2>
129 |     <ul class="nav nav-pills nav-stacked">
130 |       <li><a href="#arguments">Arguments</a></li>
131 |       
132 |       <li><a href="#value">Value</a></li>
133 |           </ul>
134 | 
135 |   </div>
136 | </div>
137 | 
138 |       <footer>
139 |       <div class="copyright">
140 |   <p>Developed by Ewelina Karbowiak, Przemyslaw Biecek.</p>
141 | </div>
142 | 
143 | <div class="pkgdown">
144 |   <p>Site built with <a href="http://hadley.github.io/pkgdown/">pkgdown</a>.</p>
145 | </div>
146 | 
147 |       </footer>
148 |    </div>
149 | 
150 |   </body>
151 | </html>
152 | 
153 | 


--------------------------------------------------------------------------------
/docs/reference/calculateGain.html:
--------------------------------------------------------------------------------
  1 | <!-- Generated by pkgdown: do not edit by hand -->
  2 | <!DOCTYPE html>
  3 | <html>
  4 |   <head>
  5 |   <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | 
  9 | <title>calculateGain — calculateGain • EIX</title>
 10 | 
 11 | <!-- jquery -->
 12 | <script src="https://code.jquery.com/jquery-3.1.0.min.js" integrity="sha384-nrOSfDHtoPMzJHjVTdCopGqIqeYETSXhZDFyniQ8ZHcVy08QesyHcnOUpMpqnmWq" crossorigin="anonymous"></script>
 13 | <!-- Bootstrap -->
 14 | 
 15 | <link href="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/css/bootstrap.min.css" rel="stylesheet" integrity="sha384-BVYiiSIFeK1dGmJRAkycuHAHRg32OmUcww7on3RYdg4Va+PmSTsz/K68vbdEjh4u" crossorigin="anonymous">
 16 | <script src="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha384-Tc5IQib027qvyjSMfHjOMaLkfuWVxZxUPnCJA7l2mCWNIpG9mGCD8wGNIcPD7Txa" crossorigin="anonymous"></script>
 17 | 
 18 | <!-- Font Awesome icons -->
 19 | <link href="https://maxcdn.bootstrapcdn.com/font-awesome/4.6.3/css/font-awesome.min.css" rel="stylesheet" integrity="sha384-T8Gy5hrqNKT+hzMclPo118YTQO6cYprQmhrYwIiQ/3axmI1hQomh7Ud2hPOy8SP1" crossorigin="anonymous">
 20 | 
 21 | 
 22 | <!-- pkgdown -->
 23 | <link href="../pkgdown.css" rel="stylesheet">
 24 | <script src="../jquery.sticky-kit.min.js"></script>
 25 | <script src="../pkgdown.js"></script>
 26 | <!-- mathjax -->
 27 | <script src='https://mathjax.rstudio.com/latest/MathJax.js?config=TeX-AMS-MML_HTMLorMML'></script>
 28 | 
 29 | <!--[if lt IE 9]>
 30 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 31 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 32 | <![endif]-->
 33 | 
 34 | 
 35 |   </head>
 36 | 
 37 |   <body>
 38 |     <div class="container template-reference-topic">
 39 |       <header>
 40 |       <div class="navbar navbar-default navbar-fixed-top navbar-mi2" role="navigation">
 41 |   <div class="container">
 42 |     <div class="navbar-header">
 43 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar">
 44 |         <span class="icon-bar"></span>
 45 |         <span class="icon-bar"></span>
 46 |         <span class="icon-bar"></span>
 47 |       </button>
 48 | 	  <a class = "navbar-mi2logo" href="http://mi2.mini.pw.edu.pl/">
 49 |         <img src = "https://github.com/mi2-warsaw/MI2template/blob/master/inst/pkgdown/assets/MI2logo.jpg?raw=true" alt = "MI2" height = 46 title = "MI2">
 50 | 	  </a>
 51 |       <a class="navbar-brand navbar-mi2" href="../index.html">calculateGain</a>
 52 |     </div>
 53 |     <div id="navbar" class="navbar-collapse collapse">
 54 |       <ul class="navbar-mi2 nav navbar-nav">
 55 |         <li>
 56 |   <a href="../index.html">
 57 |     <span class="fa fa-home fa-lg"></span>
 58 |      
 59 |   </a>
 60 | </li>
 61 | <li>
 62 |   <a href="../articles/EIX.html">Get started</a>
 63 | </li>
 64 | <li>
 65 |   <a href="../reference/index.html">Reference</a>
 66 | </li>
 67 | <li class="dropdown">
 68 |   <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-expanded="false">
 69 |     Articles
 70 |      
 71 |     <span class="caret"></span>
 72 |   </a>
 73 |   <ul class="dropdown-menu" role="menu">
 74 |     <li>
 75 |       <a href="../articles/titanic_data.html">EIX: Titanic data </a>
 76 |     </li>
 77 |   </ul>
 78 | </li>
 79 |       </ul>
 80 |       
 81 |       <ul class="nav navbar-nav navbar-right">
 82 |         <li>
 83 |   <a href="https://github.com/ModelOriented/EIX">
 84 |     <span class="fa fa-github fa-lg"></span>
 85 |      
 86 |   </a>
 87 | </li>
 88 |       </ul>
 89 |     </div><!--/.nav-collapse -->
 90 |   </div><!--/.container -->
 91 | </div><!--/.navbar -->
 92 | 
 93 |       
 94 |       </header>
 95 | 
 96 |       <div class="row">
 97 |   <div class="col-md-9 contents">
 98 |     <div class="page-header">
 99 |     <h1>calculateGain</h1>
100 |     </div>
101 | 
102 |     
103 |     <p>List of trees with pairs of variable and other needed fields</p>
104 |     
105 | 
106 |     <pre class="usage"><span class='fu'>calculateGain</span>(<span class='no'>xgb.model</span>, <span class='no'>data</span>)</pre>
107 |     
108 |     <h2 class="hasAnchor" id="arguments"><a class="anchor" href="#arguments"></a> Arguments</h2>
109 |     <table class="ref-arguments">
110 |     <colgroup><col class="name" /><col class="desc" /></colgroup>
111 |     <tr>
112 |       <th>xgb.model</th>
113 |       <td><p>a xgboost or lightgbm model</p></td>
114 |     </tr>
115 |     <tr>
116 |       <th>data</th>
117 |       <td><p>a data table with data used to train the model</p></td>
118 |     </tr>
119 |     </table>
120 |     
121 |     <h2 class="hasAnchor" id="value"><a class="anchor" href="#value"></a>Value</h2>
122 | 
123 |     <p>a list</p>
124 |     
125 | 
126 |   </div>
127 |   <div class="col-md-3 hidden-xs hidden-sm" id="sidebar">
128 |     <h2>Contents</h2>
129 |     <ul class="nav nav-pills nav-stacked">
130 |       <li><a href="#arguments">Arguments</a></li>
131 |       
132 |       <li><a href="#value">Value</a></li>
133 |           </ul>
134 | 
135 |   </div>
136 | </div>
137 | 
138 |       <footer>
139 |       <div class="copyright">
140 |   <p>Developed by Ewelina Karbowiak, Przemyslaw Biecek.</p>
141 | </div>
142 | 
143 | <div class="pkgdown">
144 |   <p>Site built with <a href="http://hadley.github.io/pkgdown/">pkgdown</a>.</p>
145 | </div>
146 | 
147 |       </footer>
148 |    </div>
149 | 
150 |   </body>
151 | </html>
152 | 
153 | 


--------------------------------------------------------------------------------
/R/calculateGain.R:
--------------------------------------------------------------------------------
  1 | #' calculateGain
  2 | #'
  3 | #' List of trees with pairs of variable and other needed fields
  4 | #'
  5 | #' @param xgb.model a xgboost or lightgbm model
  6 | #' @param data a data table with data used to train the model
  7 | #'
  8 | #' @return a list
  9 | #'
 10 | #' @import data.table
 11 | #'
 12 | #' @keywords internal
 13 | #'
 14 | 
 15 | # @import stats
 16 | # @import utils
 17 | calculateGain <- function(xgb.model, data) {
 18 | 
 19 |   leaf <- Feature <- Yes <- No <- ID <- parentsGain <- Quality <- parentsCover <-
 20 |     Cover <- name_pair <- childsGain <- depth <- parentsName <- NULL
 21 | 
 22 |   trees = tableOfTrees(xgb.model, data)
 23 |   trees[, leaf := Feature == "Leaf"]
 24 |   trees$depth <- 0
 25 |   treeList = split(trees, as.factor(trees$Tree))
 26 | 
 27 |   for (tree in treeList) {
 28 |     num_nodes = nrow(tree)
 29 |     non_leaf_rows = which(tree[, leaf] == F)
 30 |     for (r in non_leaf_rows) {
 31 |       left = tree[r, Yes]
 32 |       right = tree[r, No]
 33 |       if (tree[ID == left, leaf] == F) {
 34 |        # newDepth <- tree[r , depth] + 1
 35 |         tree[ID == left,`:=`(parentsGain = tree[r, Quality],
 36 |                              parentsCover = tree[r, Cover],
 37 |                              name_pair = paste(tree[r, Feature], tree[ID == left, Feature], sep = ":"),
 38 |                              childsGain = Quality,
 39 |                              depth = tree[r , depth] + 1,
 40 |                              parentsName = tree[r, Feature])]
 41 |         tree[ID == left, interaction := ((parentsGain < childsGain) & (Feature != parentsName))]
 42 |       }
 43 | 
 44 |       if (tree[ID == right, leaf]==F) {
 45 | 
 46 |         #newDepth <- tree[r , depth] + 1
 47 |         tree[ID == right, `:=`(parentsGain = tree[r, Quality],
 48 |                                parentsCover = tree[r, Cover],
 49 |                                name_pair = paste(tree[r, Feature], tree[ID == right, Feature], sep = ":"),
 50 |                                childsGain = Quality,
 51 |                                depth = tree[r , depth] + 1,
 52 |                                parentsName = tree[r, Feature])]
 53 |         tree[ID == right, interaction := ((parentsGain < childsGain) & (Feature != parentsName))]
 54 |       }
 55 |     }
 56 |   }
 57 | 
 58 |   return(treeList)
 59 | }
 60 | 
 61 | #'tableOfTrees
 62 | #'
 63 | #'tableOfTrees
 64 | #'
 65 | #' @param model a xgboost or lightgbm model
 66 | #' @param data a data table with data used to train the model
 67 | #'
 68 | #' @return a data table
 69 | #'
 70 | #' @import data.table
 71 | #' @importFrom xgboost xgb.model.dt.tree
 72 | #'
 73 | #' @keywords internal
 74 | #'
 75 | #  @import lightgbm
 76 | 
 77 | 
 78 | tableOfTrees <- function(model, data){
 79 |   count <- split_feature <- leaf_count <- internal_count <-
 80 |     split_index <- tree_index <- leaf_index <- threshold <-
 81 |     leaf_value <- split_gain <- flag <- node_parent <- leaf_parent<-
 82 |     Node <- Feature <- . <- Cover <- Yes <- No <- ID <-
 83 |     Tree<- Quality <- Missing <-Leaf_old_num<- Split <- NULL
 84 | 
 85 | 
 86 |   if(class(model)[1] == "xgb.Booster") {
 87 |     return(xgb.model.dt.tree(colnames(data), model)[])
 88 |   }
 89 |   if (class(model)[1] == "lgb.Booster") {
 90 |     lgb.trees <- lightgbm::lgb.model.dt.tree(model)
 91 | 
 92 |     lgb.trees <- lgb.trees[, count := ifelse(is.na(split_feature), leaf_count, internal_count)]
 93 | 
 94 |     lgb.trees <- lgb.trees[, max := max(split_index, na.rm = TRUE), by = tree_index]
 95 | 
 96 |     #UWAGA: nie jest tu istotne rodzaj nierówności, interesuje nas, że ktoś jest rodzicem, a nie, czy idzie w prawo i w lewo, dlatego losowe przypisanie Yes, No
 97 | 
 98 |     trees <- lgb.trees[, `:=`(Tree = tree_index,
 99 |                               Node = ifelse(is.na(split_index), max + leaf_index + 1, split_index),
100 |                               Feature = ifelse(is.na(split_feature), "Leaf", split_feature),
101 |                               Split = threshold, Missing = NA, Quality = ifelse(is.na(split_feature), leaf_value, split_gain),
102 |                               Cover = (1/4)*count,
103 |                               Leaf_old_num=leaf_index)]
104 |     trees[, `:=`(ID = paste(Tree, Node, sep = "-"))]
105 | 
106 |     trees[, flag := FALSE]
107 |     treeList = split(trees, as.factor(trees$Tree))
108 | 
109 |     for (tree in treeList) {
110 |       num_nodes = nrow(tree)
111 |       for (i in 1:num_nodes) {
112 |         if (is.na(tree[i, node_parent]) == FALSE) {
113 |           if (tree[Node == tree[i, node_parent] , flag] == FALSE) {
114 |             tree[Node == tree[i, node_parent] , Yes := paste(tree[i, Tree], tree[i, Node], sep = "-")]
115 |             tree[Node == tree[i, node_parent] , flag := TRUE]
116 |           } else{
117 |             tree[Node == tree[i, node_parent] , No := paste(tree[i, Tree], tree[i, Node], sep = "-")]
118 |           }
119 |         }
120 |         if (is.na(tree[i, leaf_parent]) == FALSE) {
121 |           if (tree[Node == tree[i, leaf_parent] , flag] == FALSE) {
122 |             tree[Node == tree[i, leaf_parent] , Yes := paste(tree[i, Tree], tree[i, Node], sep = "-")]
123 |             tree[Node == tree[i, leaf_parent] , flag := TRUE]
124 |           } else{
125 |             tree[Node == tree[i, leaf_parent] , No := paste(tree[i, Tree], tree[i, Node], sep = "-")]
126 |           }
127 |         }
128 |       }
129 |     }
130 |     trees <- rbindlist(treeList)
131 |     trees[, .(Tree, Node, ID, Feature, Split,  Yes, No, Missing,   Quality, Cover)]
132 |     return(trees[, .(Tree, Node, ID, Feature, Split,  Yes, No, Missing,   Quality, Cover,Leaf_old_num)][])
133 |   }
134 |   if (class(model)[1] != "xgb.Booster" || "lgb.Booster") {
135 |     return(cat( "You should choose one of two available models: xgboost, lightgbm \n" ))
136 |   }
137 | }
138 | 


--------------------------------------------------------------------------------
/docs/index.html:
--------------------------------------------------------------------------------
  1 | <!DOCTYPE html>
  2 | <!-- Generated by pkgdown: do not edit by hand --><html>
  3 | <head>
  4 | <meta http-equiv="Content-Type" content="text/html; charset=UTF-8">
  5 | <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | <title>Explain Interactions in 'XGBoost' • EIX</title>
  9 | <!-- jquery --><script src="https://code.jquery.com/jquery-3.1.0.min.js" integrity="sha384-nrOSfDHtoPMzJHjVTdCopGqIqeYETSXhZDFyniQ8ZHcVy08QesyHcnOUpMpqnmWq" crossorigin="anonymous"></script><!-- Bootstrap --><link href="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/css/bootstrap.min.css" rel="stylesheet" integrity="sha384-BVYiiSIFeK1dGmJRAkycuHAHRg32OmUcww7on3RYdg4Va+PmSTsz/K68vbdEjh4u" crossorigin="anonymous">
 10 | <script src="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha384-Tc5IQib027qvyjSMfHjOMaLkfuWVxZxUPnCJA7l2mCWNIpG9mGCD8wGNIcPD7Txa" crossorigin="anonymous"></script><!-- Font Awesome icons --><link href="https://maxcdn.bootstrapcdn.com/font-awesome/4.6.3/css/font-awesome.min.css" rel="stylesheet" integrity="sha384-T8Gy5hrqNKT+hzMclPo118YTQO6cYprQmhrYwIiQ/3axmI1hQomh7Ud2hPOy8SP1" crossorigin="anonymous">
 11 | <!-- pkgdown --><link href="pkgdown.css" rel="stylesheet">
 12 | <script src="jquery.sticky-kit.min.js"></script><script src="pkgdown.js"></script><!-- mathjax --><script src="https://mathjax.rstudio.com/latest/MathJax.js?config=TeX-AMS-MML_HTMLorMML"></script><!--[if lt IE 9]>
 13 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 14 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 15 | <![endif]-->
 16 | </head>
 17 | <body>
 18 |     <div class="container template-home">
 19 |       <header><div class="navbar navbar-default navbar-fixed-top navbar-mi2" role="navigation">
 20 |   <div class="container">
 21 |     <div class="navbar-header">
 22 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar">
 23 |         <span class="icon-bar"></span>
 24 |         <span class="icon-bar"></span>
 25 |         <span class="icon-bar"></span>
 26 |       </button>
 27 | 	  <a class="navbar-mi2logo" href="http://mi2.mini.pw.edu.pl/">
 28 |         <img src="https://github.com/mi2-warsaw/MI2template/blob/master/inst/pkgdown/assets/MI2logo.jpg?raw=true" alt="MI2" height="46" title="MI2"></a>
 29 |       <a class="navbar-brand navbar-mi2" href="index.html"></a>
 30 |     </div>
 31 |     <div id="navbar" class="navbar-collapse collapse">
 32 |       <ul class="navbar-mi2 nav navbar-nav">
 33 | <li>
 34 |   <a href="index.html">
 35 |     <span class="fa fa-home fa-lg"></span>
 36 |      
 37 |   </a>
 38 | </li>
 39 | <li>
 40 |   <a href="articles/EIX.html">Get started</a>
 41 | </li>
 42 | <li>
 43 |   <a href="reference/index.html">Reference</a>
 44 | </li>
 45 | <li class="dropdown">
 46 |   <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-expanded="false">
 47 |     Articles
 48 |      
 49 |     <span class="caret"></span>
 50 |   </a>
 51 |   <ul class="dropdown-menu" role="menu">
 52 | <li>
 53 |       <a href="articles/titanic_data.html">EIX: Titanic data </a>
 54 |     </li>
 55 |   </ul>
 56 | </li>
 57 |       </ul>
 58 | <ul class="nav navbar-nav navbar-right">
 59 | <li>
 60 |   <a href="https://github.com/ModelOriented/EIX">
 61 |     <span class="fa fa-github fa-lg"></span>
 62 |      
 63 |   </a>
 64 | </li>
 65 |       </ul>
 66 | </div>
 67 | <!--/.nav-collapse -->
 68 |   </div>
 69 | <!--/.container -->
 70 | </div>
 71 | <!--/.navbar -->
 72 | 
 73 |       
 74 |       </header><div class="row">
 75 |   <div class="contents col-md-9">
 76 |     
 77 | <div id="eix---explain-interactions-in-xgboost" class="section level2">
 78 | <h2 class="hasAnchor">
 79 | <a href="#eix---explain-interactions-in-xgboost" class="anchor"></a>EIX - Explain Interactions in Xgboost</h2>
 80 | <p>A set of tools to explain XGBoost and LightGBM models.</p>
 81 | </div>
 82 | <div id="installation" class="section level2">
 83 | <h2 class="hasAnchor">
 84 | <a href="#installation" class="anchor"></a>Installation</h2>
 85 | <p>Install from GitHub</p>
 86 | <pre class="{r}"><code><a href="https://www.rdocumentation.org/packages/devtools/topics/install_github">devtools::install_github("ModelOriented/EIX")</a></code></pre>
 87 | </div>
 88 | <div id="cheatsheets" class="section level2">
 89 | <h2 class="hasAnchor">
 90 | <a href="#cheatsheets" class="anchor"></a>Cheatsheets</h2>
 91 | <p><img src="https://raw.githubusercontent.com/ekarbowiak/EIX/master/cheatsheets/EIX.png"></p>
 92 | </div>
 93 | 
 94 |   </div>
 95 | 
 96 |   <div class="col-md-3" id="sidebar">
 97 |   	<div class="sidebar-logo">
 98 | 	 <p>
 99 | 		This package is developed by the <a href="http://mi2.mini.pw.edu.pl">MI^2 group</a>. MI^2 (pronounce: Am I square?) is a group of mathematicians and computer scientists that love to play with data. We create tools, do consulting and share our positive attitude. 
100 | 	 </p>
101 | 	</div>
102 |     <div class="links">
103 | <h2>Links</h2>
104 | <ul class="list-unstyled">
105 | <li>Browse source code at <br><a href="https://github.com/ModelOriented/EIX">https://​github.com/​ModelOriented/​EIX</a>
106 | </li>
107 | <li>Report a bug at <br><a href="https://github.com/ModelOriented/EIX/issues">https://​github.com/​ModelOriented/​EIX/​issues</a>
108 | </li>
109 | </ul>
110 | </div>
111 | <div class="license">
112 | <h2>License</h2>
113 | <ul class="list-unstyled">
114 | <li><a href="https://www.r-project.org/Licenses/GPL-2">GPL-2</a></li>
115 | </ul>
116 | </div>
117 | <div class="developers">
118 | <h2>Developers</h2>
119 | <ul class="list-unstyled">
120 | <li>Ewelina Karbowiak <br><small class="roles"> Author, maintainer </small>  </li>
121 | <li>Przemyslaw Biecek <br><small class="roles"> Author, thesis advisor </small>  </li>
122 | </ul>
123 | </div>
124 | 
125 |   </div>
126 | </div>
127 | 
128 | 
129 |       <footer><div class="copyright">
130 |   <p>Developed by Ewelina Karbowiak, Przemyslaw Biecek.</p>
131 | </div>
132 | 
133 | <div class="pkgdown">
134 |   <p>Site built with <a href="http://hadley.github.io/pkgdown/">pkgdown</a>.</p>
135 | </div>
136 | 
137 |       </footer>
138 | </div>
139 | 
140 |   </body>
141 | </html>
142 | 


--------------------------------------------------------------------------------
/docs/reference/HR_data.html:
--------------------------------------------------------------------------------
  1 | <!-- Generated by pkgdown: do not edit by hand -->
  2 | <!DOCTYPE html>
  3 | <html>
  4 |   <head>
  5 |   <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | 
  9 | <title>Why are our best and most experienced employees leaving prematurely? — HR_data • EIX</title>
 10 | 
 11 | <!-- jquery -->
 12 | <script src="https://code.jquery.com/jquery-3.1.0.min.js" integrity="sha384-nrOSfDHtoPMzJHjVTdCopGqIqeYETSXhZDFyniQ8ZHcVy08QesyHcnOUpMpqnmWq" crossorigin="anonymous"></script>
 13 | <!-- Bootstrap -->
 14 | 
 15 | <link href="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/css/bootstrap.min.css" rel="stylesheet" integrity="sha384-BVYiiSIFeK1dGmJRAkycuHAHRg32OmUcww7on3RYdg4Va+PmSTsz/K68vbdEjh4u" crossorigin="anonymous">
 16 | <script src="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha384-Tc5IQib027qvyjSMfHjOMaLkfuWVxZxUPnCJA7l2mCWNIpG9mGCD8wGNIcPD7Txa" crossorigin="anonymous"></script>
 17 | 
 18 | <!-- Font Awesome icons -->
 19 | <link href="https://maxcdn.bootstrapcdn.com/font-awesome/4.6.3/css/font-awesome.min.css" rel="stylesheet" integrity="sha384-T8Gy5hrqNKT+hzMclPo118YTQO6cYprQmhrYwIiQ/3axmI1hQomh7Ud2hPOy8SP1" crossorigin="anonymous">
 20 | 
 21 | 
 22 | <!-- pkgdown -->
 23 | <link href="../pkgdown.css" rel="stylesheet">
 24 | <script src="../jquery.sticky-kit.min.js"></script>
 25 | <script src="../pkgdown.js"></script>
 26 | <!-- mathjax -->
 27 | <script src='https://mathjax.rstudio.com/latest/MathJax.js?config=TeX-AMS-MML_HTMLorMML'></script>
 28 | 
 29 | <!--[if lt IE 9]>
 30 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 31 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 32 | <![endif]-->
 33 | 
 34 | 
 35 |   </head>
 36 | 
 37 |   <body>
 38 |     <div class="container template-reference-topic">
 39 |       <header>
 40 |       <div class="navbar navbar-default navbar-fixed-top navbar-mi2" role="navigation">
 41 |   <div class="container">
 42 |     <div class="navbar-header">
 43 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar">
 44 |         <span class="icon-bar"></span>
 45 |         <span class="icon-bar"></span>
 46 |         <span class="icon-bar"></span>
 47 |       </button>
 48 | 	  <a class = "navbar-mi2logo" href="http://mi2.mini.pw.edu.pl/">
 49 |         <img src = "https://github.com/mi2-warsaw/MI2template/blob/master/inst/pkgdown/assets/MI2logo.jpg?raw=true" alt = "MI2" height = 46 title = "MI2">
 50 | 	  </a>
 51 |       <a class="navbar-brand navbar-mi2" href="../index.html">Why are our best and most experienced employees leaving prematurely?</a>
 52 |     </div>
 53 |     <div id="navbar" class="navbar-collapse collapse">
 54 |       <ul class="navbar-mi2 nav navbar-nav">
 55 |         <li>
 56 |   <a href="../index.html">
 57 |     <span class="fa fa-home fa-lg"></span>
 58 |      
 59 |   </a>
 60 | </li>
 61 | <li>
 62 |   <a href="../articles/EIX.html">Get started</a>
 63 | </li>
 64 | <li>
 65 |   <a href="../reference/index.html">Reference</a>
 66 | </li>
 67 | <li class="dropdown">
 68 |   <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-expanded="false">
 69 |     Articles
 70 |      
 71 |     <span class="caret"></span>
 72 |   </a>
 73 |   <ul class="dropdown-menu" role="menu">
 74 |     <li>
 75 |       <a href="../articles/titanic_data.html">EIX: Titanic data </a>
 76 |     </li>
 77 |   </ul>
 78 | </li>
 79 |       </ul>
 80 |       
 81 |       <ul class="nav navbar-nav navbar-right">
 82 |         <li>
 83 |   <a href="https://github.com/ModelOriented/EIX">
 84 |     <span class="fa fa-github fa-lg"></span>
 85 |      
 86 |   </a>
 87 | </li>
 88 |       </ul>
 89 |     </div><!--/.nav-collapse -->
 90 |   </div><!--/.container -->
 91 | </div><!--/.navbar -->
 92 | 
 93 |       
 94 |       </header>
 95 | 
 96 |       <div class="row">
 97 |   <div class="col-md-9 contents">
 98 |     <div class="page-header">
 99 |     <h1>Why are our best and most experienced employees leaving prematurely?</h1>
100 |     </div>
101 | 
102 |     
103 |     <p>A dataset from Kaggle competition Human Resources Analytics.
104 | https://www.kaggle.com/ludobenistant/hr-analytics/data</p>
105 |     
106 | 
107 |         
108 |     <h2 class="hasAnchor" id="format"><a class="anchor" href="#format"></a>Format</h2>
109 | 
110 |     <p>A data table with 14999 rows and 10 variables</p>
111 |     
112 |     <h2 class="hasAnchor" id="source"><a class="anchor" href="#source"></a>Source</h2>
113 | 
114 |     <p>https://www.kaggle.com/ludobenistant/hr-analytics/data, <a href='https://cran.r-project.org/package=breakDown'>https://cran.r-project.org/package=breakDown</a></p>
115 |     
116 |     <h2 class="hasAnchor" id="details"><a class="anchor" href="#details"></a>Details</h2>
117 | 
118 |     <p>The description of the dataset was copied from the <code>breakDown</code> package.</p>
119 | <ul>
120 | <li><p>satisfaction_level Level of satisfaction (0-1)</p></li>
121 | <li><p>last_evaluation Time since last performance evaluation (in Years)</p></li>
122 | <li><p>number_project  Number of projects completed while at work</p></li>
123 | <li><p>average_montly_hours  Average monthly hours at workplace</p></li>
124 | <li><p>time_spend_company  Number of years spent in the company</p></li>
125 | <li><p>Work_accident  Whether the employee had a workplace accident</p></li>
126 | <li><p>left  Whether the employee left the workplace or not (1 or 0) Factor</p></li>
127 | <li><p>promotion_last_5years  Whether the employee was promoted in the last five years</p></li>
128 | <li><p>sales  Department in which they work for</p></li>
129 | <li><p>salary  Relative level of salary (high)</p></li>
130 | </ul>
131 |     
132 | 
133 |   </div>
134 |   <div class="col-md-3 hidden-xs hidden-sm" id="sidebar">
135 |     <h2>Contents</h2>
136 |     <ul class="nav nav-pills nav-stacked">
137 |       
138 |       <li><a href="#format">Format</a></li>
139 | 
140 |       <li><a href="#source">Source</a></li>
141 | 
142 |       <li><a href="#details">Details</a></li>
143 |           </ul>
144 | 
145 |   </div>
146 | </div>
147 | 
148 |       <footer>
149 |       <div class="copyright">
150 |   <p>Developed by Ewelina Karbowiak, Przemyslaw Biecek.</p>
151 | </div>
152 | 
153 | <div class="pkgdown">
154 |   <p>Site built with <a href="http://hadley.github.io/pkgdown/">pkgdown</a>.</p>
155 | </div>
156 | 
157 |       </footer>
158 |    </div>
159 | 
160 |   </body>
161 | </html>
162 | 
163 | 


--------------------------------------------------------------------------------
/R/plot_importance.R:
--------------------------------------------------------------------------------
  1 | #' Plot importance measures
  2 | #'
  3 | #' This function plots selected measures of importance for variables and interactions.
  4 | #' It is possible to visualise importance table in two ways: radar plot with six measures
  5 | #' and scatter plot with two chosen measures.
  6 | #'
  7 | #' Available measures:
  8 | #'\itemize{
  9 | #'\item "sumGain" - sum of Gain value in all nodes, in which given variable occurs,
 10 | #'\item "sumCover" - sum of Cover value in all nodes, in which given variable occurs; for LightGBM models: number of observation, which pass through the node,
 11 | #'\item "mean5Gain" - mean gain from 5 occurrences of given variable with the highest gain,
 12 | #'\item "meanGain" - mean Gain value in all nodes, in which given variable occurs,
 13 | #'\item "meanCover" - mean Cover value in all nodes, in which given variable occurs; for LightGBM models: mean number of observation, which pass through the node,
 14 | #'\item "frequency" - number of occurrences in the nodes for given variable.
 15 | #'}
 16 | #'
 17 | #' Additionally for plots with single variables:
 18 | #'\itemize{
 19 | #'\item "meanDepth"  - mean depth weighted by gain,
 20 | #'\item "numberOfRoots" - number of occurrences in the root,
 21 | #'\item "weightedRoot" - mean number of occurrences in the root, which is weighted by gain.
 22 | #'}
 23 | #'
 24 | #' @param x a result from the \code{importance} function.
 25 | #' @param top number of positions on the plot or NULL for all variables. Default 10.
 26 | #' @param radar TRUE/FALSE. If TRUE the plot shows
 27 | #'               six measures of variables' or interactions' importance in the model.
 28 | #'               If FALSE the plot containing two chosen measures
 29 | #'               of variables' or interactions' importance in the model.
 30 | #' @param text_start_point place, where the names of the particular feature start. Available for `radar=TRUE`. Range from 0 to 1. Default 0.5.
 31 | #' @param text_size size of the text on the plot. Default 3.5.
 32 | #' @param xmeasure measure on the x-axis. Available for `radar=FALSE`. Default "sumCover".
 33 | #' @param ymeasure measure on the y-axis. Available for `radar=FALSE`. Default "sumGain".
 34 | #' @param ... other parameters.
 35 | #'
 36 | #' @return a ggplot object
 37 | #'
 38 | #' @import ggplot2
 39 | #' @import data.table
 40 | #' @importFrom DALEX theme_drwhy
 41 | #' @importFrom ggrepel geom_label_repel
 42 | #' @importFrom ggiraphExtra coord_radar
 43 | #'
 44 | #' @examples
 45 | #' library("EIX")
 46 | #' library("Matrix")
 47 | #' sm <- sparse.model.matrix(left ~ . - 1,  data = HR_data)
 48 | #'
 49 | #' library("xgboost")
 50 | #' param <- list(objective = "binary:logistic", max_depth = 2)
 51 | #' xgb_model <- xgboost(sm, params = param, label = HR_data[, left] == 1, nrounds = 25, verbose=0)
 52 | #'
 53 | #' imp <- importance(xgb_model, sm, option = "both")
 54 | #' imp
 55 | #' plot(imp,  top = 10)
 56 | #'
 57 | #' imp <- importance(xgb_model, sm, option = "variables")
 58 | #' imp
 59 | #' plot(imp,  top = nrow(imp))
 60 | #'
 61 | #'  imp <- importance(xgb_model, sm, option = "interactions")
 62 | #'  imp
 63 | #' plot(imp,  top =  nrow(imp))
 64 | #'
 65 | #'  imp <- importance(xgb_model, sm, option = "variables")
 66 | #'  imp
 67 | #' plot(imp, top = NULL, radar = FALSE, xmeasure = "sumCover", ymeasure = "sumGain")
 68 | #'
 69 | #'\donttest{
 70 | #'library(lightgbm)
 71 | #'train_data <- lgb.Dataset(sm, label =  HR_data[, left] == 1)
 72 | #'params <- list(objective = "binary", max_depth = 2)
 73 | #'lgb_model <- lgb.train(params, train_data, 25)
 74 | #'
 75 | #' imp <- importance(lgb_model, sm, option = "both")
 76 | #' imp
 77 | #' plot(imp,  top = nrow(imp))
 78 | #'
 79 | #' imp <- importance(lgb_model, sm, option = "variables")
 80 | #' imp
 81 | #' plot(imp, top = NULL, radar = FALSE, xmeasure = "sumCover", ymeasure = "sumGain")
 82 | #'
 83 | #'}
 84 | #'
 85 | #' @export
 86 | 
 87 | 
 88 | plot.importance <- function(x, ...,  top = 10, radar = TRUE, text_start_point = 0.5, text_size=3.5,
 89 |                                  xmeasure = "sumCover", ymeasure = "sumGain"){
 90 | 
 91 |   Feature <- sumGain <- sumCover <- meanGain <- meanCover <-
 92 |     mean5Gain <- . <- value <- variable <- hjust <- NULL
 93 | 
 94 |   if (is.null(top))
 95 |     top <- nrow(x)
 96 | 
 97 | 
 98 |   if (radar == FALSE) {
 99 |     ggplot(data.frame(x[1:top, ]),
100 |            aes_string(x = xmeasure, y = ymeasure, label = "Feature")) +
101 |       geom_point() +
102 |       scale_size() + geom_label_repel() + theme_drwhy()
103 | 
104 |   }else{
105 |     import <- as.data.table(x[1:top, ])
106 |     import <- import[1:top, .(Feature,
107 |                               sumGain = sumGain / max(import[, sumGain]),
108 |                               sumCover = sumCover / max(import[, sumCover]),
109 |                               meanGain = meanGain / max(import[, meanGain]),
110 |                               meanCover = meanCover / max(import[, meanCover]),
111 |                               mean5Gain = mean5Gain / max(import[, mean5Gain]),
112 |                               frequency = frequency / max(import[, frequency]))]
113 |     data<-import[,Feature:= ifelse(nchar(import[,Feature])>20, gsub(":", ": :",import[,Feature]),Feature)]
114 | 
115 |     import$Feature <- factor(import$Feature, levels = import$Feature[order(import$sumGain, decreasing = TRUE)])
116 | 
117 |     #angles and hjust of labels
118 |     numberOfBars=nrow(import)
119 |     angle= 90-360*(row(import)[,1]-0.5)/numberOfBars
120 | 
121 |     import$hjust<-ifelse( angle < -90, 1, 0)
122 |     import$angle<-ifelse(angle < -90, angle+180, angle)
123 | 
124 |     data_to_plot <- melt(import, id = c(1,8,9), measures = 2:6, value.factor = FALSE)
125 |     data<-data_to_plot[,.(hjust=mean(hjust),angle=mean(angle)), by=Feature]
126 | 
127 |     ggplot(data.frame(data_to_plot),
128 |            aes(x = Feature, y = value, colour = variable, group = variable)) +
129 |       geom_line(size = 1.5) +
130 |       geom_point(size = 2.5) +
131 |       theme_drwhy() +
132 |       theme(axis.title.x = element_blank(),
133 |             axis.title.y = element_blank(),
134 |             legend.position = "bottom",
135 |             panel.grid.major.y = element_line(colour = "gray68", linetype = "dashed", size = 0.4),
136 |             axis.line = element_blank(),
137 |             axis.text.x=element_blank(),) +
138 |       labs(fill = "Measures")+
139 |       coord_radar() +
140 |       geom_text(data=data, aes(x=Feature, y= rep(text_start_point,top), label=lapply(strwrap(data[,Feature], width = 10, simplify = FALSE), paste, collapse="\n"), hjust=hjust), color="#371ea3", fontface="bold",alpha=0.6, size=text_size, angle= data$angle, inherit.aes = FALSE )
141 | 
142 |   }
143 | }
144 | 


--------------------------------------------------------------------------------
/docs/reference/index.html:
--------------------------------------------------------------------------------
  1 | <!-- Generated by pkgdown: do not edit by hand -->
  2 | <!DOCTYPE html>
  3 | <html>
  4 |   <head>
  5 |   <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | 
  9 | <title>Function reference • EIX</title>
 10 | 
 11 | <!-- jquery -->
 12 | <script src="https://code.jquery.com/jquery-3.1.0.min.js" integrity="sha384-nrOSfDHtoPMzJHjVTdCopGqIqeYETSXhZDFyniQ8ZHcVy08QesyHcnOUpMpqnmWq" crossorigin="anonymous"></script>
 13 | <!-- Bootstrap -->
 14 | 
 15 | <link href="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/css/bootstrap.min.css" rel="stylesheet" integrity="sha384-BVYiiSIFeK1dGmJRAkycuHAHRg32OmUcww7on3RYdg4Va+PmSTsz/K68vbdEjh4u" crossorigin="anonymous">
 16 | <script src="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha384-Tc5IQib027qvyjSMfHjOMaLkfuWVxZxUPnCJA7l2mCWNIpG9mGCD8wGNIcPD7Txa" crossorigin="anonymous"></script>
 17 | 
 18 | <!-- Font Awesome icons -->
 19 | <link href="https://maxcdn.bootstrapcdn.com/font-awesome/4.6.3/css/font-awesome.min.css" rel="stylesheet" integrity="sha384-T8Gy5hrqNKT+hzMclPo118YTQO6cYprQmhrYwIiQ/3axmI1hQomh7Ud2hPOy8SP1" crossorigin="anonymous">
 20 | 
 21 | 
 22 | <!-- pkgdown -->
 23 | <link href="../pkgdown.css" rel="stylesheet">
 24 | <script src="../jquery.sticky-kit.min.js"></script>
 25 | <script src="../pkgdown.js"></script>
 26 | <!-- mathjax -->
 27 | <script src='https://mathjax.rstudio.com/latest/MathJax.js?config=TeX-AMS-MML_HTMLorMML'></script>
 28 | 
 29 | <!--[if lt IE 9]>
 30 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 31 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 32 | <![endif]-->
 33 | 
 34 | 
 35 |   </head>
 36 | 
 37 |   <body>
 38 |     <div class="container template-reference-index">
 39 |       <header>
 40 |       <div class="navbar navbar-default navbar-fixed-top navbar-mi2" role="navigation">
 41 |   <div class="container">
 42 |     <div class="navbar-header">
 43 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar">
 44 |         <span class="icon-bar"></span>
 45 |         <span class="icon-bar"></span>
 46 |         <span class="icon-bar"></span>
 47 |       </button>
 48 | 	  <a class = "navbar-mi2logo" href="http://mi2.mini.pw.edu.pl/">
 49 |         <img src = "https://github.com/mi2-warsaw/MI2template/blob/master/inst/pkgdown/assets/MI2logo.jpg?raw=true" alt = "MI2" height = 46 title = "MI2">
 50 | 	  </a>
 51 |       <a class="navbar-brand navbar-mi2" href="../index.html"></a>
 52 |     </div>
 53 |     <div id="navbar" class="navbar-collapse collapse">
 54 |       <ul class="navbar-mi2 nav navbar-nav">
 55 |         <li>
 56 |   <a href="../index.html">
 57 |     <span class="fa fa-home fa-lg"></span>
 58 |      
 59 |   </a>
 60 | </li>
 61 | <li>
 62 |   <a href="../articles/EIX.html">Get started</a>
 63 | </li>
 64 | <li>
 65 |   <a href="../reference/index.html">Reference</a>
 66 | </li>
 67 | <li class="dropdown">
 68 |   <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-expanded="false">
 69 |     Articles
 70 |      
 71 |     <span class="caret"></span>
 72 |   </a>
 73 |   <ul class="dropdown-menu" role="menu">
 74 |     <li>
 75 |       <a href="../articles/titanic_data.html">EIX: Titanic data </a>
 76 |     </li>
 77 |   </ul>
 78 | </li>
 79 |       </ul>
 80 |       
 81 |       <ul class="nav navbar-nav navbar-right">
 82 |         <li>
 83 |   <a href="https://github.com/ModelOriented/EIX">
 84 |     <span class="fa fa-github fa-lg"></span>
 85 |      
 86 |   </a>
 87 | </li>
 88 |       </ul>
 89 |     </div><!--/.nav-collapse -->
 90 |   </div><!--/.container -->
 91 | </div><!--/.navbar -->
 92 | 
 93 |       
 94 |       </header>
 95 | 
 96 |       <div class="row">
 97 |   <div class="col-md-9">
 98 |     <div class="page-header">
 99 |       <h1>
100 |         Reference
101 |         <small>version&nbsp;1.0</small>
102 |       </h1>
103 |     </div>
104 | 
105 |     <div class="contents">
106 |       <table class="ref-index">
107 | 
108 |       <colgroup>
109 |         <col class="alias" />
110 |         <col class="title" />
111 |       </colgroup>
112 | 
113 |       <tbody>
114 |         <tr>
115 |           <th colspan="2">
116 |             <h2 id="section-all-functions" class="hasAnchor"><a href="#section-all-functions" class="anchor"></a>All functions</h2>
117 |             <p class="section-desc"></p>
118 |           </th>
119 |         </tr>
120 |         <tr>
121 |           <!--  -->
122 |           <td>
123 |             <p><code><a href="HR_data.html">HR_data</a></code> </p>
124 |           </td>
125 |           <td><p>Why are our best and most experienced employees leaving prematurely?</p></td>
126 |         </tr><tr>
127 |           <!--  -->
128 |           <td>
129 |             <p><code><a href="importance.html">importance()</a></code> </p>
130 |           </td>
131 |           <td><p>Importance of variables and interactions in the model</p></td>
132 |         </tr><tr>
133 |           <!--  -->
134 |           <td>
135 |             <p><code><a href="interactions.html">interactions()</a></code> </p>
136 |           </td>
137 |           <td><p>Importance of interactions and pairs in the model</p></td>
138 |         </tr><tr>
139 |           <!--  -->
140 |           <td>
141 |             <p><code><a href="lollipop.html">lollipop()</a></code> </p>
142 |           </td>
143 |           <td><p>Tables needed for lollipop plot</p></td>
144 |         </tr><tr>
145 |           <!--  -->
146 |           <td>
147 |             <p><code><a href="plot.importance.html">plot(<i>&lt;importance&gt;</i>)</a></code> </p>
148 |           </td>
149 |           <td><p>Plot importance measures</p></td>
150 |         </tr><tr>
151 |           <!--  -->
152 |           <td>
153 |             <p><code><a href="plot.interactions.html">plot(<i>&lt;interactions&gt;</i>)</a></code> </p>
154 |           </td>
155 |           <td><p>Plot importance of interactions or pairs</p></td>
156 |         </tr><tr>
157 |           <!--  -->
158 |           <td>
159 |             <p><code><a href="plot.lollipop.html">plot(<i>&lt;lollipop&gt;</i>)</a></code> </p>
160 |           </td>
161 |           <td><p>Visualisation of the model</p></td>
162 |         </tr><tr>
163 |           <!--  -->
164 |           <td>
165 |             <p><code><a href="titanic_data.html">titanic_data</a></code> </p>
166 |           </td>
167 |           <td><p>Passengers and Crew on the RMS Titanic</p></td>
168 |         </tr><tr>
169 |           <!--  -->
170 |           <td>
171 |             <p><code><a href="waterfall.html">waterfall()</a></code> </p>
172 |           </td>
173 |           <td><p>Explain prediction of a single observation</p></td>
174 |         </tr>
175 |       </tbody>
176 |       </table>
177 |     </div>
178 |   </div>
179 | 
180 |   <div class="col-md-3 hidden-xs hidden-sm" id="sidebar">
181 |     <h2>Contents</h2>
182 |     <ul class="nav nav-pills nav-stacked contents-mi2">
183 |       <li><a href="#section-all-functions">All functions</a></li>
184 |     </ul>
185 |   </div>
186 | </div>
187 | 
188 |       <footer>
189 |       <div class="copyright">
190 |   <p>Developed by Ewelina Karbowiak, Przemyslaw Biecek.</p>
191 | </div>
192 | 
193 | <div class="pkgdown">
194 |   <p>Site built with <a href="http://hadley.github.io/pkgdown/">pkgdown</a>.</p>
195 | </div>
196 | 
197 |       </footer>
198 |    </div>
199 | 
200 |   </body>
201 | </html>
202 | 
203 | 


--------------------------------------------------------------------------------
/R/importance.R:
--------------------------------------------------------------------------------
  1 | #' Importance of variables and interactions in the model
  2 | #'
  3 | #' This function calculates a table with selected measures of importance
  4 | #' for variables and interactions.
  5 | #'
  6 | #' Available measures:
  7 | #'\itemize{
  8 | #'\item "sumGain" - sum of Gain value in all nodes, in which given variable occurs,
  9 | #'\item "sumCover" - sum of Cover value in all nodes, in which given variable occurs; for LightGBM models: number of observation, which pass through the node,
 10 | #'\item "mean5Gain" - mean gain from 5 occurrences of given variable with the highest gain,
 11 | #'\item "meanGain" - mean Gain value in all nodes, in which given variable occurs,
 12 | #'\item "meanCover" - mean Cover value in all nodes, in which given variable occurs; for LightGBM models: mean number of observation, which pass through the node,
 13 | #'\item "frequency" - number of occurrences in the nodes for given variable.
 14 | #'}
 15 | #'
 16 | #' Additionally for table with single variables:
 17 | #'\itemize{
 18 | #'\item "meanDepth"  - mean depth weighted by gain,
 19 | #'\item "numberOfRoots" - number of occurrences in the root,
 20 | #'\item "weightedRoot" - mean number of occurrences in the root, which is weighted by gain.
 21 | #'}
 22 | #'
 23 | #' @param xgb_model a xgboost or lightgbm model.
 24 | #' @param data a data table with data used to train the model.
 25 | #' @param option if "variables" then table includes only single variables,
 26 | #'            if "interactions", then only interactions
 27 | #'            if "both", then both single variable and interactions.
 28 | #'            Default "both".
 29 | #' @param digits number of significant digits that shall be returned. Will be passed to the signif() functions.
 30 | #'
 31 | #' @return a data table
 32 | #'
 33 | #' @import data.table
 34 | #' @importFrom stats frequency
 35 | #' @importFrom stats weighted.mean
 36 | #'
 37 | #' @examples
 38 | #' library("EIX")
 39 | #' library("Matrix")
 40 | #' sm <- sparse.model.matrix(left ~ . - 1,  data = HR_data)
 41 | #'
 42 | #' library("xgboost")
 43 | #' param <- list(objective = "binary:logistic", max_depth = 2)
 44 | #' xgb_model <- xgboost(sm, params = param, label = HR_data[, left] == 1, nrounds = 25, verbose=0)
 45 | #'
 46 | #' imp <- importance(xgb_model, sm, option = "both")
 47 | #' imp
 48 | #' plot(imp,  top = 10)
 49 | #'
 50 | #' imp <- importance(xgb_model, sm, option = "variables")
 51 | #' imp
 52 | #' plot(imp,  top = nrow(imp))
 53 | #'
 54 | #'  imp <- importance(xgb_model, sm, option = "interactions")
 55 | #'  imp
 56 | #' plot(imp,  top =  nrow(imp))
 57 | #'
 58 | #'  imp <- importance(xgb_model, sm, option = "variables")
 59 | #'  imp
 60 | #' plot(imp, top = NULL, radar = FALSE, xmeasure = "sumCover", ymeasure = "sumGain")
 61 | #'
 62 | #'\donttest{
 63 | #'library(lightgbm)
 64 | #'train_data <- lgb.Dataset(sm, label =  HR_data[, left] == 1)
 65 | #'params <- list(objective = "binary", max_depth = 2)
 66 | #'lgb_model <- lgb.train(params, train_data, 25)
 67 | #'
 68 | #' imp <- importance(lgb_model, sm, option = "both")
 69 | #' imp
 70 | #' plot(imp,  top = nrow(imp))
 71 | #'
 72 | #' imp <- importance(lgb_model, sm, option = "variables")
 73 | #' imp
 74 | #' plot(imp, top = NULL, radar = FALSE, xmeasure = "sumCover", ymeasure = "sumGain")
 75 | #'
 76 | #'}
 77 | #'
 78 | #' @export
 79 | 
 80 | importance <- function(xgb_model, data, option = "both", digits = 4){
 81 |   importance <- NULL
 82 | 
 83 |   if (option == "both") {
 84 |     importance <- importanceTableMixed(xgb_model, data)
 85 |   }
 86 |   if (option == "variables") {
 87 |     importance <- importanceSingleVariable(xgb_model, data)
 88 |   }
 89 |   if (option == "interactions") {
 90 |     importance <- importanceInteraction(xgb_model, data)
 91 |   }
 92 | 
 93 |   importance <- cbind(importance[, 1], signif(importance[, -1], digits = digits))
 94 |   #importance <- unlist(importance)
 95 | 
 96 |   class(importance) <- c("importance", "data.table")
 97 | 
 98 |   return(importance[])
 99 | 
100 | }
101 | 
importanceTableMixed <- function(xgb_model, data){
  # Placeholders for names used through data.table non-standard evaluation.
  parentsGain <- childsGain <- name_pair <- Cover <- Feature <-
    Gain <- indx <- . <- Quality <- NULL

  nodes <- noLeavesGainTable(xgb_model, data)

  # Nodes that are not flagged as an interaction (FALSE or NA) contribute
  # under their own feature name with the node's Quality as gain.
  single_rows <- nodes[(interaction == FALSE) | (is.na(interaction)),
                       .(Feature, Gain = Quality, Cover)]

  # Interaction nodes contribute under the pair name with the child's gain.
  pair_rows <- nodes[interaction == TRUE,
                     .(Feature = name_pair, Gain = childsGain, Cover)]

  all_rows <- rbind(single_rows, pair_rows)

  # Per-feature aggregates are computed before mean5gain() is called,
  # mirroring the evaluation order of the merge() arguments.
  per_feature <- all_rows[, .(sumGain = sum(Gain),
                              sumCover = sum(Cover),
                              meanGain = mean(Gain),
                              meanCover = mean(Cover),
                              frequency = .N), by = Feature]
  top5 <- mean5gain(all_rows)

  result <- merge(per_feature, top5, by = "Feature")
  setorderv(result, "sumGain", -1)

  return(result[])

}
130 | 
131 | 
importanceInteraction <- function(xgb_model, data) {
  # Placeholders for names used through data.table non-standard evaluation.
  parentsGain <- childsGain <- name_pair <- Cover <- . <- Feature <- Gain <- indx <- NULL

  # Keep only interaction nodes, reduced to the three columns needed below.
  # Each row is named after the pair and carries the child's gain.
  # (The original assigned this reduced table to a misspelled, unused
  # variable and kept working on the full table.)
  trees <- noLeavesGainTable(xgb_model, data)
  trees <- trees[interaction == TRUE,
                 .(Feature = name_pair, Gain = childsGain, Cover)]

  per_pair <- trees[, .(sumGain = sum(Gain),
                        sumCover = sum(Cover),
                        meanGain = mean(Gain),
                        meanCover = mean(Cover),
                        frequency = .N), by = Feature]

  importance <- merge(per_pair, mean5gain(trees), by = "Feature")

  # Most important interaction first.
  setorderv(importance, "sumGain", -1)

  return(importance[])
}
150 | 
151 | 
importanceSingleVariable <- function(xgb_model, data) {
  # Placeholders for names used through data.table non-standard evaluation.
  Feature <- Gain <- Quality <- Cover <- indx <- . <- NULL

  nodes <- noLeavesGainTable(xgb_model, data)
  nodes[, Gain := Quality]

  # Root statistics and gain-weighted depth; the root table's own sumGain is
  # dropped because sumGain is recomputed over all nodes below.
  root_stats <- countRoots(nodes)
  depth_stats <- calculateWeightedDepth(nodes)
  structure_part <- merge(root_stats, depth_stats, by = "Feature", all = TRUE)[, -"sumGain"]

  nodes <- nodes[, .(Feature, Gain, Cover)]

  # Per-feature aggregates are computed before mean5gain() is called,
  # mirroring the evaluation order of the merge() arguments.
  gain_part <- nodes[, .(sumGain = sum(Gain),
                         sumCover = sum(Cover),
                         meanGain = mean(Gain),
                         meanCover = mean(Cover),
                         frequency = .N), by = Feature]
  gain_part <- merge(gain_part, mean5gain(nodes), by = "Feature")

  importance <- merge(structure_part, gain_part, by = "Feature")[, -"count"]

  setorderv(importance, "sumGain", -1)
  # Features that never appear in a root have no root statistics; report 0.
  importance[is.na(importance)] <- 0

  return(importance[])

}
176 | 
# Table with the number of roots and weightedRoot.
# Counts how many times each variable is the root of a tree (Node == 0) and
# computes weightedRoot: the number of root occurrences multiplied by the
# variable's share of the total root gain, rounded to 4 decimal places.
countRoots <- function(trees) {
  Node <- Quality <- Feature <- sumGain <- . <-
    weightedRoot <- numberOfRoots <- NULL

  root_nodes <- trees[Node == 0,
                      .(sumGain = sum(Quality), numberOfRoots = .N),
                      by = Feature]
  total_root_gain <- sum(root_nodes[, sumGain])
  root_nodes[, weightedRoot := round(sumGain * numberOfRoots / total_root_gain, 4)]

  return(root_nodes[])

}
191 | 
# Mean of the (up to) 5 nodes with the highest gain, per feature.
# Expects columns `Feature` and `Gain`; returns one row per feature with the
# column `mean5Gain`.
mean5gain <- function(trees) {
  indx <- Gain <- . <- Feature <- NULL

  # Work on a copy: sorting and adding the helper column by reference would
  # otherwise reorder the caller's table and leave an `indx` column in it.
  ranked <- copy(trees)
  setDT(ranked)
  setorder(ranked, Feature, -Gain)
  ranked[, indx := seq_len(.N), by = Feature]

  # After sorting, the first five rows of each feature are its top-gain nodes.
  importanceTop <- ranked[indx <= 5]
  importance <- importanceTop[, .(mean5Gain = mean(Gain)), by = Feature]

  return(importance[])
}
202 | 
# Computes, for every variable, the mean node depth weighted by Quality (gain),
# together with the number of nodes in which the variable occurs (`count`).
calculateWeightedDepth <- function(trees) {
  Feature <- depth <- Quality <- . <- NULL

  depth_by_feature <- trees[,
                            .(meanDepth = weighted.mean(depth, Quality),
                              count = .N),
                            by = Feature]

  return(depth_by_feature[])
}
211 | 
212 | 
# Binds the per-tree tables returned by calculateGain() into one table,
# drops the rows whose Feature is "Leaf" and keeps a fixed set of columns.
noLeavesGainTable <- function(xgb_model, data) {
  parentsName <- Feature <- Tree <- name_pair <- parentsGain <- childsGain <-
    . <- Cover <- parentsCover <- interaction <- Node <- Quality <- depth <- NULL

  all_nodes <- rbindlist(calculateGain(xgb_model, data))

  kept_columns <- c("Tree", "Node", "name_pair", "parentsGain", "childsGain", "Cover",
                    "parentsCover", "Feature", "Quality", "parentsName", "interaction", "depth")
  split_nodes <- all_nodes[Feature != "Leaf", kept_columns, with = FALSE]

  return(split_nodes[])
}
224 | 


--------------------------------------------------------------------------------
/docs/reference/titanic.html:
--------------------------------------------------------------------------------
  1 | <!-- Generated by pkgdown: do not edit by hand -->
  2 | <!DOCTYPE html>
  3 | <html>
  4 |   <head>
  5 |   <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | 
  9 | <title>Passengers and Crew on the RMS Titanic — titanic • EIX</title>
 10 | 
 11 | <!-- jquery -->
 12 | <script src="https://code.jquery.com/jquery-3.1.0.min.js" integrity="sha384-nrOSfDHtoPMzJHjVTdCopGqIqeYETSXhZDFyniQ8ZHcVy08QesyHcnOUpMpqnmWq" crossorigin="anonymous"></script>
 13 | <!-- Bootstrap -->
 14 | 
 15 | <link href="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/css/bootstrap.min.css" rel="stylesheet" integrity="sha384-BVYiiSIFeK1dGmJRAkycuHAHRg32OmUcww7on3RYdg4Va+PmSTsz/K68vbdEjh4u" crossorigin="anonymous">
 16 | <script src="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha384-Tc5IQib027qvyjSMfHjOMaLkfuWVxZxUPnCJA7l2mCWNIpG9mGCD8wGNIcPD7Txa" crossorigin="anonymous"></script>
 17 | 
 18 | <!-- Font Awesome icons -->
 19 | <link href="https://maxcdn.bootstrapcdn.com/font-awesome/4.6.3/css/font-awesome.min.css" rel="stylesheet" integrity="sha384-T8Gy5hrqNKT+hzMclPo118YTQO6cYprQmhrYwIiQ/3axmI1hQomh7Ud2hPOy8SP1" crossorigin="anonymous">
 20 | 
 21 | 
 22 | <!-- pkgdown -->
 23 | <link href="../pkgdown.css" rel="stylesheet">
 24 | <script src="../jquery.sticky-kit.min.js"></script>
 25 | <script src="../pkgdown.js"></script>
 26 | <!-- mathjax -->
 27 | <script src='https://mathjax.rstudio.com/latest/MathJax.js?config=TeX-AMS-MML_HTMLorMML'></script>
 28 | 
 29 | <!--[if lt IE 9]>
 30 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 31 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 32 | <![endif]-->
 33 | 
 34 | 
 35 |   </head>
 36 | 
 37 |   <body>
 38 |     <div class="container template-reference-topic">
 39 |       <header>
 40 |       <div class="navbar navbar-default navbar-fixed-top navbar-mi2" role="navigation">
 41 |   <div class="container">
 42 |     <div class="navbar-header">
 43 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar">
 44 |         <span class="icon-bar"></span>
 45 |         <span class="icon-bar"></span>
 46 |         <span class="icon-bar"></span>
 47 |       </button>
 48 | 	  <a class = "navbar-mi2logo" href="http://mi2.mini.pw.edu.pl/">
 49 |         <img src = "https://github.com/mi2-warsaw/MI2template/blob/master/inst/pkgdown/assets/MI2logo.jpg?raw=true" alt = "MI2" height = 46 title = "MI2">
 50 | 	  </a>
 51 |       <a class="navbar-brand navbar-mi2" href="../index.html">Passengers and Crew on the RMS Titanic</a>
 52 |     </div>
 53 |     <div id="navbar" class="navbar-collapse collapse">
 54 |       <ul class="navbar-mi2 nav navbar-nav">
 55 |         <li>
 56 |   <a href="../index.html">
 57 |     <span class="fa fa-home fa-lg"></span>
 58 |      
 59 |   </a>
 60 | </li>
 61 | <li>
 62 |   <a href="../articles/EIX.html">Get started</a>
 63 | </li>
 64 | <li>
 65 |   <a href="../reference/index.html">Reference</a>
 66 | </li>
 67 | <li class="dropdown">
 68 |   <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-expanded="false">
 69 |     Articles
 70 |      
 71 |     <span class="caret"></span>
 72 |   </a>
 73 |   <ul class="dropdown-menu" role="menu">
 74 |     <li>
 75 |       <a href="../articles/vignette_titanic.html">EIX: Titanic data </a>
 76 |     </li>
 77 |   </ul>
 78 | </li>
 79 |       </ul>
 80 |       
 81 |       <ul class="nav navbar-nav navbar-right">
 82 |         
 83 |       </ul>
 84 |     </div><!--/.nav-collapse -->
 85 |   </div><!--/.container -->
 86 | </div><!--/.navbar -->
 87 | 
 88 |       
 89 |       </header>
 90 | 
 91 |       <div class="row">
 92 |   <div class="col-md-9 contents">
 93 |     <div class="page-header">
 94 |     <h1>Passengers and Crew on the RMS Titanic</h1>
 95 |     </div>
 96 | 
 97 |     
 98 |     <p>The <code>titanic</code> data is a complete list of passengers and crew members on  the RMS Titanic.
 99 | It includes a variable indicating whether a person did  survive the sinking of the RMS
100 | Titanic on April 15, 1912.</p>
101 |     
102 | 
103 |     <pre class="usage"><span class='fu'><a href='https://www.rdocumentation.org/packages/utils/topics/data'>data</a></span>(<span class='no'>titanic</span>)</pre>
104 |         
105 |     <h2 class="hasAnchor" id="format"><a class="anchor" href="#format"></a>Format</h2>
106 | 
107 |     <p>a data frame with 2207 rows and 11 columns</p>
108 |     
109 |     <h2 class="hasAnchor" id="source"><a class="anchor" href="#source"></a>Source</h2>
110 | 
111 |     <p>The description of the dataset was copied from the <code>DALEX</code> package.
112 | This dataset was copied from the <code>stablelearner</code> package and went through a few variable
113 | transformations. The complete list of persons on the RMS Titanic was downloaded from
114 | <a href='https://www.encyclopedia-titanica.org'>https://www.encyclopedia-titanica.org</a> on April 5, 2016. The information given
115 | in <code>sibsp</code> and <code>parch</code> was adopted from a data set obtained from <a href='http://biostat.mc.vanderbilt.edu/DataSets'>http://biostat.mc.vanderbilt.edu/DataSets</a>.</p>
116 |     
117 |     <h2 class="hasAnchor" id="details"><a class="anchor" href="#details"></a>Details</h2>
118 | 
119 |     <p>The description of the dataset was copied from the <code>DALEX</code> package.</p>
120 | <p>This dataset was copied from the <code>stablelearner</code> package and went through a few variable
121 | transformations. Levels in <code>embarked</code> were replaced with full names, <code>sibsp</code>, <code>parch</code> and <code>fare</code>
122 | were converted to numerical variables and values for crew were replaced with 0.
123 | If you use this dataset please cite the original package.</p>
124 | <p>From <code>stablelearner</code>: The website <a href='https://www.encyclopedia-titanica.org'>https://www.encyclopedia-titanica.org</a> offers detailed  information about passengers and crew
125 | members on the RMS Titanic. According to the website 1317 passengers and 890 crew members were aboard.
126 | 8 musicians and 9 employees of the shipyard company are listed as passengers, but travelled with a
127 | free ticket, which is why they have <code>NA</code> values in <code>fare</code>. In addition to that, <code>fare</code>
128 | is truly missing for a few regular passengers.</p>
129 | <ul>
130 | <li><p>gender a factor with levels <code>male</code> and <code>female</code>.</p></li>
131 | <li><p>age a numeric value with the person's age on the day of the sinking.</p></li>
132 | <li><p>class a factor specifying the class for passengers or the type of service aboard for crew members.</p></li>
133 | <li><p>embarked a factor with the person's place of embarkment (Belfast/Cherbourg/Queenstown/Southampton).</p></li>
134 | <li><p>country a factor with the person's home country.</p></li>
135 | <li><p>fare a numeric value with the ticket price (<code>0</code> for crew members, musicians and employees of the shipyard company).</p></li>
136 | <li><p>sibsp an ordered factor specifying the number of siblings/spouses aboard; adopted from Vanderbilt data set (see below).</p></li>
137 | <li><p>parch an ordered factor specifying the number of parents/children aboard; adopted from Vanderbilt data set (see below).</p></li>
138 | <li><p>survived a factor with two levels (<code>no</code> and <code>yes</code>) specifying whether the person has survived the sinking.</p></li>
139 | </ul>
140 |     
141 |     <h2 class="hasAnchor" id="references"><a class="anchor" href="#references"></a>References</h2>
142 | 
143 |     <p><a href='https://www.encyclopedia-titanica.org'>https://www.encyclopedia-titanica.org</a>, <a href='http://biostat.mc.vanderbilt.edu/DataSets'>http://biostat.mc.vanderbilt.edu/DataSets</a>,
144 | <a href='https://CRAN.R-project.org/package=stablelearner'>https://CRAN.R-project.org/package=stablelearner</a>, <a href='https://CRAN.R-project.org/package=DALEX'>https://CRAN.R-project.org/package=DALEX</a>.</p>
145 |     
146 | 
147 |   </div>
148 |   <div class="col-md-3 hidden-xs hidden-sm" id="sidebar">
149 |     <h2>Contents</h2>
150 |     <ul class="nav nav-pills nav-stacked">
151 |       
152 |       <li><a href="#format">Format</a></li>
153 | 
154 |       <li><a href="#source">Source</a></li>
155 | 
156 |       <li><a href="#details">Details</a></li>
157 | 
158 |       <li><a href="#references">References</a></li>
159 |           </ul>
160 | 
161 |   </div>
162 | </div>
163 | 
164 |       <footer>
165 |       <div class="copyright">
166 |   <p>Developed by Ewelina Karbowiak, Przemyslaw Biecek.</p>
167 | </div>
168 | 
169 | <div class="pkgdown">
170 |   <p>Site built with <a href="http://hadley.github.io/pkgdown/">pkgdown</a>.</p>
171 | </div>
172 | 
173 |       </footer>
174 |    </div>
175 | 
176 |   </body>
177 | </html>
178 | 
179 | 


--------------------------------------------------------------------------------
/docs/reference/titanic_data.html:
--------------------------------------------------------------------------------
  1 | <!-- Generated by pkgdown: do not edit by hand -->
  2 | <!DOCTYPE html>
  3 | <html>
  4 |   <head>
  5 |   <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | 
  9 | <title>Passengers and Crew on the RMS Titanic — titanic_data • EIX</title>
 10 | 
 11 | <!-- jquery -->
 12 | <script src="https://code.jquery.com/jquery-3.1.0.min.js" integrity="sha384-nrOSfDHtoPMzJHjVTdCopGqIqeYETSXhZDFyniQ8ZHcVy08QesyHcnOUpMpqnmWq" crossorigin="anonymous"></script>
 13 | <!-- Bootstrap -->
 14 | 
 15 | <link href="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/css/bootstrap.min.css" rel="stylesheet" integrity="sha384-BVYiiSIFeK1dGmJRAkycuHAHRg32OmUcww7on3RYdg4Va+PmSTsz/K68vbdEjh4u" crossorigin="anonymous">
 16 | <script src="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha384-Tc5IQib027qvyjSMfHjOMaLkfuWVxZxUPnCJA7l2mCWNIpG9mGCD8wGNIcPD7Txa" crossorigin="anonymous"></script>
 17 | 
 18 | <!-- Font Awesome icons -->
 19 | <link href="https://maxcdn.bootstrapcdn.com/font-awesome/4.6.3/css/font-awesome.min.css" rel="stylesheet" integrity="sha384-T8Gy5hrqNKT+hzMclPo118YTQO6cYprQmhrYwIiQ/3axmI1hQomh7Ud2hPOy8SP1" crossorigin="anonymous">
 20 | 
 21 | 
 22 | <!-- pkgdown -->
 23 | <link href="../pkgdown.css" rel="stylesheet">
 24 | <script src="../jquery.sticky-kit.min.js"></script>
 25 | <script src="../pkgdown.js"></script>
 26 | <!-- mathjax -->
 27 | <script src='https://mathjax.rstudio.com/latest/MathJax.js?config=TeX-AMS-MML_HTMLorMML'></script>
 28 | 
 29 | <!--[if lt IE 9]>
 30 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 31 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 32 | <![endif]-->
 33 | 
 34 | 
 35 |   </head>
 36 | 
 37 |   <body>
 38 |     <div class="container template-reference-topic">
 39 |       <header>
 40 |       <div class="navbar navbar-default navbar-fixed-top navbar-mi2" role="navigation">
 41 |   <div class="container">
 42 |     <div class="navbar-header">
 43 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar">
 44 |         <span class="icon-bar"></span>
 45 |         <span class="icon-bar"></span>
 46 |         <span class="icon-bar"></span>
 47 |       </button>
 48 | 	  <a class = "navbar-mi2logo" href="http://mi2.mini.pw.edu.pl/">
 49 |         <img src = "https://github.com/mi2-warsaw/MI2template/blob/master/inst/pkgdown/assets/MI2logo.jpg?raw=true" alt = "MI2" height = 46 title = "MI2">
 50 | 	  </a>
 51 |       <a class="navbar-brand navbar-mi2" href="../index.html">Passengers and Crew on the RMS Titanic</a>
 52 |     </div>
 53 |     <div id="navbar" class="navbar-collapse collapse">
 54 |       <ul class="navbar-mi2 nav navbar-nav">
 55 |         <li>
 56 |   <a href="../index.html">
 57 |     <span class="fa fa-home fa-lg"></span>
 58 |      
 59 |   </a>
 60 | </li>
 61 | <li>
 62 |   <a href="../articles/EIX.html">Get started</a>
 63 | </li>
 64 | <li>
 65 |   <a href="../reference/index.html">Reference</a>
 66 | </li>
 67 | <li class="dropdown">
 68 |   <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-expanded="false">
 69 |     Articles
 70 |      
 71 |     <span class="caret"></span>
 72 |   </a>
 73 |   <ul class="dropdown-menu" role="menu">
 74 |     <li>
 75 |       <a href="../articles/titanic_data.html">EIX: Titanic data </a>
 76 |     </li>
 77 |   </ul>
 78 | </li>
 79 |       </ul>
 80 |       
 81 |       <ul class="nav navbar-nav navbar-right">
 82 |         <li>
 83 |   <a href="https://github.com/ModelOriented/EIX">
 84 |     <span class="fa fa-github fa-lg"></span>
 85 |      
 86 |   </a>
 87 | </li>
 88 |       </ul>
 89 |     </div><!--/.nav-collapse -->
 90 |   </div><!--/.container -->
 91 | </div><!--/.navbar -->
 92 | 
 93 |       
 94 |       </header>
 95 | 
 96 |       <div class="row">
 97 |   <div class="col-md-9 contents">
 98 |     <div class="page-header">
 99 |     <h1>Passengers and Crew on the RMS Titanic</h1>
100 |     </div>
101 | 
102 |     
103 |     <p>The <code>titanic</code> data is a complete list of passengers and crew members on  the RMS Titanic.
104 | It includes a variable indicating whether a person did  survive the sinking of the RMS
105 | Titanic on April 15, 1912.</p>
106 |     
107 | 
108 |     <pre class="usage"><span class='fu'><a href='https://www.rdocumentation.org/packages/utils/topics/data'>data</a></span>(<span class='no'>titanic_data</span>)</pre>
109 |         
110 |     <h2 class="hasAnchor" id="format"><a class="anchor" href="#format"></a>Format</h2>
111 | 
112 |     <p>a data frame with 2207 rows and 11 columns</p>
113 |     
114 |     <h2 class="hasAnchor" id="source"><a class="anchor" href="#source"></a>Source</h2>
115 | 
116 |     <p>The description of the dataset was copied from the <code>DALEX</code> package.
117 | This dataset was copied from the <code>stablelearner</code> package and went through a few variable
118 | transformations. The complete list of persons on the RMS Titanic was downloaded from
119 | <a href='https://www.encyclopedia-titanica.org'>https://www.encyclopedia-titanica.org</a> on April 5, 2016. The information given
120 | in <code>sibsp</code> and <code>parch</code> was adopted from a data set obtained from <a href='http://biostat.mc.vanderbilt.edu/DataSets'>http://biostat.mc.vanderbilt.edu/DataSets</a>.</p>
121 |     
122 |     <h2 class="hasAnchor" id="details"><a class="anchor" href="#details"></a>Details</h2>
123 | 
124 |     <p>The description of the dataset was copied from the <code>DALEX</code> package.</p>
125 | <p>This dataset was copied from the <code>stablelearner</code> package and went through a few variable
126 | transformations. Levels in <code>embarked</code> were replaced with full names, <code>sibsp</code>, <code>parch</code> and <code>fare</code>
127 | were converted to numerical variables and values for crew were replaced with 0.
128 | If you use this dataset please cite the original package.</p>
129 | <p>From <code>stablelearner</code>: The website <a href='https://www.encyclopedia-titanica.org'>https://www.encyclopedia-titanica.org</a> offers detailed  information about passengers and crew
130 | members on the RMS Titanic. According to the website 1317 passengers and 890 crew members were aboard.
131 | 8 musicians and 9 employees of the shipyard company are listed as passengers, but travelled with a
132 | free ticket, which is why they have <code>NA</code> values in <code>fare</code>. In addition to that, <code>fare</code>
133 | is truly missing for a few regular passengers.</p>
134 | <ul>
135 | <li><p>gender a factor with levels <code>male</code> and <code>female</code>.</p></li>
136 | <li><p>age a numeric value with the person's age on the day of the sinking.</p></li>
137 | <li><p>class a factor specifying the class for passengers or the type of service aboard for crew members.</p></li>
138 | <li><p>embarked a factor with the person's place of embarkment (Belfast/Cherbourg/Queenstown/Southampton).</p></li>
139 | <li><p>country a factor with the person's home country.</p></li>
140 | <li><p>fare a numeric value with the ticket price (<code>0</code> for crew members, musicians and employees of the shipyard company).</p></li>
141 | <li><p>sibsp an ordered factor specifying the number of siblings/spouses aboard; adopted from Vanderbilt data set (see below).</p></li>
142 | <li><p>parch an ordered factor specifying the number of parents/children aboard; adopted from Vanderbilt data set (see below).</p></li>
143 | <li><p>survived a factor with two levels (<code>no</code> and <code>yes</code>) specifying whether the person has survived the sinking.</p></li>
144 | </ul>
145 |     
146 |     <h2 class="hasAnchor" id="references"><a class="anchor" href="#references"></a>References</h2>
147 | 
148 |     <p><a href='https://www.encyclopedia-titanica.org'>https://www.encyclopedia-titanica.org</a>, <a href='http://biostat.mc.vanderbilt.edu/DataSets'>http://biostat.mc.vanderbilt.edu/DataSets</a>,
149 | <a href='https://CRAN.R-project.org/package=stablelearner'>https://CRAN.R-project.org/package=stablelearner</a>, <a href='https://cran.r-project.org/package=DALEX'>https://cran.r-project.org/package=DALEX</a>.</p>
150 |     
151 | 
152 |   </div>
153 |   <div class="col-md-3 hidden-xs hidden-sm" id="sidebar">
154 |     <h2>Contents</h2>
155 |     <ul class="nav nav-pills nav-stacked">
156 |       
157 |       <li><a href="#format">Format</a></li>
158 | 
159 |       <li><a href="#source">Source</a></li>
160 | 
161 |       <li><a href="#details">Details</a></li>
162 | 
163 |       <li><a href="#references">References</a></li>
164 |           </ul>
165 | 
166 |   </div>
167 | </div>
168 | 
169 |       <footer>
170 |       <div class="copyright">
171 |   <p>Developed by Ewelina Karbowiak, Przemyslaw Biecek.</p>
172 | </div>
173 | 
174 | <div class="pkgdown">
175 |   <p>Site built with <a href="http://hadley.github.io/pkgdown/">pkgdown</a>.</p>
176 | </div>
177 | 
178 |       </footer>
179 |    </div>
180 | 
181 |   </body>
182 | </html>
183 | 
184 | 


--------------------------------------------------------------------------------
/docs/reference/countPairs.html:
--------------------------------------------------------------------------------
  1 | <!-- Generated by pkgdown: do not edit by hand -->
  2 | <!DOCTYPE html>
  3 | <html lang="en">
  4 |   <head>
  5 |   <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | 
  9 | <title>Table of occurrences number — countPairs • EIX</title>
 10 | 
 11 | <!-- favicons -->
 12 | <link rel="icon" type="image/png" sizes="16x16" href="../favicon-16x16.png">
 13 | <link rel="icon" type="image/png" sizes="32x32" href="../favicon-32x32.png">
 14 | <link rel="apple-touch-icon" type="image/png" sizes="180x180" href="../apple-touch-icon.png" />
 15 | <link rel="apple-touch-icon" type="image/png" sizes="120x120" href="../apple-touch-icon-120x120.png" />
 16 | <link rel="apple-touch-icon" type="image/png" sizes="76x76" href="../apple-touch-icon-76x76.png" />
 17 | <link rel="apple-touch-icon" type="image/png" sizes="60x60" href="../apple-touch-icon-60x60.png" />
 18 | <!-- jquery -->
 19 | <script src="https://cdnjs.cloudflare.com/ajax/libs/jquery/3.3.1/jquery.min.js" integrity="sha256-FgpCb/KJQlLNfOu91ta32o/NMZxltwRo8QtmkMRdAu8=" crossorigin="anonymous"></script>
 20 | <!-- Bootstrap -->
 21 | 
 22 | <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/css/bootstrap.min.css" integrity="sha256-916EbMg70RQy9LHiGkXzG8hSg9EdNy97GazNG/aiY1w=" crossorigin="anonymous" />
 23 | <script src="https://cdnjs.cloudflare.com/ajax/libs/twitter-bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha256-U5ZEeKfGNOja007MMD3YBI0A3OSZOQbeG6z2f2Y0hu8=" crossorigin="anonymous"></script>
 24 | 
 25 | <!-- Font Awesome icons -->
 26 | <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/4.7.0/css/font-awesome.min.css" integrity="sha256-eZrrJcwDc/3uDhsdt61sL2oOBY362qM3lon1gyExkL0=" crossorigin="anonymous" />
 27 | 
 28 | <!-- clipboard.js -->
 29 | <script src="https://cdnjs.cloudflare.com/ajax/libs/clipboard.js/2.0.4/clipboard.min.js" integrity="sha256-FiZwavyI2V6+EXO1U+xzLG3IKldpiTFf3153ea9zikQ=" crossorigin="anonymous"></script>
 30 | 
 31 | <!-- sticky kit -->
 32 | <script src="https://cdnjs.cloudflare.com/ajax/libs/sticky-kit/1.1.3/sticky-kit.min.js" integrity="sha256-c4Rlo1ZozqTPE2RLuvbusY3+SU1pQaJC0TjuhygMipw=" crossorigin="anonymous"></script>
 33 | 
 34 | <!-- pkgdown -->
 35 | <link href="../pkgdown.css" rel="stylesheet">
 36 | <script src="../pkgdown.js"></script>
 37 | 
 38 | 
 39 | 
 40 | <meta property="og:title" content="Table of occurrences number — countPairs" />
 41 | 
 42 | <meta property="og:description" content="Table containing the number of occurrences of variable pairs in the model." />
 43 | 
 44 | <meta property="og:image" content="/logo.png" />
 45 | <meta name="twitter:card" content="summary" />
 46 | 
 47 | 
 48 | 
 49 | <!-- mathjax -->
 50 | <script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/MathJax.js" integrity="sha256-nvJJv9wWKEm88qvoQl9ekL2J+k/RWIsaSScxxlsrv8k=" crossorigin="anonymous"></script>
 51 | <script src="https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.5/config/TeX-AMS-MML_HTMLorMML.js" integrity="sha256-84DKXVJXs0/F8OTMzX4UR909+jtl4G7SPypPavF+GfA=" crossorigin="anonymous"></script>
 52 | 
 53 | <!--[if lt IE 9]>
 54 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 55 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 56 | <![endif]-->
 57 | 
 58 | 
 59 |   </head>
 60 | 
 61 |   <body>
 62 |     <div class="container template-reference-topic">
 63 |       <header>
 64 |       <div class="navbar navbar-default navbar-fixed-top" role="navigation">
 65 |   <div class="container">
 66 |     <div class="navbar-header">
 67 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar" aria-expanded="false">
 68 |         <span class="sr-only">Toggle navigation</span>
 69 |         <span class="icon-bar"></span>
 70 |         <span class="icon-bar"></span>
 71 |         <span class="icon-bar"></span>
 72 |       </button>
 73 |       <span class="navbar-brand">
 74 |         <a class="navbar-link" href="../index.html">EIX</a>
 75 |         <span class="version label label-default" data-toggle="tooltip" data-placement="bottom" title="Released version">0.0.0.9000</span>
 76 |       </span>
 77 |     </div>
 78 | 
 79 |     <div id="navbar" class="navbar-collapse collapse">
 80 |       <ul class="nav navbar-nav">
 81 |         <li>
 82 |   <a href="../index.html">
 83 |     <span class="fa fa-home fa-lg"></span>
 84 |      
 85 |   </a>
 86 | </li>
 87 | <li>
 88 |   <a href="../reference/index.html">Reference</a>
 89 | </li>
 90 |       </ul>
 91 |       
 92 |       <ul class="nav navbar-nav navbar-right">
 93 |         
 94 |       </ul>
 95 |       
 96 |     </div><!--/.nav-collapse -->
 97 |   </div><!--/.container -->
 98 | </div><!--/.navbar -->
 99 | 
100 |       
101 |       </header>
102 | 
103 | <div class="row">
104 |   <div class="col-md-9 contents">
105 |     <div class="page-header">
106 |     <h1>Table of occurrences number</h1>
107 |     
108 |     <div class="hidden name"><code>countPairs.Rd</code></div>
109 |     </div>
110 | 
111 |     <div class="ref-description">
112 |     
113 |     <p>Table containing the number of occurrences of variable pairs in the model.</p>
114 |     
115 |     </div>
116 | 
117 |     <pre class="usage"><span class='fu'>countPairs</span>(<span class='no'>xgb.model</span>, <span class='no'>data</span>)</pre>
118 |     
119 |     <h2 class="hasAnchor" id="arguments"><a class="anchor" href="#arguments"></a>Arguments</h2>
120 |     <table class="ref-arguments">
121 |     <colgroup><col class="name" /><col class="desc" /></colgroup>
122 |     <tr>
123 |       <th>xgb.model</th>
124 |       <td><p>an xgboost or lightgbm model</p></td>
125 |     </tr>
126 |     <tr>
127 |       <th>data</th>
128 |       <td><p>a data table with data used to train the model</p></td>
129 |     </tr>
130 |     </table>
131 |     
132 |     <h2 class="hasAnchor" id="value"><a class="anchor" href="#value"></a>Value</h2>
133 | 
134 |     <p>a data table</p>
135 |     
136 | 
137 |     <h2 class="hasAnchor" id="examples"><a class="anchor" href="#examples"></a>Examples</h2>
138 |     <pre class="examples"><div class='input'><span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/library'>library</a></span>(<span class='st'>"EIX"</span>)
139 | <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/library'>library</a></span>(<span class='st'>"Matrix"</span>)</div><div class='output co'>#&gt; <span class='warning'>Warning: pakiet 'Matrix' został zbudowany w wersji R 3.4.4</span></div><div class='input'><span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/library'>library</a></span>(<span class='st'>"data.table"</span>)</div><div class='output co'>#&gt; <span class='warning'>Warning: pakiet 'data.table' został zbudowany w wersji R 3.4.4</span></div><div class='input'><span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/library'>library</a></span>(<span class='st'>"xgboost"</span>)</div><div class='output co'>#&gt; <span class='warning'>Warning: pakiet 'xgboost' został zbudowany w wersji R 3.4.4</span></div><div class='input'>
140 | <span class='no'>dt_HR</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/data.table/topics/data.table'>data.table</a></span>(<span class='no'>HR_data</span>)
141 | <span class='no'>sm</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/Matrix/topics/sparse.model.matrix'>sparse.model.matrix</a></span>(<span class='no'>left</span> ~ <span class='no'>.</span> - <span class='fl'>1</span>,  <span class='kw'>data</span> <span class='kw'>=</span> <span class='no'>dt_HR</span>)
142 | 
143 | <span class='no'>param</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/list'>list</a></span>(<span class='kw'>objective</span> <span class='kw'>=</span> <span class='st'>"binary:logistic"</span>, <span class='kw'>base_score</span> <span class='kw'>=</span> <span class='fl'>0.5</span>, <span class='kw'>max_depth</span> <span class='kw'>=</span> <span class='fl'>2</span>)
144 | <span class='no'>xgb.model</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/xgboost/topics/xgb.train'>xgboost</a></span>( <span class='kw'>param</span> <span class='kw'>=</span> <span class='no'>param</span>, <span class='kw'>data</span> <span class='kw'>=</span> <span class='no'>sm</span>, <span class='kw'>label</span> <span class='kw'>=</span> <span class='no'>dt_HR</span>[, <span class='no'>left</span>] <span class='kw'>==</span> <span class='fl'>1</span>, <span class='kw'>nrounds</span> <span class='kw'>=</span> <span class='fl'>50</span>, <span class='kw'>verbose</span> <span class='kw'>=</span> <span class='fl'>FALSE</span>)
145 | 
146 | <span class='fu'>countPairs</span>(<span class='no'>xgb.model</span>, <span class='no'>sm</span>)</div><div class='output co'>#&gt; <span class='error'>Error in countPairs(xgb.model, sm): nie udało się znaleźć funkcji 'countPairs'</span></div><div class='input'>
147 | </div></pre>
148 |   </div>
149 |   <div class="col-md-3 hidden-xs hidden-sm" id="sidebar">
150 |     <h2>Contents</h2>
151 |     <ul class="nav nav-pills nav-stacked">
152 |       <li><a href="#arguments">Arguments</a></li>
153 |       
154 |       <li><a href="#value">Value</a></li>
155 |       
156 |       <li><a href="#examples">Examples</a></li>
157 |     </ul>
158 | 
159 |   </div>
160 | </div>
161 | 
162 |       <footer>
163 |       <div class="copyright">
164 |   <p>Developed by Ewelina Karbowiak, Przemyslaw Biecek.</p>
165 | </div>
166 | 
167 | <div class="pkgdown">
168 |   <p>Site built with <a href="https://pkgdown.r-lib.org/">pkgdown</a> 1.3.0.</p>
169 | </div>
170 |       </footer>
171 |    </div>
172 | 
173 |   
174 | 
175 |   </body>
176 | </html>
177 | 
178 | 


--------------------------------------------------------------------------------
/docs/reference/lollipop.html:
--------------------------------------------------------------------------------
  1 | <!-- Generated by pkgdown: do not edit by hand -->
  2 | <!DOCTYPE html>
  3 | <html>
  4 |   <head>
  5 |   <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | 
  9 | <title>Tables needed for lollipop plot — lollipop • EIX</title>
 10 | 
 11 | <!-- jquery -->
 12 | <script src="https://code.jquery.com/jquery-3.1.0.min.js" integrity="sha384-nrOSfDHtoPMzJHjVTdCopGqIqeYETSXhZDFyniQ8ZHcVy08QesyHcnOUpMpqnmWq" crossorigin="anonymous"></script>
 13 | <!-- Bootstrap -->
 14 | 
 15 | <link href="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/css/bootstrap.min.css" rel="stylesheet" integrity="sha384-BVYiiSIFeK1dGmJRAkycuHAHRg32OmUcww7on3RYdg4Va+PmSTsz/K68vbdEjh4u" crossorigin="anonymous">
 16 | <script src="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha384-Tc5IQib027qvyjSMfHjOMaLkfuWVxZxUPnCJA7l2mCWNIpG9mGCD8wGNIcPD7Txa" crossorigin="anonymous"></script>
 17 | 
 18 | <!-- Font Awesome icons -->
 19 | <link href="https://maxcdn.bootstrapcdn.com/font-awesome/4.6.3/css/font-awesome.min.css" rel="stylesheet" integrity="sha384-T8Gy5hrqNKT+hzMclPo118YTQO6cYprQmhrYwIiQ/3axmI1hQomh7Ud2hPOy8SP1" crossorigin="anonymous">
 20 | 
 21 | 
 22 | <!-- pkgdown -->
 23 | <link href="../pkgdown.css" rel="stylesheet">
 24 | <script src="../jquery.sticky-kit.min.js"></script>
 25 | <script src="../pkgdown.js"></script>
 26 | <!-- mathjax -->
 27 | <script src='https://mathjax.rstudio.com/latest/MathJax.js?config=TeX-AMS-MML_HTMLorMML'></script>
 28 | 
 29 | <!--[if lt IE 9]>
 30 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 31 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 32 | <![endif]-->
 33 | 
 34 | 
 35 |   </head>
 36 | 
 37 |   <body>
 38 |     <div class="container template-reference-topic">
 39 |       <header>
 40 |       <div class="navbar navbar-default navbar-fixed-top navbar-mi2" role="navigation">
 41 |   <div class="container">
 42 |     <div class="navbar-header">
 43 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar">
 44 |         <span class="icon-bar"></span>
 45 |         <span class="icon-bar"></span>
 46 |         <span class="icon-bar"></span>
 47 |       </button>
 48 | 	  <a class = "navbar-mi2logo" href="http://mi2.mini.pw.edu.pl/">
 49 |         <img src = "https://github.com/mi2-warsaw/MI2template/blob/master/inst/pkgdown/assets/MI2logo.jpg?raw=true" alt = "MI2" height = 46 title = "MI2">
 50 | 	  </a>
 51 |       <a class="navbar-brand navbar-mi2" href="../index.html">Tables needed for lollipop plot</a>
 52 |     </div>
 53 |     <div id="navbar" class="navbar-collapse collapse">
 54 |       <ul class="navbar-mi2 nav navbar-nav">
 55 |         <li>
 56 |   <a href="../index.html">
 57 |     <span class="fa fa-home fa-lg"></span>
 58 |      
 59 |   </a>
 60 | </li>
 61 | <li>
 62 |   <a href="../articles/EIX.html">Get started</a>
 63 | </li>
 64 | <li>
 65 |   <a href="../reference/index.html">Reference</a>
 66 | </li>
 67 | <li class="dropdown">
 68 |   <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-expanded="false">
 69 |     Articles
 70 |      
 71 |     <span class="caret"></span>
 72 |   </a>
 73 |   <ul class="dropdown-menu" role="menu">
 74 |     <li>
 75 |       <a href="../articles/titanic_data.html">EIX: Titanic data </a>
 76 |     </li>
 77 |   </ul>
 78 | </li>
 79 |       </ul>
 80 |       
 81 |       <ul class="nav navbar-nav navbar-right">
 82 |         <li>
 83 |   <a href="https://github.com/ModelOriented/EIX">
 84 |     <span class="fa fa-github fa-lg"></span>
 85 |      
 86 |   </a>
 87 | </li>
 88 |       </ul>
 89 |     </div><!--/.nav-collapse -->
 90 |   </div><!--/.container -->
 91 | </div><!--/.navbar -->
 92 | 
 93 |       
 94 |       </header>
 95 | 
 96 |       <div class="row">
 97 |   <div class="col-md-9 contents">
 98 |     <div class="page-header">
 99 |     <h1>Tables needed for lollipop plot</h1>
100 |     </div>
101 | 
102 |     
103 |     <p>This function calculates two tables needed to generate a lollipop plot, which visualises the model.
104 | The first table contains information about all nodes in the trees forming a model.
105 | It includes gain value, depth and ID of each node.
106 | The second table contains similar information about the roots of the trees.</p>
107 |     
108 | 
109 |     <pre class="usage"><span class='fu'>lollipop</span>(<span class='no'>xgb_model</span>, <span class='no'>data</span>)</pre>
110 |     
111 |     <h2 class="hasAnchor" id="arguments"><a class="anchor" href="#arguments"></a> Arguments</h2>
112 |     <table class="ref-arguments">
113 |     <colgroup><col class="name" /><col class="desc" /></colgroup>
114 |     <tr>
115 |       <th>xgb_model</th>
116 |       <td><p>an xgboost or lightgbm model.</p></td>
117 |     </tr>
118 |     <tr>
119 |       <th>data</th>
120 |       <td><p>a data table with data used to train the model.</p></td>
121 |     </tr>
122 |     </table>
123 |     
124 |     <h2 class="hasAnchor" id="value"><a class="anchor" href="#value"></a>Value</h2>
125 | 
126 |     <p>an object of the lollipop class</p>
127 |     
128 | 
129 |     <h2 class="hasAnchor" id="examples"><a class="anchor" href="#examples"></a>Examples</h2>
130 |     <pre class="examples"><div class='input'><span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/library'>library</a></span>(<span class='st'>"EIX"</span>)
131 | <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/library'>library</a></span>(<span class='st'>"Matrix"</span>)
132 | <span class='no'>sm</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/Matrix/topics/sparse.model.matrix'>sparse.model.matrix</a></span>(<span class='no'>left</span> ~ <span class='no'>.</span> - <span class='fl'>1</span>,  <span class='kw'>data</span> <span class='kw'>=</span> <span class='no'>HR_data</span>)
133 | 
134 | <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/library'>library</a></span>(<span class='st'>"xgboost"</span>)
135 | <span class='no'>param</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/list'>list</a></span>(<span class='kw'>objective</span> <span class='kw'>=</span> <span class='st'>"binary:logistic"</span>, <span class='kw'>max_depth</span> <span class='kw'>=</span> <span class='fl'>2</span>)
136 | <span class='no'>xgb_model</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/xgboost/topics/xgb.train'>xgboost</a></span>(<span class='no'>sm</span>, <span class='kw'>params</span> <span class='kw'>=</span> <span class='no'>param</span>, <span class='kw'>label</span> <span class='kw'>=</span> <span class='no'>HR_data</span>[, <span class='no'>left</span>] <span class='kw'>==</span> <span class='fl'>1</span>, <span class='kw'>nrounds</span> <span class='kw'>=</span> <span class='fl'>25</span>, <span class='kw'>verbose</span> <span class='kw'>=</span> <span class='fl'>0</span>)
137 | 
138 | <span class='no'>lolli</span> <span class='kw'>&lt;-</span> <span class='fu'>lollipop</span>(<span class='no'>xgb_model</span>, <span class='no'>sm</span>)
139 | <span class='fu'><a href='https://www.rdocumentation.org/packages/graphics/topics/plot'>plot</a></span>(<span class='no'>lolli</span>, <span class='kw'>labels</span> <span class='kw'>=</span> <span class='st'>"topAll"</span>, <span class='kw'>log_scale</span> <span class='kw'>=</span> <span class='fl'>TRUE</span>)</div><div class='img'><img src='lollipop-1.png' alt='' width='700' height='433' /></div><div class='input'>
140 | </div><div class='input'><span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/library'>library</a></span>(<span class='no'>lightgbm</span>)
141 | <span class='no'>train_data</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/lightgbm/topics/lgb.Dataset'>lgb.Dataset</a></span>(<span class='no'>sm</span>, <span class='kw'>label</span> <span class='kw'>=</span>  <span class='no'>HR_data</span>[, <span class='no'>left</span>] <span class='kw'>==</span> <span class='fl'>1</span>)
142 | <span class='no'>params</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/list'>list</a></span>(<span class='kw'>objective</span> <span class='kw'>=</span> <span class='st'>"binary"</span>, <span class='kw'>max_depth</span> <span class='kw'>=</span> <span class='fl'>2</span>)
143 | <span class='no'>lgb_model</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/lightgbm/topics/lgb.train'>lgb.train</a></span>(<span class='no'>params</span>, <span class='no'>train_data</span>, <span class='fl'>25</span>)
144 | 
145 | <span class='no'>lolli</span> <span class='kw'>&lt;-</span> <span class='fu'>lollipop</span>(<span class='no'>lgb_model</span>, <span class='no'>sm</span>)
146 | <span class='fu'><a href='https://www.rdocumentation.org/packages/graphics/topics/plot'>plot</a></span>(<span class='no'>lolli</span>, <span class='kw'>labels</span> <span class='kw'>=</span> <span class='st'>"topAll"</span>, <span class='kw'>log_scale</span> <span class='kw'>=</span> <span class='fl'>TRUE</span>)</div><div class='img'><img src='lollipop-2.png' alt='' width='700' height='433' /></div><div class='input'>
147 | </div><div class='input'>
148 | </div></pre>
149 |   </div>
150 |   <div class="col-md-3 hidden-xs hidden-sm" id="sidebar">
151 |     <h2>Contents</h2>
152 |     <ul class="nav nav-pills nav-stacked">
153 |       <li><a href="#arguments">Arguments</a></li>
154 |       
155 |       <li><a href="#value">Value</a></li>
156 |       
157 |       <li><a href="#examples">Examples</a></li>
158 |     </ul>
159 | 
160 |   </div>
161 | </div>
162 | 
163 |       <footer>
164 |       <div class="copyright">
165 |   <p>Developed by Ewelina Karbowiak, Przemyslaw Biecek.</p>
166 | </div>
167 | 
168 | <div class="pkgdown">
169 |   <p>Site built with <a href="http://hadley.github.io/pkgdown/">pkgdown</a>.</p>
170 | </div>
171 | 
172 |       </footer>
173 |    </div>
174 | 
175 |   </body>
176 | </html>
177 | 
178 | 


--------------------------------------------------------------------------------
/docs/reference/EIX_lollipop.html:
--------------------------------------------------------------------------------
  1 | <!-- Generated by pkgdown: do not edit by hand -->
  2 | <!DOCTYPE html>
  3 | <html>
  4 |   <head>
  5 |   <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | 
  9 | <title>Tables needed for lollipop plot — EIX_lollipop • EIX</title>
 10 | 
 11 | <!-- jquery -->
 12 | <script src="https://code.jquery.com/jquery-3.1.0.min.js" integrity="sha384-nrOSfDHtoPMzJHjVTdCopGqIqeYETSXhZDFyniQ8ZHcVy08QesyHcnOUpMpqnmWq" crossorigin="anonymous"></script>
 13 | <!-- Bootstrap -->
 14 | 
 15 | <link href="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/css/bootstrap.min.css" rel="stylesheet" integrity="sha384-BVYiiSIFeK1dGmJRAkycuHAHRg32OmUcww7on3RYdg4Va+PmSTsz/K68vbdEjh4u" crossorigin="anonymous">
 16 | <script src="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha384-Tc5IQib027qvyjSMfHjOMaLkfuWVxZxUPnCJA7l2mCWNIpG9mGCD8wGNIcPD7Txa" crossorigin="anonymous"></script>
 17 | 
 18 | <!-- Font Awesome icons -->
 19 | <link href="https://maxcdn.bootstrapcdn.com/font-awesome/4.6.3/css/font-awesome.min.css" rel="stylesheet" integrity="sha384-T8Gy5hrqNKT+hzMclPo118YTQO6cYprQmhrYwIiQ/3axmI1hQomh7Ud2hPOy8SP1" crossorigin="anonymous">
 20 | 
 21 | 
 22 | <!-- pkgdown -->
 23 | <link href="../pkgdown.css" rel="stylesheet">
 24 | <script src="../jquery.sticky-kit.min.js"></script>
 25 | <script src="../pkgdown.js"></script>
 26 | <!-- mathjax -->
 27 | <script src='https://mathjax.rstudio.com/latest/MathJax.js?config=TeX-AMS-MML_HTMLorMML'></script>
 28 | 
 29 | <!--[if lt IE 9]>
 30 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 31 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 32 | <![endif]-->
 33 | 
 34 | 
 35 |   </head>
 36 | 
 37 |   <body>
 38 |     <div class="container template-reference-topic">
 39 |       <header>
 40 |       <div class="navbar navbar-default navbar-fixed-top navbar-mi2" role="navigation">
 41 |   <div class="container">
 42 |     <div class="navbar-header">
 43 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar">
 44 |         <span class="icon-bar"></span>
 45 |         <span class="icon-bar"></span>
 46 |         <span class="icon-bar"></span>
 47 |       </button>
 48 | 	  <a class = "navbar-mi2logo" href="http://mi2.mini.pw.edu.pl/">
 49 |         <img src = "https://github.com/mi2-warsaw/MI2template/blob/master/inst/pkgdown/assets/MI2logo.jpg?raw=true" alt = "MI2" height = 46 title = "MI2">
 50 | 	  </a>
 51 |       <a class="navbar-brand navbar-mi2" href="../index.html">Tables needed for lollipop plot</a>
 52 |     </div>
 53 |     <div id="navbar" class="navbar-collapse collapse">
 54 |       <ul class="navbar-mi2 nav navbar-nav">
 55 |         <li>
 56 |   <a href="../index.html">
 57 |     <span class="fa fa-home fa-lg"></span>
 58 |      
 59 |   </a>
 60 | </li>
 61 | <li>
 62 |   <a href="../reference/index.html">Reference</a>
 63 | </li>
 64 |       </ul>
 65 |       
 66 |       <ul class="nav navbar-nav navbar-right">
 67 |         
 68 |       </ul>
 69 |     </div><!--/.nav-collapse -->
 70 |   </div><!--/.container -->
 71 | </div><!--/.navbar -->
 72 | 
 73 |       
 74 |       </header>
 75 | 
 76 |       <div class="row">
 77 |   <div class="col-md-9 contents">
 78 |     <div class="page-header">
 79 |     <h1>Tables needed for lollipop plot</h1>
 80 |     </div>
 81 | 
 82 |     
 83 |     <p>This function calculates two tables needed to generate lollipop plot, which visualise the model.
 84 | The first table contains information about all nodes in the trees forming a model.
 85 | It includes gain value, depth and ID of each nodes.
 86 | The second table contains similarly information about roots in the trees.</p>
 87 |     
 88 | 
 89 |     <pre class="usage"><span class='fu'>EIX_lollipop</span>(<span class='no'>xgb.model</span>, <span class='no'>data</span>)</pre>
 90 |     
 91 |     <h2 class="hasAnchor" id="arguments"><a class="anchor" href="#arguments"></a> Arguments</h2>
 92 |     <table class="ref-arguments">
 93 |     <colgroup><col class="name" /><col class="desc" /></colgroup>
 94 |     <tr>
 95 |       <th>xgb.model</th>
 96 |       <td><p>a xgboost or lightgbm model.</p></td>
 97 |     </tr>
 98 |     <tr>
 99 |       <th>data</th>
100 |       <td><p>a data table with data used to train the model.</p></td>
101 |     </tr>
102 |     </table>
103 |     
104 |     <h2 class="hasAnchor" id="value"><a class="anchor" href="#value"></a>Value</h2>
105 | 
106 |     <p>an object of the lollipop class</p>
107 |     
108 | 
109 |     <h2 class="hasAnchor" id="examples"><a class="anchor" href="#examples"></a>Examples</h2>
110 |     <pre class="examples"><div class='input'><span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/library'>library</a></span>(<span class='st'>"EIX"</span>)
111 | <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/library'>library</a></span>(<span class='st'>"Matrix"</span>)</div><div class='output co'>#&gt; <span class='warning'>Warning: pakiet 'Matrix' został zbudowany w wersji R 3.4.4</span></div><div class='input'><span class='no'>sm</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/Matrix/topics/sparse.model.matrix'>sparse.model.matrix</a></span>(<span class='no'>left</span> ~ <span class='no'>.</span> - <span class='fl'>1</span>,  <span class='kw'>data</span> <span class='kw'>=</span> <span class='no'>HR_data</span>)
112 | 
113 | <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/library'>library</a></span>(<span class='st'>"xgboost"</span>)</div><div class='output co'>#&gt; <span class='warning'>Warning: pakiet 'xgboost' został zbudowany w wersji R 3.4.4</span></div><div class='input'><span class='no'>param</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/list'>list</a></span>(<span class='kw'>objective</span> <span class='kw'>=</span> <span class='st'>"binary:logistic"</span>, <span class='kw'>max_depth</span> <span class='kw'>=</span> <span class='fl'>2</span>)
114 | <span class='no'>xgb.model</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/xgboost/topics/xgb.train'>xgboost</a></span>(<span class='no'>sm</span>, <span class='kw'>params</span> <span class='kw'>=</span> <span class='no'>param</span>, <span class='kw'>label</span> <span class='kw'>=</span> <span class='no'>HR_data</span>[, <span class='no'>left</span>] <span class='kw'>==</span> <span class='fl'>1</span>, <span class='kw'>nrounds</span> <span class='kw'>=</span> <span class='fl'>50</span>)</div><div class='output co'>#&gt; [1]	train-error:0.150077 
115 | #&gt; [2]	train-error:0.098007 
116 | #&gt; [3]	train-error:0.098007 
117 | #&gt; [4]	train-error:0.098007 
118 | #&gt; [5]	train-error:0.098007 
119 | #&gt; [6]	train-error:0.098007 
120 | #&gt; [7]	train-error:0.098007 
121 | #&gt; [8]	train-error:0.095873 
122 | #&gt; [9]	train-error:0.095873 
123 | #&gt; [10]	train-error:0.095606 
124 | #&gt; [11]	train-error:0.095473 
125 | #&gt; [12]	train-error:0.093406 
126 | #&gt; [13]	train-error:0.061271 
127 | #&gt; [14]	train-error:0.059404 
128 | #&gt; [15]	train-error:0.055137 
129 | #&gt; [16]	train-error:0.063271 
130 | #&gt; [17]	train-error:0.043070 
131 | #&gt; [18]	train-error:0.042670 
132 | #&gt; [19]	train-error:0.039203 
133 | #&gt; [20]	train-error:0.038536 
134 | #&gt; [21]	train-error:0.037669 
135 | #&gt; [22]	train-error:0.037869 
136 | #&gt; [23]	train-error:0.036802 
137 | #&gt; [24]	train-error:0.037336 
138 | #&gt; [25]	train-error:0.036602 
139 | #&gt; [26]	train-error:0.036402 
140 | #&gt; [27]	train-error:0.036669 
141 | #&gt; [28]	train-error:0.035802 
142 | #&gt; [29]	train-error:0.035402 
143 | #&gt; [30]	train-error:0.032202 
144 | #&gt; [31]	train-error:0.031869 
145 | #&gt; [32]	train-error:0.031469 
146 | #&gt; [33]	train-error:0.030935 
147 | #&gt; [34]	train-error:0.030602 
148 | #&gt; [35]	train-error:0.030269 
149 | #&gt; [36]	train-error:0.029402 
150 | #&gt; [37]	train-error:0.029269 
151 | #&gt; [38]	train-error:0.028802 
152 | #&gt; [39]	train-error:0.028802 
153 | #&gt; [40]	train-error:0.028535 
154 | #&gt; [41]	train-error:0.028269 
155 | #&gt; [42]	train-error:0.028202 
156 | #&gt; [43]	train-error:0.027935 
157 | #&gt; [44]	train-error:0.027669 
158 | #&gt; [45]	train-error:0.027669 
159 | #&gt; [46]	train-error:0.027402 
160 | #&gt; [47]	train-error:0.028269 
161 | #&gt; [48]	train-error:0.027268 
162 | #&gt; [49]	train-error:0.026668 
163 | #&gt; [50]	train-error:0.026335 </div><div class='input'>
164 | <span class='no'>lolli</span> <span class='kw'>&lt;-</span> <span class='fu'>EIX_lollipop</span>(<span class='no'>xgb.model</span>, <span class='no'>sm</span>)
165 | <span class='fu'><a href='https://www.rdocumentation.org/packages/graphics/topics/plot'>plot</a></span>(<span class='no'>lolli</span>, <span class='kw'>labels</span> <span class='kw'>=</span> <span class='st'>"topAll"</span>, <span class='kw'>log_scale</span> <span class='kw'>=</span> <span class='fl'>TRUE</span>)</div><div class='output co'>#&gt; <span class='warning'>Warning: Transformation introduced infinite values in continuous x-axis</span></div><div class='output co'>#&gt; <span class='warning'>Warning: Transformation introduced infinite values in continuous x-axis</span></div><div class='output co'>#&gt; <span class='warning'>Warning: Transformation introduced infinite values in continuous x-axis</span></div><div class='output co'>#&gt; <span class='warning'>Warning: Transformation introduced infinite values in continuous x-axis</span></div><div class='output co'>#&gt; <span class='warning'>Warning: Transformation introduced infinite values in continuous x-axis</span></div><div class='output co'>#&gt; <span class='warning'>Warning: Transformation introduced infinite values in continuous x-axis</span></div><div class='output co'>#&gt; <span class='warning'>Warning: Removed 7 rows containing missing values (geom_text_repel).</span></div><div class='img'><img src='EIX_lollipop-1.png' alt='' width='700' height='433' /></div><div class='input'>
166 | </div></pre>
167 |   </div>
168 |   <div class="col-md-3 hidden-xs hidden-sm" id="sidebar">
169 |     <h2>Contents</h2>
170 |     <ul class="nav nav-pills nav-stacked">
171 |       <li><a href="#arguments">Arguments</a></li>
172 |       
173 |       <li><a href="#value">Value</a></li>
174 |       
175 |       <li><a href="#examples">Examples</a></li>
176 |     </ul>
177 | 
178 |   </div>
179 | </div>
180 | 
181 |       <footer>
182 |       <div class="copyright">
183 |   <p>Developed by Ewelina Karbowiak, Przemyslaw Biecek.</p>
184 | </div>
185 | 
186 | <div class="pkgdown">
187 |   <p>Site built with <a href="http://hadley.github.io/pkgdown/">pkgdown</a>.</p>
188 | </div>
189 | 
190 |       </footer>
191 |    </div>
192 | 
193 |   </body>
194 | </html>
195 | 
196 | 


--------------------------------------------------------------------------------
/vignettes/EIX.Rmd:
--------------------------------------------------------------------------------
  1 | ---
  2 | title: "EIX: Explain Interactions in XGBoost"
  3 | author: "Ewelina Karbowiak"
  4 | date: "2018-12-07"
  5 | output: rmarkdown::html_vignette
  6 | vignette: >
  7 |   %\VignetteIndexEntry{EIX Explain Interactions in XGBoost}
  8 |   %\VignetteEngine{knitr::rmarkdown}
  9 |   %\VignetteEncoding{UTF-8}
 10 | ---
 11 | 
 12 | ```{r, echo=FALSE}
 13 | knitr::opts_chunk$set(fig.height = 6, fig.width = 6, fig.align = "center")
 14 | 
 15 | ```
 16 | 
 17 | Package `EIX` is a set of tools for exploring the structure of XGBoost and LightGBM models. It includes functions for finding strong interactions and for checking the importance of single variables and interactions using different measures. `EIX` also contains several functions to visualize the results.
 18 | 
 19 | Almost all `EIX` functions require only two parameters: an XGBoost or LightGBM model and the data table used as the training dataset. The exceptions are the `waterfall` function and its plot. The first one requires an XGBoost model and the observation whose prediction has to be explained. These two functions support only XGBoost models. All plots are created with package `ggplot2`. Most of them use plot theme `theme_mi2` from `DALEX`.
 20 | 
 21 | ## Data Info
 22 | 
 23 | This vignette shows the usage of the `EIX` package. It explains an XGBoost model that predicts departures of employees from a company, using HR_data. The dataset was taken from Kaggle and consists of 14999 observations and 10 variables. The dataset is also available in package `EIX`, where it is described in more detail.
 24 | 
 25 | ```{r}
 26 | #devtools :: install_github("ModelOriented/EIX")
 27 | library("EIX")
 28 | set.seed(4)
 29 | knitr::kable(head(HR_data))
 30 | ```
 31 | 
 32 | To create a correct XGBoost model, remember to change categorical features to factors and then convert the data frame to a sparse matrix. The categorical features are one-hot encoded.
 33 | 
 34 | ```{r, warning=FALSE, message=FALSE}
 35 | library("Matrix")
 36 | sparse_matrix <- sparse.model.matrix(left ~ . - 1,  data = HR_data)
 37 | head(sparse_matrix)
 38 | ```
 39 | 
 40 | 
 41 | ## Xgboost model creation
 42 | 
 43 | Package `EIX` uses table, which was generated by `xgboost::xgb.model.dt.tree` with information about trees, their nodes and leaves.
 44 | 
 45 | ```{r}
 46 | library("xgboost")
 47 | param <- list(objective = "binary:logistic", max_depth = 2)
 48 | xgb_model <- xgboost(sparse_matrix, params = param, label = HR_data[, left] == 1, nrounds = 50, verbose = FALSE)
 49 | knitr::kable(head(xgboost::xgb.model.dt.tree(colnames(sparse_matrix),xgb_model)))
 50 | ```
 51 | 
 52 | Function `xgboost::xgb.importance` shows importance of single variables. `EIX` adds new measures of variables’ importance and shows also importance of interactions.
 53 | 
 54 | ```{r}
 55 | knitr::kable(head(xgboost::xgb.importance(colnames(sparse_matrix),xgb_model)))
 56 | ```
 57 | 
 58 | ## Model visualization
 59 | 
 60 | The `lollipop` plot is used to visualize the model in such way that the most important variables and interactions are visible. 
 61 | 
 62 | On the x-axis, there are tree numbers and on the y-axis there is **Gain** measure for each node. One segment is one tree in the model and each point is one node. On the plot there are all nodes, which are not leaves. Shape of points signifies depth of node. All roots on the plot are connected by a red line. If in the same segment there is a variable with a higher depth above the variable with a lower depth, it means that interaction occurs.
 63 | 
 64 | The way of labeling can be changed. On the plot we can see the most important variables in roots (horizontal labels) and interactions (vertical labels); this is the option `labels = "topAll"`, which is the default. Moreover, there are two additional options: `labels = "roots"` for variables in roots only, and `labels = "interactions"` for interactions only. The number of labels visible on the plot can be changed with the parameter `threshold` (range from 0 to 1, default 0.1).
 65 | The plot is on a logarithmic scale because the initial trees usually are the most important. You can change the scale of the plot by setting the parameter `log_scale = FALSE`.
 66 | 
 67 | ```{r}
 68 | lolli<-lollipop(xgb_model,sparse_matrix)
 69 | plot(lolli)
 70 | #plot(lolli, threshold=0.05)
 71 | #plot(lolli, labels="roots")
 72 | #plot(lolli, labels="interactions")
 73 | #plot(lolli, labels="roots", threshold=0.05)
 74 | #plot(lolli, labels="interactions",threshold=0.05)
 75 | #plot(lolli, log_scale = FALSE)
 76 | ```
 77 | 
 78 | 
 79 | ## Interactions
 80 | 
 81 | We can consider interactions in two ways. In the first approach we explore all pairs of variables that occur in the model one above the other. This approach is not the best one, because we cannot tell whether a pair of variables is a real interaction or not. In this approach a high gain of a pair can be the result of a high gain of the lower variable (child). To explore pairs of variables you can generate a table of them using the function `interactions` with the parameter `option = "pairs"`. This table includes the **Gain** measure and the number of occurrences of each pair. You can also use the function `plot` to visualize the **Gain** measure.
 82 | 
 83 | ```{r}
 84 | pairs<-interactions(xgb_model, sparse_matrix, option = "pairs")
 85 | head(pairs)
 86 | plot(pairs)
 87 | ```
 88 | 
 89 | The `interactions` plot is a matrix plot with a child from the pair on the x-axis and the parent on the y-axis. The color of the square at the intersection of two variables means value of **sumGain** measure. The darker square, the higher **sumGain** of variable pairs. The range of **sumGain** measure is divided into four equal parts: `very low, low, medium, high`.
 90 | 
 91 | In second approach, to find strong interactions, we can consider only these pairs of variables, where variable on the bottom (child) has higher gain than variable on the top (parent). We can also create ranking of interactions using function `importance` with parameter `option = "interactions"`. More details in the next section.
 92 | 
 93 | ```{r, warning=FALSE, message=FALSE}
 94 | interactions<-interactions(xgb_model, sparse_matrix, option = "interactions")
 95 | head(interactions)
 96 | plot(interactions)
 97 | ```
 98 | 
 99 | 
100 | ## Variables' and interactions’ importance
101 | 
102 | For exploring variables’ and interactions’ importance there are three functions in `EIX` package: `importance`, its `plot` with parameter `radar = TRUE` or `radar = FALSE`.
103 | With the `EIX` package we can compare the importance of single variables and interactions. The function `importance` can return three kinds of outputs, depending on the `option` parameter:
104 | 
105 |  * `option = "variables"` - it consists only single variables
106 | 
107 |  * `option = "interactions"`- only interactions
108 | 
109 |  * `option = "both"`-  output shows importance both single variables and interactions.
110 |  
111 |  NOTE: `option = "both"` is not a direct combination of `option = "variables"` and `option = "interactions"`, because the importance values of variables that occurred in interactions are not included in the importance of the single variables.
112 | 
113 | In `EIX` the following measures are available:
114 | 
115 | * **sumGain** - sum of Gain value in all nodes, in which given variable occurs
116 | * **sumCover** - sum of Cover value in all nodes, in which given variable occurs; for LightGBM models: number of observation, which pass through the node
117 | * **mean5Gain** - mean gain from 5 occurrences of given variable with the highest gain
118 | * **meanGain** - mean Gain value in all nodes, in which given variable occurs
119 | * **meanCover** - mean Cover value in all nodes, in which given variable occurs; for LightGBM models: mean number of observation, which pass through the node
120 | * **freqency** - number of occurrences in the nodes for given variable
121 | 
122 | `EIX` package gives additionally measures of variables importance for single variable:
123 | 
124 | * **counterRoot** - number of occurrences in the root
125 | * **weightedRoot**  - mean number of occurrences in the root, which is weighted by gain
126 | * **meanDepth** - mean depth weighted by gain
127 | 
128 | The function `importance` returns a table with all available importance measures for given option. 
129 | The table is sorted by descending value of **sumGain**.
130 | 
131 | The function `plot` with parameter  `radar = FALSE` and a result from the `importance` function as an argument  shows two measures of importance, which can be chosen by `xmeasure` and `ymeasure` parameters. By parameter `top` we can decide how many positions will be included in the plot.
132 | 
133 | ```{r}
134 | importance<-importance(xgb_model, sparse_matrix, option = "both")
135 | head(importance)
136 | plot(importance, radar=FALSE)
137 | #plot(importance,  xmeasure = "mean5Gain", ymeasure = "sumGain",  top = 15, radar=FALSE)
138 | ```
139 | 
140 | The function `plot` with parameter `radar = TRUE` enables to compare different measures of variables and interactions importance on the radar plot from `ggiraphExtra` package.
141 | Below is an example of a radar plot. On the outside of the circle there are names of variables or interactions. Colored lines represent various measures of importance. The positions on the plot are sorted in decreasing order. The variable with the highest **sumGain** value is to the right of 12 o'clock. The **sumGain** value then decreases in a clockwise direction. It is possible to change the place where the feature names start with the parameter `text_start_point` (range from 0 to 1, default 0.5), and the size of this text with the parameter `text_size`.
142 | 
143 | ```{r}
144 | plot(importance)
145 | #plot(importance, text_start_point = 0.3)
146 | #plot(importance, text_size = 4)
147 | #plot(importance, top=15)
148 | ```
149 | 
150 | ## Explanation of single prediction including interactions
151 | 
152 | To explain a single prediction, package `EIX` uses two packages: `xgboostExplainer` and `breakDown`. The package `xgboostExplainer` is a tool for interpreting predictions of an xgboost model. The package `EIX` uses its code and modifies it to include interactions. The methodology of plot creation comes from package `breakDown`.
153 | 
154 | The function `waterfall` returns a table with the variables’ impact on the prediction of the model. Depending on the parameter `option`, the table includes interactions (`option = "interactions"` - default) or does not (`option = "variables"`). The function `plot` with a `waterfall` object as an argument visualizes this table. On the y-axis there are: the intercept (the probability that a random observation from the training dataset will be 1), the variables (which have an impact on the prediction) and the final prognosis of the model. On the x-axis there is the impact of each variable in log-odds.
155 | 
156 | ```{r}
157 | data <- HR_data[9,]
158 | new_observation <- sparse_matrix[9,]
159 | wf<-waterfall(xgb_model, new_observation, data, option = "interactions")
160 | wf
161 | plot(wf)
162 | #wf<-waterfall(xgb_model, new_observation, data, option = "interactions", baseline = "intercept")
163 | #wf
164 | #plot(wf)
165 | ```
166 | 


--------------------------------------------------------------------------------
/docs/reference/plot.lollipop.html:
--------------------------------------------------------------------------------
  1 | <!-- Generated by pkgdown: do not edit by hand -->
  2 | <!DOCTYPE html>
  3 | <html>
  4 |   <head>
  5 |   <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | 
  9 | <title>Visualiation of the model — plot.lollipop • EIX</title>
 10 | 
 11 | <!-- jquery -->
 12 | <script src="https://code.jquery.com/jquery-3.1.0.min.js" integrity="sha384-nrOSfDHtoPMzJHjVTdCopGqIqeYETSXhZDFyniQ8ZHcVy08QesyHcnOUpMpqnmWq" crossorigin="anonymous"></script>
 13 | <!-- Bootstrap -->
 14 | 
 15 | <link href="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/css/bootstrap.min.css" rel="stylesheet" integrity="sha384-BVYiiSIFeK1dGmJRAkycuHAHRg32OmUcww7on3RYdg4Va+PmSTsz/K68vbdEjh4u" crossorigin="anonymous">
 16 | <script src="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha384-Tc5IQib027qvyjSMfHjOMaLkfuWVxZxUPnCJA7l2mCWNIpG9mGCD8wGNIcPD7Txa" crossorigin="anonymous"></script>
 17 | 
 18 | <!-- Font Awesome icons -->
 19 | <link href="https://maxcdn.bootstrapcdn.com/font-awesome/4.6.3/css/font-awesome.min.css" rel="stylesheet" integrity="sha384-T8Gy5hrqNKT+hzMclPo118YTQO6cYprQmhrYwIiQ/3axmI1hQomh7Ud2hPOy8SP1" crossorigin="anonymous">
 20 | 
 21 | 
 22 | <!-- pkgdown -->
 23 | <link href="../pkgdown.css" rel="stylesheet">
 24 | <script src="../jquery.sticky-kit.min.js"></script>
 25 | <script src="../pkgdown.js"></script>
 26 | <!-- mathjax -->
 27 | <script src='https://mathjax.rstudio.com/latest/MathJax.js?config=TeX-AMS-MML_HTMLorMML'></script>
 28 | 
 29 | <!--[if lt IE 9]>
 30 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 31 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 32 | <![endif]-->
 33 | 
 34 | 
 35 |   </head>
 36 | 
 37 |   <body>
 38 |     <div class="container template-reference-topic">
 39 |       <header>
 40 |       <div class="navbar navbar-default navbar-fixed-top navbar-mi2" role="navigation">
 41 |   <div class="container">
 42 |     <div class="navbar-header">
 43 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar">
 44 |         <span class="icon-bar"></span>
 45 |         <span class="icon-bar"></span>
 46 |         <span class="icon-bar"></span>
 47 |       </button>
 48 | 	  <a class = "navbar-mi2logo" href="http://mi2.mini.pw.edu.pl/">
 49 |         <img src = "https://github.com/mi2-warsaw/MI2template/blob/master/inst/pkgdown/assets/MI2logo.jpg?raw=true" alt = "MI2" height = 46 title = "MI2">
 50 | 	  </a>
 51 |       <a class="navbar-brand navbar-mi2" href="../index.html">Visualiation of the model</a>
 52 |     </div>
 53 |     <div id="navbar" class="navbar-collapse collapse">
 54 |       <ul class="navbar-mi2 nav navbar-nav">
 55 |         <li>
 56 |   <a href="../index.html">
 57 |     <span class="fa fa-home fa-lg"></span>
 58 |      
 59 |   </a>
 60 | </li>
 61 | <li>
 62 |   <a href="../articles/EIX.html">Get started</a>
 63 | </li>
 64 | <li>
 65 |   <a href="../reference/index.html">Reference</a>
 66 | </li>
 67 | <li class="dropdown">
 68 |   <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-expanded="false">
 69 |     Articles
 70 |      
 71 |     <span class="caret"></span>
 72 |   </a>
 73 |   <ul class="dropdown-menu" role="menu">
 74 |     <li>
 75 |       <a href="../articles/titanic_data.html">EIX: Titanic data </a>
 76 |     </li>
 77 |   </ul>
 78 | </li>
 79 |       </ul>
 80 |       
 81 |       <ul class="nav navbar-nav navbar-right">
 82 |         <li>
 83 |   <a href="https://github.com/ModelOriented/EIX">
 84 |     <span class="fa fa-github fa-lg"></span>
 85 |      
 86 |   </a>
 87 | </li>
 88 |       </ul>
 89 |     </div><!--/.nav-collapse -->
 90 |   </div><!--/.container -->
 91 | </div><!--/.navbar -->
 92 | 
 93 |       
 94 |       </header>
 95 | 
 96 |       <div class="row">
 97 |   <div class="col-md-9 contents">
 98 |     <div class="page-header">
 99 |     <h1>Visualiation of the model</h1>
100 |     </div>
101 | 
102 |     
103 |     <p>The lollipop plots the model with the most important interactions and variables in the roots.</p>
104 |     
105 | 
106 |     <pre class="usage"><span class='co'># S3 method for lollipop</span>
107 | <span class='fu'><a href='https://www.rdocumentation.org/packages/graphics/topics/plot'>plot</a></span>(<span class='no'>x</span>, <span class='no'>...</span>, <span class='kw'>labels</span> <span class='kw'>=</span> <span class='st'>"topAll"</span>, <span class='kw'>log_scale</span> <span class='kw'>=</span> <span class='fl'>TRUE</span>,
108 |   <span class='kw'>threshold</span> <span class='kw'>=</span> <span class='fl'>0.1</span>)</pre>
109 |     
110 |     <h2 class="hasAnchor" id="arguments"><a class="anchor" href="#arguments"></a> Arguments</h2>
111 |     <table class="ref-arguments">
112 |     <colgroup><col class="name" /><col class="desc" /></colgroup>
113 |     <tr>
114 |       <th>x</th>
115 |       <td><p>a result from the <code>lollipop</code> function.</p></td>
116 |     </tr>
117 |     <tr>
118 |       <th>...</th>
119 |       <td><p>other parameters.</p></td>
120 |     </tr>
121 |     <tr>
122 |       <th>labels</th>
123 |       <td><p>if "topAll" then labels for the most important interactions (vertical label)
124 | and variables in the roots (horizontal label) will be displayed,
125 | if "interactions" then labels for all interactions,
126 | if "roots" then labels for all variables in the root.</p></td>
127 |     </tr>
128 |     <tr>
129 |       <th>log_scale</th>
130 |       <td><p>TRUE/FALSE logarithmic scale on the plot. Default TRUE.</p></td>
131 |     </tr>
132 |     <tr>
133 |       <th>threshold</th>
134 |       <td><p>only labels with Gain higher than <code>threshold</code> times the maximum Gain value in the model are displayed on the plot.
135 | The lower the threshold, the more labels on the plot. Range from 0 to 1. Default 0.1.</p></td>
136 |     </tr>
137 |     </table>
138 |     
139 |     <h2 class="hasAnchor" id="value"><a class="anchor" href="#value"></a>Value</h2>
140 | 
141 |     <p>a ggplot object</p>
142 |     
143 | 
144 |     <h2 class="hasAnchor" id="examples"><a class="anchor" href="#examples"></a>Examples</h2>
145 |     <pre class="examples"><div class='input'><span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/library'>library</a></span>(<span class='st'>"EIX"</span>)
146 | <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/library'>library</a></span>(<span class='st'>"Matrix"</span>)
147 | <span class='no'>sm</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/Matrix/topics/sparse.model.matrix'>sparse.model.matrix</a></span>(<span class='no'>left</span> ~ <span class='no'>.</span> - <span class='fl'>1</span>,  <span class='kw'>data</span> <span class='kw'>=</span> <span class='no'>HR_data</span>)
148 | 
149 | <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/library'>library</a></span>(<span class='st'>"xgboost"</span>)
150 | <span class='no'>param</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/list'>list</a></span>(<span class='kw'>objective</span> <span class='kw'>=</span> <span class='st'>"binary:logistic"</span>, <span class='kw'>max_depth</span> <span class='kw'>=</span> <span class='fl'>2</span>)
151 | <span class='no'>xgb_model</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/xgboost/topics/xgb.train'>xgboost</a></span>(<span class='no'>sm</span>, <span class='kw'>params</span> <span class='kw'>=</span> <span class='no'>param</span>, <span class='kw'>label</span> <span class='kw'>=</span> <span class='no'>HR_data</span>[, <span class='no'>left</span>] <span class='kw'>==</span> <span class='fl'>1</span>, <span class='kw'>nrounds</span> <span class='kw'>=</span> <span class='fl'>25</span>, <span class='kw'>verbose</span> <span class='kw'>=</span> <span class='fl'>0</span>)
152 | 
153 | <span class='no'>lolli</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='lollipop.html'>lollipop</a></span>(<span class='no'>xgb_model</span>, <span class='no'>sm</span>)
154 | <span class='fu'><a href='https://www.rdocumentation.org/packages/graphics/topics/plot'>plot</a></span>(<span class='no'>lolli</span>, <span class='kw'>labels</span> <span class='kw'>=</span> <span class='st'>"topAll"</span>, <span class='kw'>log_scale</span> <span class='kw'>=</span> <span class='fl'>TRUE</span>)</div><div class='img'><img src='plot.lollipop-1.png' alt='' width='700' height='433' /></div><div class='input'>
155 | </div><div class='input'><span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/library'>library</a></span>(<span class='no'>lightgbm</span>)
156 | <span class='no'>train_data</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/lightgbm/topics/lgb.Dataset'>lgb.Dataset</a></span>(<span class='no'>sm</span>, <span class='kw'>label</span> <span class='kw'>=</span>  <span class='no'>HR_data</span>[, <span class='no'>left</span>] <span class='kw'>==</span> <span class='fl'>1</span>)
157 | <span class='no'>params</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/list'>list</a></span>(<span class='kw'>objective</span> <span class='kw'>=</span> <span class='st'>"binary"</span>, <span class='kw'>max_depth</span> <span class='kw'>=</span> <span class='fl'>3</span>)
158 | <span class='no'>lgb_model</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/lightgbm/topics/lgb.train'>lgb.train</a></span>(<span class='no'>params</span>, <span class='no'>train_data</span>, <span class='fl'>25</span>)
159 | 
160 | <span class='no'>lolli</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='lollipop.html'>lollipop</a></span>(<span class='no'>lgb_model</span>, <span class='no'>sm</span>)
161 | <span class='fu'><a href='https://www.rdocumentation.org/packages/graphics/topics/plot'>plot</a></span>(<span class='no'>lolli</span>, <span class='kw'>labels</span> <span class='kw'>=</span> <span class='st'>"topAll"</span>, <span class='kw'>log_scale</span> <span class='kw'>=</span> <span class='fl'>TRUE</span>)</div><div class='img'><img src='plot.lollipop-2.png' alt='' width='700' height='433' /></div><div class='input'>
162 | </div></pre>
163 |   </div>
164 |   <div class="col-md-3 hidden-xs hidden-sm" id="sidebar">
165 |     <h2>Contents</h2>
166 |     <ul class="nav nav-pills nav-stacked">
167 |       <li><a href="#arguments">Arguments</a></li>
168 |       
169 |       <li><a href="#value">Value</a></li>
170 |       
171 |       <li><a href="#examples">Examples</a></li>
172 |     </ul>
173 | 
174 |   </div>
175 | </div>
176 | 
177 |       <footer>
178 |       <div class="copyright">
179 |   <p>Developed by Ewelina Karbowiak, Przemyslaw Biecek.</p>
180 | </div>
181 | 
182 | <div class="pkgdown">
183 |   <p>Site built with <a href="http://hadley.github.io/pkgdown/">pkgdown</a>.</p>
184 | </div>
185 | 
186 |       </footer>
187 |    </div>
188 | 
189 |   </body>
190 | </html>
191 | 
192 | 


--------------------------------------------------------------------------------
/docs/reference/waterfall.html:
--------------------------------------------------------------------------------
  1 | <!-- Generated by pkgdown: do not edit by hand -->
  2 | <!DOCTYPE html>
  3 | <html>
  4 |   <head>
  5 |   <meta charset="utf-8">
  6 | <meta http-equiv="X-UA-Compatible" content="IE=edge">
  7 | <meta name="viewport" content="width=device-width, initial-scale=1.0">
  8 | 
  9 | <title>Explain prediction of a single observation — waterfall • EIX</title>
 10 | 
 11 | <!-- jquery -->
 12 | <script src="https://code.jquery.com/jquery-3.1.0.min.js" integrity="sha384-nrOSfDHtoPMzJHjVTdCopGqIqeYETSXhZDFyniQ8ZHcVy08QesyHcnOUpMpqnmWq" crossorigin="anonymous"></script>
 13 | <!-- Bootstrap -->
 14 | 
 15 | <link href="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/css/bootstrap.min.css" rel="stylesheet" integrity="sha384-BVYiiSIFeK1dGmJRAkycuHAHRg32OmUcww7on3RYdg4Va+PmSTsz/K68vbdEjh4u" crossorigin="anonymous">
 16 | <script src="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.7/js/bootstrap.min.js" integrity="sha384-Tc5IQib027qvyjSMfHjOMaLkfuWVxZxUPnCJA7l2mCWNIpG9mGCD8wGNIcPD7Txa" crossorigin="anonymous"></script>
 17 | 
 18 | <!-- Font Awesome icons -->
 19 | <link href="https://maxcdn.bootstrapcdn.com/font-awesome/4.6.3/css/font-awesome.min.css" rel="stylesheet" integrity="sha384-T8Gy5hrqNKT+hzMclPo118YTQO6cYprQmhrYwIiQ/3axmI1hQomh7Ud2hPOy8SP1" crossorigin="anonymous">
 20 | 
 21 | 
 22 | <!-- pkgdown -->
 23 | <link href="../pkgdown.css" rel="stylesheet">
 24 | <script src="../jquery.sticky-kit.min.js"></script>
 25 | <script src="../pkgdown.js"></script>
 26 | <!-- mathjax -->
 27 | <script src='https://mathjax.rstudio.com/latest/MathJax.js?config=TeX-AMS-MML_HTMLorMML'></script>
 28 | 
 29 | <!--[if lt IE 9]>
 30 | <script src="https://oss.maxcdn.com/html5shiv/3.7.3/html5shiv.min.js"></script>
 31 | <script src="https://oss.maxcdn.com/respond/1.4.2/respond.min.js"></script>
 32 | <![endif]-->
 33 | 
 34 | 
 35 |   </head>
 36 | 
 37 |   <body>
 38 |     <div class="container template-reference-topic">
 39 |       <header>
 40 |       <div class="navbar navbar-default navbar-fixed-top navbar-mi2" role="navigation">
 41 |   <div class="container">
 42 |     <div class="navbar-header">
 43 |       <button type="button" class="navbar-toggle collapsed" data-toggle="collapse" data-target="#navbar">
 44 |         <span class="icon-bar"></span>
 45 |         <span class="icon-bar"></span>
 46 |         <span class="icon-bar"></span>
 47 |       </button>
 48 | 	  <a class = "navbar-mi2logo" href="http://mi2.mini.pw.edu.pl/">
 49 |         <img src = "https://github.com/mi2-warsaw/MI2template/blob/master/inst/pkgdown/assets/MI2logo.jpg?raw=true" alt = "MI2" height = 46 title = "MI2">
 50 | 	  </a>
 51 |       <a class="navbar-brand navbar-mi2" href="../index.html">Explain prediction of a single observation</a>
 52 |     </div>
 53 |     <div id="navbar" class="navbar-collapse collapse">
 54 |       <ul class="navbar-mi2 nav navbar-nav">
 55 |         <li>
 56 |   <a href="../index.html">
 57 |     <span class="fa fa-home fa-lg"></span>
 58 |      
 59 |   </a>
 60 | </li>
 61 | <li>
 62 |   <a href="../articles/EIX.html">Get started</a>
 63 | </li>
 64 | <li>
 65 |   <a href="../reference/index.html">Reference</a>
 66 | </li>
 67 | <li class="dropdown">
 68 |   <a href="#" class="dropdown-toggle" data-toggle="dropdown" role="button" aria-expanded="false">
 69 |     Articles
 70 |      
 71 |     <span class="caret"></span>
 72 |   </a>
 73 |   <ul class="dropdown-menu" role="menu">
 74 |     <li>
 75 |       <a href="../articles/titanic_data.html">EIX: Titanic data </a>
 76 |     </li>
 77 |   </ul>
 78 | </li>
 79 |       </ul>
 80 |       
 81 |       <ul class="nav navbar-nav navbar-right">
 82 |         <li>
 83 |   <a href="https://github.com/ModelOriented/EIX">
 84 |     <span class="fa fa-github fa-lg"></span>
 85 |      
 86 |   </a>
 87 | </li>
 88 |       </ul>
 89 |     </div><!--/.nav-collapse -->
 90 |   </div><!--/.container -->
 91 | </div><!--/.navbar -->
 92 | 
 93 |       
 94 |       </header>
 95 | 
 96 |       <div class="row">
 97 |   <div class="col-md-9 contents">
 98 |     <div class="page-header">
 99 |     <h1>Explain prediction of a single observation</h1>
100 |     </div>
101 | 
102 |     
103 |     <p>This function calculates a table with influence of variables and interactions
104 | on the prediction of a given observation. It supports only xgboost models.</p>
105 |     
106 | 
107 |     <pre class="usage"><span class='fu'>waterfall</span>(<span class='no'>xgb_model</span>, <span class='no'>new_observation</span>, <span class='no'>data</span>, <span class='kw'>type</span> <span class='kw'>=</span> <span class='st'>"binary"</span>,
108 |   <span class='kw'>option</span> <span class='kw'>=</span> <span class='st'>"interactions"</span>, <span class='kw'>baseline</span> <span class='kw'>=</span> <span class='fl'>0</span>)</pre>
109 |     
110 |     <h2 class="hasAnchor" id="arguments"><a class="anchor" href="#arguments"></a> Arguments</h2>
111 |     <table class="ref-arguments">
112 |     <colgroup><col class="name" /><col class="desc" /></colgroup>
113 |     <tr>
114 |       <th>xgb_model</th>
115 |       <td><p>an xgboost model.</p></td>
116 |     </tr>
117 |     <tr>
118 |       <th>new_observation</th>
119 |       <td><p>a new observation.</p></td>
120 |     </tr>
121 |     <tr>
122 |       <th>data</th>
123 |       <td><p>row from the original dataset with the new observation to explain (not one-hot-encoded).
124 | The param above has to be set to merge categorical features.
125 | If you don't want to merge categorical features, set this parameter the same as <code>new_observation</code>.</p></td>
126 |     </tr>
127 |     <tr>
128 |       <th>type</th>
129 |       <td><p>the learning task of the model. Available tasks: "binary" for binary classification  or "regression" for linear regression.</p></td>
130 |     </tr>
131 |     <tr>
132 |       <th>option</th>
133 |       <td><p>if "variables", the plot includes only single variables,
134 | if "interactions", then only interactions.
135 | Default "interactions".</p></td>
136 |     </tr>
137 |     <tr>
138 |       <th>baseline</th>
139 |       <td><p>a number or a character "Intercept" (for model intercept).
140 | The baseline for the plot, where the rectangles should start.
141 | Default 0.</p></td>
142 |     </tr>
143 |     </table>
144 |     
145 |     <h2 class="hasAnchor" id="value"><a class="anchor" href="#value"></a>Value</h2>
146 | 
147 |     <p>an object of the broken class</p>
148 |     
149 |     <h2 class="hasAnchor" id="details"><a class="anchor" href="#details"></a>Details</h2>
150 | 
151 |     <p>The function contains code or pieces of code
152 | from <code>breakDown</code> code created by Przemysław Biecek
153 | and <code>xgboostExplainer</code> code created by David Foster.</p>
154 |     
155 | 
156 |     <h2 class="hasAnchor" id="examples"><a class="anchor" href="#examples"></a>Examples</h2>
157 |     <pre class="examples"><div class='input'>
158 | </div><div class='input'><span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/library'>library</a></span>(<span class='st'>"EIX"</span>)
159 | <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/library'>library</a></span>(<span class='st'>"Matrix"</span>)
160 | <span class='no'>sm</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/Matrix/topics/sparse.model.matrix'>sparse.model.matrix</a></span>(<span class='no'>left</span> ~ <span class='no'>.</span> - <span class='fl'>1</span>,  <span class='kw'>data</span> <span class='kw'>=</span> <span class='no'>HR_data</span>)
161 | 
162 | <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/library'>library</a></span>(<span class='st'>"xgboost"</span>)
163 | <span class='no'>param</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/base/topics/list'>list</a></span>(<span class='kw'>objective</span> <span class='kw'>=</span> <span class='st'>"binary:logistic"</span>, <span class='kw'>max_depth</span> <span class='kw'>=</span> <span class='fl'>2</span>)
164 | <span class='no'>xgb_model</span> <span class='kw'>&lt;-</span> <span class='fu'><a href='https://www.rdocumentation.org/packages/xgboost/topics/xgb.train'>xgboost</a></span>(<span class='no'>sm</span>, <span class='kw'>params</span> <span class='kw'>=</span> <span class='no'>param</span>, <span class='kw'>label</span> <span class='kw'>=</span> <span class='no'>HR_data</span>[, <span class='no'>left</span>] <span class='kw'>==</span> <span class='fl'>1</span>, <span class='kw'>nrounds</span> <span class='kw'>=</span> <span class='fl'>25</span>, <span class='kw'>verbose</span><span class='kw'>=</span><span class='fl'>0</span>)
165 | 
166 | <span class='no'>data</span> <span class='kw'>&lt;-</span> <span class='no'>HR_data</span>[<span class='fl'>9</span>,-<span class='fl'>7</span>]
167 | <span class='no'>new_observation</span> <span class='kw'>&lt;-</span> <span class='no'>sm</span>[<span class='fl'>9</span>,]
168 | 
169 | <span class='no'>wf</span> <span class='kw'>&lt;-</span> <span class='fu'>waterfall</span>(<span class='no'>xgb_model</span>, <span class='no'>new_observation</span>, <span class='no'>data</span>,  <span class='kw'>option</span> <span class='kw'>=</span> <span class='st'>"interactions"</span>)
170 | <span class='no'>wf</span></div><div class='output co'>#&gt;                                                         contribution
171 | #&gt; xgboost: intercept                                            -1.492
172 | #&gt; xgboost: time_spend_company = 5                                1.360
173 | #&gt; xgboost: last_evaluation = 1                                   1.093
174 | #&gt; xgboost: Work_accident = 0                                    -0.423
175 | #&gt; xgboost: satisfaction_level = 0.89                            -0.390
176 | #&gt; xgboost: last_evaluation:time_spend_company = 1:5              0.297
177 | #&gt; xgboost: last_evaluation:average_montly_hours = 1:224          0.227
178 | #&gt; xgboost: satisfaction_level:time_spend_company = 0.89:5        0.223
179 | #&gt; xgboost: number_project = 5                                   -0.211
180 | #&gt; xgboost: average_montly_hours:last_evaluation = 224:1         -0.156
181 | #&gt; xgboost: average_montly_hours = 224                           -0.096
182 | #&gt; xgboost: time_spend_company:last_evaluation = 5:1              0.095
183 | #&gt; xgboost: salary = 2                                            0.074
184 | #&gt; xgboost: satisfaction_level:number_project = 0.89:5           -0.003
185 | #&gt; xgboost: prediction                                            0.597</div><div class='input'>
186 | <span class='fu'><a href='https://www.rdocumentation.org/packages/graphics/topics/plot'>plot</a></span>(<span class='no'>wf</span>)</div><div class='img'><img src='waterfall-1.png' alt='' width='700' height='433' /></div><div class='input'>
187 | </div></pre>
188 |   </div>
189 |   <div class="col-md-3 hidden-xs hidden-sm" id="sidebar">
190 |     <h2>Contents</h2>
191 |     <ul class="nav nav-pills nav-stacked">
192 |       <li><a href="#arguments">Arguments</a></li>
193 |       
194 |       <li><a href="#value">Value</a></li>
195 | 
196 |       <li><a href="#details">Details</a></li>
197 |       
198 |       <li><a href="#examples">Examples</a></li>
199 |     </ul>
200 | 
201 |   </div>
202 | </div>
203 | 
204 |       <footer>
205 |       <div class="copyright">
206 |   <p>Developed by Ewelina Karbowiak, Przemyslaw Biecek.</p>
207 | </div>
208 | 
209 | <div class="pkgdown">
210 |   <p>Site built with <a href="http://hadley.github.io/pkgdown/">pkgdown</a>.</p>
211 | </div>
212 | 
213 |       </footer>
214 |    </div>
215 | 
216 |   </body>
217 | </html>
218 | 
219 | 


--------------------------------------------------------------------------------