├── tests
│   ├── __init__.py
│   ├── __main__.py
│   ├── conftest.py
│   ├── utils
│   │   ├── test_btree.py
│   │   └── test_concordance.py
│   └── test_generate_datasets.py
├── docs
│   ├── docs_requirements.txt
│   ├── _static
│   │   └── custom.css
│   ├── images
│   │   ├── badfit.png
│   │   ├── goodfit.png
│   │   ├── qq_plot.png
│   │   ├── flat_plot.png
│   │   ├── kmf_mcas.png
│   │   ├── add_at_risk.png
│   │   ├── ci_show_plot.png
│   │   ├── coxph_plot.png
│   │   ├── normal_plot.png
│   │   ├── invert_y_axis.png
│   │   ├── lcd_parametric.png
│   │   ├── lifetimes_mcas.png
│   │   ├── lls_democracy.png
│   │   ├── quickstart_aaf.png
│   │   ├── quickstart_kmf.png
│   │   ├── lls_regime_type.png
│   │   ├── quickstart_multi.png
│   │   ├── show_censors_plot.png
│   │   ├── survival_weibull.png
│   │   ├── lifelines_intro_lcd.png
│   │   ├── quickstart_kmf_cdf.png
│   │   ├── weibull_aft_forest.png
│   │   ├── coxph_plot_quickstart.png
│   │   ├── quickstart_predict_aaf.png
│   │   ├── single_at_risk_plots.png
│   │   ├── waft_plot_quickstart.png
│   │   ├── weibull_aft_two_models.png
│   │   ├── weibull_extrapolation.png
│   │   ├── survival_regression_aaf.png
│   │   ├── coxph_plot_covarite_groups.png
│   │   ├── lifelines_intro_all_regimes.png
│   │   ├── lifelines_intro_kmf_curve.png
│   │   ├── lifelines_intro_kmf_fitter.png
│   │   ├── lifelines_intro_naf_fitter.png
│   │   ├── survival_regression_harper.png
│   │   ├── waltons_cumulative_hazard.png
│   │   ├── waltons_survival_function.png
│   │   ├── lifelines_intro_multi_kmf_fitter.png
│   │   ├── lifelines_intro_naf_fitter_multi.png
│   │   ├── lifelines_intro_naf_smooth_multi.png
│   │   ├── survival_regression_conditioning.png
│   │   ├── lifelines_intro_multi_kmf_fitter_2.png
│   │   ├── lifelines_intro_naf_smooth_multi_2.png
│   │   ├── survival_analysis_intro_censoring.png
│   │   ├── weibull_aft_two_models_side_by_side.png
│   │   ├── survival_analysis_intro_censoring_revealed.png
│   │   └── survival_regression_conditioning_with_median.png
│   ├── lifelines.utils.rst
│   ├── lifelines.datasets.rst
│   ├── lifelines.plotting.rst
│   ├── lifelines.statistics.rst
│   ├── References.rst
│   ├── index.rst
│   ├── lifelines.fitters.rst
│   ├── Makefile
│   ├── Survival Analysis intro.rst
│   └── conf.py
├── .coveragerc
├── reqs
│   ├── travis-requirements.txt
│   ├── base-requirements.txt
│   ├── docs-requirements.txt
│   └── dev-requirements.txt
├── lifelines
│   ├── version.py
│   ├── datasets
│   │   ├── static_test.csv
│   │   ├── holly_molly_polly.tsv
│   │   ├── psychiatric_patients.csv
│   │   ├── panel_test.csv
│   │   ├── gehan.dat
│   │   ├── g3.csv
│   │   ├── anderson.csv
│   │   ├── lymphoma.csv
│   │   ├── larynx.csv
│   │   ├── multicenter_aids_cohort.tsv
│   │   ├── CuZn-LeftCensoredDataset.csv
│   │   ├── dfcv_dataset.py
│   │   ├── waltons_dataset.csv
│   │   ├── nh4.csv
│   │   ├── regression.csv
│   │   ├── stanford_heart.csv
│   │   ├── lung.csv
│   │   └── rossi.csv
│   ├── utils
│   │   ├── logsf.py
│   │   ├── lowess.py
│   │   ├── gamma.py
│   │   └── btree.py
│   ├── __init__.py
│   └── fitters
│       ├── exponential_fitter.py
│       ├── log_normal_fitter.py
│       ├── log_logistic_fitter.py
│       ├── weibull_fitter.py
│       ├── breslow_fleming_harrington_fitter.py
│       ├── piecewise_exponential_fitter.py
│       ├── weibull_aft_fitter.py
│       ├── log_logistic_aft_fitter.py
│       └── log_normal_aft_fitter.py
├── MANIFEST.in
├── .gitignore
├── examples
│   └── README.md
├── .pre-commit-config.yaml
├── perf_tests
│   ├── aaf_perf_test.py
│   ├── cp_perf_test.py
│   ├── lognormal_perf_test.py
│   ├── ctv_perf_test.py
│   ├── weibull_aft_perf.py
│   ├── weibull_perf_test.py
│   └── batch_vs_single.py
├── Makefile
├── .travis.yml
├── experiments
│   ├── aalen_and_cook_simulation.py
│   ├── detection_limits.py
│   └── left_censoring_experiments.py
├── .prospector.yaml
├── LICENSE
├── setup.py
├── CONTRIBUTING.md
├── README.md
└── paper
    ├── paper.md
    └── paper.bib
/tests/__init__.py:
--------------------------------------------------------------------------------
1 | 
-------------------------------------------------------------------------------- /docs/docs_requirements.txt: -------------------------------------------------------------------------------- 1 | -r ../reqs/docs-requirements.txt -------------------------------------------------------------------------------- /docs/_static/custom.css: -------------------------------------------------------------------------------- 1 | .wy-nav-content { 2 | max-width: 900px !important; 3 | } 4 | -------------------------------------------------------------------------------- /.coveragerc: -------------------------------------------------------------------------------- 1 | # .coveragerc to control coverage.py 2 | [run] 3 | omit = 4 | lifelines/plotting.py 5 | -------------------------------------------------------------------------------- /docs/images/badfit.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/badfit.png -------------------------------------------------------------------------------- /docs/images/goodfit.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/goodfit.png -------------------------------------------------------------------------------- /docs/images/qq_plot.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/qq_plot.png -------------------------------------------------------------------------------- /docs/images/flat_plot.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/flat_plot.png -------------------------------------------------------------------------------- /docs/images/kmf_mcas.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/kmf_mcas.png -------------------------------------------------------------------------------- /docs/images/add_at_risk.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/add_at_risk.png -------------------------------------------------------------------------------- /docs/images/ci_show_plot.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/ci_show_plot.png -------------------------------------------------------------------------------- /docs/images/coxph_plot.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/coxph_plot.png -------------------------------------------------------------------------------- /docs/images/normal_plot.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/normal_plot.png -------------------------------------------------------------------------------- /docs/images/invert_y_axis.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/invert_y_axis.png 
-------------------------------------------------------------------------------- /docs/images/lcd_parametric.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/lcd_parametric.png -------------------------------------------------------------------------------- /docs/images/lifetimes_mcas.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/lifetimes_mcas.png -------------------------------------------------------------------------------- /docs/images/lls_democracy.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/lls_democracy.png -------------------------------------------------------------------------------- /docs/images/quickstart_aaf.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/quickstart_aaf.png -------------------------------------------------------------------------------- /docs/images/quickstart_kmf.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/quickstart_kmf.png -------------------------------------------------------------------------------- /docs/images/lls_regime_type.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/lls_regime_type.png -------------------------------------------------------------------------------- /docs/images/quickstart_multi.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/quickstart_multi.png -------------------------------------------------------------------------------- /docs/images/show_censors_plot.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/show_censors_plot.png -------------------------------------------------------------------------------- /docs/images/survival_weibull.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/survival_weibull.png -------------------------------------------------------------------------------- /reqs/travis-requirements.txt: -------------------------------------------------------------------------------- 1 | python-coveralls 2 | seaborn 3 | pytest-travis-fold 4 | dill 5 | -r dev-requirements.txt 6 | -------------------------------------------------------------------------------- /docs/images/lifelines_intro_lcd.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/lifelines_intro_lcd.png -------------------------------------------------------------------------------- /docs/images/quickstart_kmf_cdf.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/quickstart_kmf_cdf.png 
-------------------------------------------------------------------------------- /docs/images/weibull_aft_forest.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/weibull_aft_forest.png -------------------------------------------------------------------------------- /lifelines/version.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | from __future__ import unicode_literals 3 | 4 | __version__ = "0.21.0" 5 | -------------------------------------------------------------------------------- /docs/images/coxph_plot_quickstart.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/coxph_plot_quickstart.png -------------------------------------------------------------------------------- /docs/images/quickstart_predict_aaf.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/quickstart_predict_aaf.png -------------------------------------------------------------------------------- /docs/images/single_at_risk_plots.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/single_at_risk_plots.png -------------------------------------------------------------------------------- /docs/images/waft_plot_quickstart.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/waft_plot_quickstart.png -------------------------------------------------------------------------------- /docs/images/weibull_aft_two_models.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/weibull_aft_two_models.png -------------------------------------------------------------------------------- /docs/images/weibull_extrapolation.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/weibull_extrapolation.png -------------------------------------------------------------------------------- /docs/images/survival_regression_aaf.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/survival_regression_aaf.png -------------------------------------------------------------------------------- /reqs/base-requirements.txt: -------------------------------------------------------------------------------- 1 | numpy>=1.14.0 2 | scipy>=1.0 3 | pandas>=0.23.0 4 | matplotlib>=3.0 5 | bottleneck>=1.0 6 | autograd>=1.2 7 | -------------------------------------------------------------------------------- /docs/images/coxph_plot_covarite_groups.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/coxph_plot_covarite_groups.png -------------------------------------------------------------------------------- /docs/images/lifelines_intro_all_regimes.png: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/lifelines_intro_all_regimes.png -------------------------------------------------------------------------------- /docs/images/lifelines_intro_kmf_curve.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/lifelines_intro_kmf_curve.png -------------------------------------------------------------------------------- /docs/images/lifelines_intro_kmf_fitter.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/lifelines_intro_kmf_fitter.png -------------------------------------------------------------------------------- /docs/images/lifelines_intro_naf_fitter.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/lifelines_intro_naf_fitter.png -------------------------------------------------------------------------------- /docs/images/survival_regression_harper.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/survival_regression_harper.png -------------------------------------------------------------------------------- /docs/images/waltons_cumulative_hazard.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/waltons_cumulative_hazard.png -------------------------------------------------------------------------------- /docs/images/waltons_survival_function.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/waltons_survival_function.png -------------------------------------------------------------------------------- /reqs/docs-requirements.txt: -------------------------------------------------------------------------------- 1 | -r dev-requirements.txt 2 | sphinx 3 | sphinx_rtd_theme 4 | nbsphinx 5 | jupyter_client 6 | nbconvert!=5.4 7 | ipykernel -------------------------------------------------------------------------------- /docs/images/lifelines_intro_multi_kmf_fitter.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/lifelines_intro_multi_kmf_fitter.png -------------------------------------------------------------------------------- /docs/images/lifelines_intro_naf_fitter_multi.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/lifelines_intro_naf_fitter_multi.png -------------------------------------------------------------------------------- /docs/images/lifelines_intro_naf_smooth_multi.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/lifelines_intro_naf_smooth_multi.png -------------------------------------------------------------------------------- /docs/images/survival_regression_conditioning.png: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/survival_regression_conditioning.png -------------------------------------------------------------------------------- /docs/images/lifelines_intro_multi_kmf_fitter_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/lifelines_intro_multi_kmf_fitter_2.png -------------------------------------------------------------------------------- /docs/images/lifelines_intro_naf_smooth_multi_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/lifelines_intro_naf_smooth_multi_2.png -------------------------------------------------------------------------------- /docs/images/survival_analysis_intro_censoring.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/survival_analysis_intro_censoring.png -------------------------------------------------------------------------------- /docs/images/weibull_aft_two_models_side_by_side.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/weibull_aft_two_models_side_by_side.png -------------------------------------------------------------------------------- /lifelines/datasets/static_test.csv: -------------------------------------------------------------------------------- 1 | id,t,E,var1,var2 2 | 1,4,1,-1,-1 3 | 2,3,1,-2,-2 4 | 3,3,0,-3,-3 5 | 4,4,1,-4,-4 6 | 5,2,1,-5,-5 7 | 6,0,1,-6,-6 8 | 7,2,1,-7,-7 9 | -------------------------------------------------------------------------------- /docs/images/survival_analysis_intro_censoring_revealed.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/survival_analysis_intro_censoring_revealed.png -------------------------------------------------------------------------------- /docs/images/survival_regression_conditioning_with_median.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/canyon289/lifelines/master/docs/images/survival_regression_conditioning_with_median.png -------------------------------------------------------------------------------- /docs/lifelines.utils.rst: -------------------------------------------------------------------------------- 1 | lifelines.utils 2 | =============== 3 | 4 | .. automodule:: lifelines.utils 5 | :members: 6 | :undoc-members: 7 | :show-inheritance: 8 | -------------------------------------------------------------------------------- /docs/lifelines.datasets.rst: -------------------------------------------------------------------------------- 1 | lifelines.datasets 2 | ================== 3 | 4 | 5 | .. automodule:: lifelines.datasets 6 | :members: 7 | :undoc-members: 8 | :show-inheritance: 9 | -------------------------------------------------------------------------------- /docs/lifelines.plotting.rst: -------------------------------------------------------------------------------- 1 | lifelines.plotting 2 | ================== 3 | 4 | 5 | .. 
automodule:: lifelines.plotting 6 | :members: 7 | :undoc-members: 8 | :show-inheritance: 9 | -------------------------------------------------------------------------------- /docs/lifelines.statistics.rst: -------------------------------------------------------------------------------- 1 | lifelines.statistics 2 | ====================== 3 | 4 | 5 | .. automodule:: lifelines.statistics 6 | :members: 7 | :undoc-members: 8 | :show-inheritance: 9 | -------------------------------------------------------------------------------- /tests/__main__.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | import sys 3 | import pytest 4 | 5 | 6 | if __name__ == "__main__": 7 | # Exit with correct code 8 | sys.exit(pytest.main(["--pyargs", "lifelines.tests"] + sys.argv[1:])) 9 | -------------------------------------------------------------------------------- /lifelines/datasets/holly_molly_polly.tsv: -------------------------------------------------------------------------------- 1 | ID Status Stratum Start(days) Stop(days) tx T 2 | 0 M 1 1 0 100 1 100 3 | 1 M 1 2 100 105 1 5 4 | 2 H 1 1 0 30 0 30 5 | 3 H 1 2 30 50 0 20 6 | 4 P 1 1 0 20 0 20 7 | 5 P 1 2 20 60 0 40 8 | 6 P 1 3 60 85 0 25 9 | -------------------------------------------------------------------------------- /MANIFEST.in: -------------------------------------------------------------------------------- 1 | include README.md 2 | include LICENSE 3 | include MANIFEST.in 4 | 5 | include *.ipynb 6 | 7 | recursive-include lifelines * 8 | recursive-include datasets * 9 | recursive-include styles * 10 | 11 | recursive-exclude * *.py[co] 12 | -------------------------------------------------------------------------------- /docs/References.rst: -------------------------------------------------------------------------------- 1 | Reference library for *lifelines* 2 | ================================== 3 | 4 | .. toctree:: 5 | 6 | lifelines.fitters 7 | lifelines.utils 8 | lifelines.statistics 9 | lifelines.plotting 10 | lifelines.datasets 11 | -------------------------------------------------------------------------------- /reqs/dev-requirements.txt: -------------------------------------------------------------------------------- 1 | -r base-requirements.txt 2 | # installs lifelines as editable dependency in develop mode 3 | -e . 4 | pytest>=3.6 5 | pytest-icdiff;python_version > '3.5' 6 | coverage>=4.4 7 | pytest-cov 8 | pypandoc 9 | prospector[with_pyroma] 10 | pre-commit 11 | black;python_version > '3.5' 12 | dill 13 | statsmodels 14 | flaky 15 | -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- 1 | *.pyc 2 | *.so 3 | build 4 | dist 5 | *.egg-info 6 | *.iml 7 | 8 | # IDE files 9 | \.vscode/ 10 | 11 | # testing artifacts 12 | \.coverage 13 | \.pytest_cache/ 14 | 15 | # pipenv files 16 | Pipfile 17 | Pipfile.lock 18 | 19 | # Pyenv 20 | .python-version 21 | 22 | # Jupyter 23 | .ipynb_checkpoints 24 | 25 | # docs artifacts 26 | docs/_build/ 27 | 28 | # asv builds 29 | \.asv/ 30 | -------------------------------------------------------------------------------- /examples/README.md: -------------------------------------------------------------------------------- 1 | ### Examples 2 | 3 | In this folder are some examples of lifelines usage, some with and some without comments and context. You can see some common patterns using lifelines and survival analysis. 
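To give a flavour of those patterns before opening the scripts, here is a minimal sketch (not taken from any one example file) that fits and plots a Kaplan-Meier curve on the bundled Waltons dataset; the examples in this folder build on this kind of workflow:

```python
from lifelines import KaplanMeierFitter
from lifelines.datasets import load_waltons

df = load_waltons()                       # columns: T (duration), E (event observed), group
kmf = KaplanMeierFitter()
kmf.fit(df["T"], event_observed=df["E"])

kmf.survival_function_                    # DataFrame with the estimated survival function
kmf.plot()                                # survival curve with confidence intervals
```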
4 | 5 | 6 | #### Other examples 7 | 8 | - [nice tutorial to lifelines and survival analysis](https://github.com/chrisluedtke/data-science-journal/blob/master/07-Advanced-Regression/02_Survival_Analysis.ipynb) 9 | -------------------------------------------------------------------------------- /lifelines/datasets/psychiatric_patients.csv: -------------------------------------------------------------------------------- 1 | Age,T,C,sex 2 | 51,1,1,2 3 | 58,1,1,2 4 | 55,2,1,2 5 | 28,22,1,2 6 | 21,30,0,1 7 | 19,28,1,1 8 | 25,32,1,2 9 | 48,11,1,2 10 | 47,14,1,2 11 | 25,36,0,2 12 | 31,31,0,2 13 | 24,33,0,1 14 | 25,33,0,1 15 | 30,37,0,2 16 | 33,35,0,2 17 | 36,25,1,1 18 | 30,31,0,1 19 | 41,22,1,1 20 | 43,26,1,2 21 | 45,24,1,2 22 | 35,35,0,2 23 | 29,34,0,1 24 | 35,30,0,1 25 | 32,35,1,1 26 | 36,40,1,2 27 | 32,39,0,1 28 | -------------------------------------------------------------------------------- /lifelines/datasets/panel_test.csv: -------------------------------------------------------------------------------- 1 | id,t,E,var1,var2 2 | 1,1,0,0,1 3 | 1,2,0,0,1 4 | 1,3,0,4,3 5 | 1,4,1,8,4 6 | 2,1,0,1.2,1 7 | 2,2,0,1.2,2 8 | 2,3,0,1.2,2 9 | 3,1,0,0,1 10 | 3,2,1,1,2 11 | 4,1,0,0,1 12 | 4,2,0,1,2 13 | 4,3,0,1,3 14 | 4,4,0,2,4 15 | 4,5,1,2,5 16 | 5,1,0,1,-1 17 | 5,2,0,2,-1 18 | 5,3,0,3,-1 19 | 6,1,1,3,0 20 | 7,1,0,1,0 21 | 7,2,0,2,1 22 | 7,3,0,3,0 23 | 7,4,0,3,1 24 | 7,5,0,3,0 25 | 7,6,1,3,1 26 | 8,1,0,-1,0 27 | 8,2,1,1,0 28 | 9,1,0,1,1 29 | 9,2,0,2,2 30 | -------------------------------------------------------------------------------- /.pre-commit-config.yaml: -------------------------------------------------------------------------------- 1 | repos: 2 | - repo: https://github.com/pre-commit/pre-commit-hooks 3 | rev: v2.0.0 4 | hooks: 5 | - id: trailing-whitespace 6 | - id: check-ast 7 | - id: check-yaml 8 | - id: end-of-file-fixer 9 | - id: fix-encoding-pragma 10 | - id: mixed-line-ending 11 | - id: trailing-whitespace 12 | - repo: https://github.com/ambv/black 13 | rev: stable 14 | hooks: 15 | - id: black 16 | args: ["--line-length", "120"] 17 | -------------------------------------------------------------------------------- /lifelines/datasets/gehan.dat: -------------------------------------------------------------------------------- 1 | 2 6 1 2 | 2 6 1 3 | 2 6 1 4 | 2 6 0 5 | 2 7 1 6 | 2 9 0 7 | 2 10 1 8 | 2 10 0 9 | 2 11 0 10 | 2 13 1 11 | 2 16 1 12 | 2 17 0 13 | 2 19 0 14 | 2 20 0 15 | 2 22 1 16 | 2 23 1 17 | 2 25 0 18 | 2 32 0 19 | 2 32 0 20 | 2 34 0 21 | 2 35 0 22 | 1 1 1 23 | 1 1 1 24 | 1 2 1 25 | 1 2 1 26 | 1 3 1 27 | 1 4 1 28 | 1 4 1 29 | 1 5 1 30 | 1 5 1 31 | 1 8 1 32 | 1 8 1 33 | 1 8 1 34 | 1 8 1 35 | 1 11 1 36 | 1 11 1 37 | 1 12 1 38 | 1 12 1 39 | 1 15 1 40 | 1 17 1 41 | 1 22 1 42 | 1 23 1 43 | -------------------------------------------------------------------------------- /tests/conftest.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | import numpy as np 3 | import pytest 4 | 5 | 6 | def pytest_runtest_setup(item): 7 | random_seed = np.random.randint(1000) 8 | print("Seed used in np.random.seed(): %d" % random_seed) 9 | np.random.seed(random_seed) 10 | 11 | 12 | def pytest_addoption(parser): 13 | parser.addoption("--block", action="store", default=True, help="Should plotting block or not.") 14 | 15 | 16 | @pytest.fixture 17 | def block(request): 18 | try: 19 | return request.config.getoption("--block") not in "False,false,no,0".split(",") 20 | except ValueError: 21 | return True 22 | 
-------------------------------------------------------------------------------- /lifelines/datasets/g3.csv: -------------------------------------------------------------------------------- 1 | no.,age,sex,histology,group,event,time 2 | 1,41,Female,Grade3,RIT,True,53 3 | 2,45,Female,Grade3,RIT,False,28 4 | 3,48,Male,Grade3,RIT,False,69 5 | 4,54,Male,Grade3,RIT,False,58 6 | 5,40,Female,Grade3,RIT,False,54 7 | 6,31,Male,Grade3,RIT,True,25 8 | 7,53,Male,Grade3,RIT,False,51 9 | 8,49,Male,Grade3,RIT,False,61 10 | 9,36,Male,Grade3,RIT,False,57 11 | 10,52,Male,Grade3,RIT,False,57 12 | 11,57,Male,Grade3,RIT,False,50 13 | 1,27,Male,Grade3,Control,True,34 14 | 2,32,Male,Grade3,Control,True,32 15 | 3,53,Female,Grade3,Control,True,9 16 | 4,46,Male,Grade3,Control,True,19 17 | 5,33,Female,Grade3,Control,False,50 18 | 6,19,Female,Grade3,Control,False,48 19 | -------------------------------------------------------------------------------- /perf_tests/aaf_perf_test.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | # aalen additive 3 | 4 | 5 | if __name__ == "__main__": 6 | import pandas as pd 7 | import numpy as np 8 | import time 9 | 10 | from lifelines.fitters.aalen_additive_fitter import AalenAdditiveFitter 11 | from lifelines.datasets import load_rossi 12 | 13 | df = load_rossi() 14 | df = pd.concat([df] * 1) 15 | # df['week'] = np.random.exponential(size=df.shape[0]) 16 | aaf = AalenAdditiveFitter() 17 | start_time = time.time() 18 | aaf.fit(df, duration_col="week", event_col="arrest") 19 | print("--- %s seconds ---" % (time.time() - start_time)) 20 | aaf.print_summary(5) 21 | -------------------------------------------------------------------------------- /perf_tests/cp_perf_test.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | # cox regression 3 | 4 | 5 | if __name__ == "__main__": 6 | import pandas as pd 7 | import time 8 | import numpy as np 9 | 10 | from lifelines import CoxPHFitter 11 | from lifelines.datasets import load_rossi 12 | 13 | df = load_rossi() 14 | df = pd.concat([df] * 16) 15 | # df = df.reset_index() 16 | # df['week'] = np.random.exponential(1, size=df.shape[0]) 17 | cp = CoxPHFitter() 18 | start_time = time.time() 19 | cp.fit(df, duration_col="week", event_col="arrest", batch_mode=True) 20 | print("--- %s seconds ---" % (time.time() - start_time)) 21 | cp.print_summary() 22 | -------------------------------------------------------------------------------- /perf_tests/lognormal_perf_test.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | # aalen additive 3 | 4 | 5 | if __name__ == "__main__": 6 | import pandas as pd 7 | import numpy as np 8 | import time 9 | 10 | from lifelines import LogNormalFitter 11 | 12 | np.random.seed(1) 13 | N = 250000 14 | mu = 3 * np.random.randn() 15 | sigma = np.random.uniform(0.1, 3.0) 16 | 17 | X, C = np.exp(sigma * np.random.randn(N) + mu), np.exp(np.random.randn(N) + mu) 18 | E = X <= C 19 | T = np.minimum(X, C) 20 | 21 | lnf = LogNormalFitter() 22 | start_time = time.time() 23 | lnf.fit(T, E) 24 | print("--- %s seconds ---" % (time.time() - start_time)) 25 | lnf.print_summary(5) 26 | -------------------------------------------------------------------------------- /perf_tests/ctv_perf_test.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | if __name__ == "__main__": 3 | import time 4 | 
import pandas as pd 5 | from lifelines import CoxTimeVaryingFitter 6 | from lifelines.datasets import load_rossi 7 | from lifelines.utils import to_long_format 8 | 9 | df = load_rossi() 10 | df = pd.concat([df] * 20) 11 | df = df.reset_index() 12 | df = to_long_format(df, duration_col="week") 13 | ctv = CoxTimeVaryingFitter() 14 | start_time = time.time() 15 | ctv.fit(df, id_col="index", event_col="arrest", start_col="start", stop_col="stop") 16 | time_took = time.time() - start_time 17 | print("--- %s seconds ---" % time_took) 18 | ctv.print_summary() 19 | -------------------------------------------------------------------------------- /Makefile: -------------------------------------------------------------------------------- 1 | init: 2 | ifeq ($(TRAVIS), true) 3 | pip install -r reqs/travis-requirements.txt 4 | pip install pandas==${PANDAS_VERSION} 5 | pip list --local 6 | else 7 | pip install -r reqs/dev-requirements.txt 8 | pre-commit install 9 | endif 10 | 11 | test: 12 | py.test -rfs --cov=lifelines --block=False --cov-report term-missing 13 | 14 | lint: 15 | ifeq ($(TRAVIS_PYTHON_VERSION), 2.7) 16 | echo "Skip linting for Python2.7" 17 | else 18 | black lifelines/ -l 120 --fast 19 | black tests/ -l 120 --fast 20 | prospector --output-format grouped 21 | endif 22 | 23 | check_format: 24 | ifeq ($(TRAVIS_PYTHON_VERSION), 3.6) 25 | black . --check --line-length 120 26 | else 27 | echo "Only check format on Python3.6" 28 | endif 29 | 30 | pre: 31 | pre-commit run --all-files 32 | -------------------------------------------------------------------------------- /lifelines/datasets/anderson.csv: -------------------------------------------------------------------------------- 1 | t status sex logWBC Rx 2 | 35 0 1 1.45 0 3 | 34 0 1 1.47 0 4 | 32 0 1 2.2 0 5 | 32 0 1 2.53 0 6 | 25 0 1 1.78 0 7 | 23 1 1 2.57 0 8 | 22 1 1 2.32 0 9 | 20 0 1 2.01 0 10 | 19 0 0 2.05 0 11 | 17 0 0 2.16 0 12 | 16 1 1 3.6 0 13 | 13 1 0 2.88 0 14 | 11 0 0 2.6 0 15 | 10 0 0 2.7 0 16 | 10 1 0 2.96 0 17 | 9 0 0 2.8 0 18 | 7 1 0 4.43 0 19 | 6 0 0 3.2 0 20 | 6 1 0 2.31 0 21 | 6 1 1 4.06 0 22 | 6 1 0 3.28 0 23 | 23 1 1 1.97 1 24 | 22 1 0 2.73 1 25 | 17 1 0 2.95 1 26 | 15 1 0 2.3 1 27 | 12 1 0 1.5 1 28 | 12 1 0 3.06 1 29 | 11 1 0 3.49 1 30 | 11 1 0 2.12 1 31 | 8 1 0 3.52 1 32 | 8 1 0 3.05 1 33 | 8 1 0 2.32 1 34 | 8 1 1 3.26 1 35 | 5 1 1 3.49 1 36 | 5 1 0 3.97 1 37 | 4 1 1 4.36 1 38 | 4 1 1 2.42 1 39 | 3 1 1 4.01 1 40 | 2 1 1 4.91 1 41 | 2 1 1 4.48 1 42 | 1 1 1 2.8 1 43 | 1 1 1 5 1 44 | -------------------------------------------------------------------------------- /.travis.yml: -------------------------------------------------------------------------------- 1 | language: python 2 | cache: pip 3 | dist: trusty 4 | python: 5 | - "3.5" 6 | - "3.6" 7 | env: 8 | - export PANDAS_VERSION=0.23.4 9 | - export PANDAS_VERSION=0.24.1 10 | # Enable newer 3.7 without globally enabling sudo and dist: xenial for other build jobs 11 | matrix: 12 | include: 13 | - python: 3.7 14 | dist: xenial 15 | sudo: true 16 | env: export PANDAS_VERSION=0.24.1 17 | - python: 3.7 18 | dist: xenial 19 | sudo: true 20 | env: export PANDAS_VERSION=0.23.4 21 | before_install: 22 | - ls 23 | # - sudo apt-get update 24 | install: "make" 25 | script: 26 | # enforce formatting 27 | - make check_format 28 | # command to run tests 29 | - make test 30 | after_success: 31 | - coveralls 32 | # Don't want notifications 33 | notifications: 34 | email: false 35 | -------------------------------------------------------------------------------- 
/perf_tests/weibull_aft_perf.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | # weibull aft 3 | 4 | 5 | if __name__ == "__main__": 6 | import pandas as pd 7 | import time 8 | import numpy as np 9 | 10 | from lifelines import WeibullAFTFitter 11 | from lifelines.datasets import load_rossi 12 | 13 | df = load_rossi() 14 | df = pd.concat([df] * 1) 15 | 16 | df["start"] = df["week"] 17 | df["stop"] = np.where(df["arrest"], df["start"], np.inf) 18 | df = df.drop("week", axis=1) 19 | 20 | wp = WeibullAFTFitter() 21 | start_time = time.time() 22 | print(df.head()) 23 | wp.fit_interval_censoring(df, start_col="start", stop_col="stop", event_col="arrest") 24 | print("--- %s seconds ---" % (time.time() - start_time)) 25 | wp.print_summary() 26 | 27 | wp.fit_right_censoring(load_rossi(), "week", event_col="arrest") 28 | wp.print_summary() 29 | -------------------------------------------------------------------------------- /perf_tests/weibull_perf_test.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | 3 | if __name__ == "__main__": 4 | import pandas as pd 5 | import numpy as np 6 | import time 7 | 8 | from lifelines import WeibullFitter 9 | 10 | data = ( 11 | [{"start": 0, "stop": 2, "E": False}] * (1000 - 376) 12 | + [{"start": 2, "stop": 5, "E": False}] * (376 - 82) 13 | + [{"start": 5, "stop": 10, "E": False}] * (82 - 7) 14 | + [{"start": 10, "stop": 1e10, "E": False}] * 7 15 | ) 16 | 17 | df = pd.DataFrame.from_records(data) 18 | print(df) 19 | 20 | df = df.groupby(["start", "stop", "E"]).size().reset_index() 21 | print(df) 22 | 23 | wb = WeibullFitter() 24 | start_time = time.time() 25 | wb.fit_interval_censoring(df["start"], df["stop"], df["E"], weights=df[0]) 26 | print("--- %s seconds ---" % (time.time() - start_time)) 27 | wb.print_summary(5) 28 | -------------------------------------------------------------------------------- /lifelines/utils/logsf.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | 3 | from scipy.stats import norm as _scipy_norm 4 | import autograd.numpy as np 5 | from autograd.scipy.stats import norm 6 | from autograd.extend import primitive, defvjp 7 | from autograd.numpy.numpy_vjps import unbroadcast_f 8 | 9 | # TODO: next release of autograd will have this built in. 
10 | 11 | logsf = primitive(_scipy_norm.logsf) 12 | 13 | defvjp( 14 | logsf, 15 | lambda ans, x, loc=0.0, scale=1.0: unbroadcast_f( 16 | x, lambda g: -g * np.exp(norm.logpdf(x, loc, scale) - logsf(x, loc, scale)) 17 | ), 18 | lambda ans, x, loc=0.0, scale=1.0: unbroadcast_f( 19 | loc, lambda g: g * np.exp(norm.logpdf(x, loc, scale) - logsf(x, loc, scale)) 20 | ), 21 | lambda ans, x, loc=0.0, scale=1.0: unbroadcast_f( 22 | scale, lambda g: g * np.exp(norm.logpdf(x, loc, scale) - logsf(x, loc, scale)) * (x - loc) / scale 23 | ), 24 | ) 25 | -------------------------------------------------------------------------------- /experiments/aalen_and_cook_simulation.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | import numpy as np 3 | from scipy.stats import weibull_min 4 | import pandas as pd 5 | from lifelines import WeibullAFTFitter, CoxPHFitter 6 | 7 | # This is an implementation of https://uwspace.uwaterloo.ca/bitstream/handle/10012/10265/Cook_Richard-10265.pdf 8 | 9 | N = 50000 10 | p = 0.5 11 | bX = np.log(0.5) 12 | bZ = np.log(4) 13 | 14 | Z = np.random.binomial(1, p, size=N) 15 | X = np.random.binomial(1, 0.5, size=N) 16 | X_ = 20000 + 10 * np.random.randn(N) 17 | 18 | W = weibull_min.rvs(1, scale=1, loc=0, size=N) 19 | 20 | Y = bX * X + bZ * Z + np.log(W) 21 | T = np.exp(Y) 22 | 23 | ####################################### 24 | 25 | df = pd.DataFrame({"T": T, "x": X, "x_": X_}) 26 | 27 | 28 | wf = WeibullAFTFitter().fit(df, "T") 29 | wf.print_summary(4) 30 | 31 | 32 | cph = CoxPHFitter().fit(df, "T", show_progress=True, step_size=1.0) 33 | cph.print_summary(4) 34 | -------------------------------------------------------------------------------- /lifelines/datasets/lymphoma.csv: -------------------------------------------------------------------------------- 1 | Stage_group,Time,Censor 2 | 1,6,1 3 | 1,19,1 4 | 1,32,1 5 | 1,42,1 6 | 1,42,1 7 | 1,43,0 8 | 1,94,1 9 | 1,126,0 10 | 1,169,0 11 | 1,207,1 12 | 1,211,0 13 | 1,227,0 14 | 1,253,1 15 | 1,255,0 16 | 1,270,0 17 | 1,310,0 18 | 1,316,0 19 | 1,335,0 20 | 1,346,0 21 | 2,4,1 22 | 2,6,1 23 | 2,10,1 24 | 2,11,1 25 | 2,11,1 26 | 2,11,1 27 | 2,13,1 28 | 2,17,1 29 | 2,20,1 30 | 2,20,1 31 | 2,21,1 32 | 2,22,1 33 | 2,24,1 34 | 2,24,1 35 | 2,29,1 36 | 2,30,1 37 | 2,30,1 38 | 2,31,1 39 | 2,33,1 40 | 2,34,1 41 | 2,35,1 42 | 2,39,1 43 | 2,40,1 44 | 2,41,0 45 | 2,43,0 46 | 2,45,1 47 | 2,46,1 48 | 2,50,1 49 | 2,56,1 50 | 2,61,0 51 | 2,61,0 52 | 2,63,1 53 | 2,68,1 54 | 2,82,1 55 | 2,85,1 56 | 2,88,1 57 | 2,89,1 58 | 2,90,1 59 | 2,93,1 60 | 2,104,1 61 | 2,110,1 62 | 2,134,1 63 | 2,137,1 64 | 2,160,0 65 | 2,169,1 66 | 2,171,1 67 | 2,173,1 68 | 2,175,1 69 | 2,184,1 70 | 2,201,1 71 | 2,222,1 72 | 2,235,0 73 | 2,247,0 74 | 2,260,0 75 | 2,284,0 76 | 2,290,0 77 | 2,291,0 78 | 2,302,0 79 | 2,304,0 80 | 2,341,0 81 | 2,345,0 82 | -------------------------------------------------------------------------------- /.prospector.yaml: -------------------------------------------------------------------------------- 1 | strictness: medium 2 | 3 | pylint: 4 | options: 5 | bad-names: foo,baz,toto,tutu,tata,data 6 | # max-args default = 5 7 | max-args: 15 8 | # max-locals default = 15 9 | max-locals: 50 10 | # max-branches default = 15 11 | max-branches: 16 12 | disable: 13 | - line-too-long 14 | - protected-access 15 | - no-value-for-parameter 16 | - assignment-from-no-return 17 | - invalid-unary-operand-type 18 | # remove if python2.7 support is dropped 19 | - useless-object-inheritance 20 | - 
old-style-class 21 | 22 | pyflakes: 23 | disable: 24 | - F401 25 | - F841 26 | # let pylint used-before-assignment handle this 27 | - F821 28 | 29 | pep8: 30 | options: 31 | max-line-length: 120 32 | disable: 33 | - E501 34 | - E241 35 | 36 | mccabe: 37 | options: 38 | # max-complexity default = 10 39 | max-complexity: 23 40 | 41 | pyroma: 42 | run: true 43 | 44 | pep257: 45 | run: false 46 | 47 | ignore-paths: 48 | - build 49 | - benchmarks 50 | -------------------------------------------------------------------------------- /tests/utils/test_btree.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | from __future__ import print_function 3 | 4 | import pytest 5 | import numpy as np 6 | 7 | from lifelines.utils.btree import _BTree as BTree 8 | 9 | 10 | def test_btree(): 11 | t = BTree(np.arange(10)) 12 | for i in range(10): 13 | assert t.rank(i) == (0, 0) 14 | 15 | assert len(t) == 0 16 | t.insert(5) 17 | t.insert(6) 18 | t.insert(6) 19 | t.insert(0) 20 | t.insert(9) 21 | assert len(t) == 5 22 | 23 | assert t.rank(0) == (0, 1) 24 | assert t.rank(0.5) == (1, 0) 25 | assert t.rank(4.5) == (1, 0) 26 | assert t.rank(5) == (1, 1) 27 | assert t.rank(5.5) == (2, 0) 28 | assert t.rank(6) == (2, 2) 29 | assert t.rank(6.5) == (4, 0) 30 | assert t.rank(8.5) == (4, 0) 31 | assert t.rank(9) == (4, 1) 32 | assert t.rank(9.5) == (5, 0) 33 | 34 | for i in range(1, 32): 35 | BTree(np.arange(i)) 36 | 37 | with pytest.raises(ValueError): 38 | # This has to go last since it screws up the counts 39 | t.insert(5.5) 40 | -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- 1 | MIT License 2 | 3 | Copyright (c) 2017 Cameron Davidson-Pilon 4 | 5 | Permission is hereby granted, free of charge, to any person obtaining a copy 6 | of this software and associated documentation files (the "Software"), to deal 7 | in the Software without restriction, including without limitation the rights 8 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 9 | copies of the Software, and to permit persons to whom the Software is 10 | furnished to do so, subject to the following conditions: 11 | 12 | The above copyright notice and this permission notice shall be included in all 13 | copies or substantial portions of the Software. 14 | 15 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 16 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 17 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 18 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 19 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 20 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 21 | SOFTWARE. 
22 | -------------------------------------------------------------------------------- /tests/test_generate_datasets.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | import os 3 | 4 | import pytest 5 | import matplotlib.pyplot as plt 6 | 7 | from lifelines import NelsonAalenFitter, KaplanMeierFitter 8 | from lifelines.generate_datasets import exponential_survival_data 9 | 10 | 11 | def test_exponential_data_sets_correct_censor(): 12 | N = 20000 13 | censorship = 0.2 14 | T, C = exponential_survival_data(N, censorship, scale=10) 15 | assert abs(C.mean() - (1 - censorship)) < 0.02 16 | 17 | 18 | @pytest.mark.skipif("DISPLAY" not in os.environ, reason="requires display") 19 | def test_exponential_data_sets_fit(): 20 | N = 20000 21 | T, C = exponential_survival_data(N, 0.2, scale=10) 22 | naf = NelsonAalenFitter() 23 | naf.fit(T, C).plot() 24 | plt.title("Should be a linear with slope = 0.1") 25 | 26 | 27 | @pytest.mark.skipif("DISPLAY" not in os.environ, reason="requires display") 28 | def test_kmf_minimum_observation_bias(): 29 | N = 250 30 | kmf = KaplanMeierFitter() 31 | T, C = exponential_survival_data(N, 0.1, scale=10) 32 | B = 0.01 * T 33 | kmf.fit(T, C, entry=B) 34 | kmf.plot() 35 | plt.title("Should have larger variances in the tails") 36 | -------------------------------------------------------------------------------- /experiments/detection_limits.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | """ 3 | Experimenting with some data generation and inference for left censorship with one or more 4 | minimum detectable limits. 5 | 6 | Recall that MLE bias is equal to 0 up to the order 1/sqrt(n), so we expect that for 7 | small n, we will see a bias. 
8 | 9 | """ 10 | import numpy as np 11 | from lifelines import WeibullFitter 12 | 13 | 14 | def one_detection_limit(N, fraction_below_limit): 15 | 16 | T_actual = 0.5 * np.random.weibull(1, size=N) 17 | 18 | MIN_1 = np.percentile(T_actual, fraction_below_limit) 19 | 20 | T = np.maximum(MIN_1, T_actual) 21 | E = T_actual > MIN_1 22 | 23 | wf = WeibullFitter().fit(T, E, left_censorship=True) 24 | return wf 25 | 26 | 27 | def three_detection_limit(N): 28 | 29 | T_actual = 0.5 * np.random.weibull(5, size=N) 30 | 31 | MIN_0 = np.percentile(T_actual, 5) 32 | MIN_1 = np.percentile(T_actual, 10) 33 | MIN_2 = np.percentile(T_actual, 30) 34 | MIN_3 = np.percentile(T_actual, 50) 35 | 36 | T = T_actual.copy() 37 | ix = np.random.randint(4, size=N) 38 | 39 | T = np.where(ix == 0, np.maximum(T, MIN_0), T) 40 | T = np.where(ix == 1, np.maximum(T, MIN_1), T) 41 | T = np.where(ix == 2, np.maximum(T, MIN_2), T) 42 | T = np.where(ix == 3, np.maximum(T, MIN_3), T) 43 | E = T_actual == T 44 | 45 | wf = WeibullFitter().fit(T, E, left_censorship=True) 46 | return wf 47 | 48 | 49 | # biased 50 | np.mean([three_detection_limit(50).rho_ for _ in range(1000)]) 51 | 52 | 53 | # less biased 54 | np.mean([three_detection_limit(500).rho_ for _ in range(1000)]) 55 | -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | import os 3 | 4 | from setuptools import setup, find_packages 5 | 6 | 7 | def filepath(fname): 8 | return os.path.join(os.path.dirname(__file__), fname) 9 | 10 | 11 | exec(compile(open("lifelines/version.py").read(), "lifelines/version.py", "exec")) 12 | 13 | with open("README.md") as f: 14 | long_description = f.read() 15 | 16 | setup( 17 | name="lifelines", 18 | version=__version__, 19 | author="Cameron Davidson-Pilon", 20 | author_email="cam.davidson.pilon@gmail.com", 21 | description="Survival analysis in Python, including Kaplan Meier, Nelson Aalen and regression", 22 | license="MIT", 23 | keywords="survival analysis statistics data analysis", 24 | url="https://github.com/CamDavidsonPilon/lifelines", 25 | packages=find_packages(), 26 | python_requires=">=3.5", 27 | long_description=long_description, 28 | long_description_content_type="text/markdown", 29 | classifiers=[ 30 | "Development Status :: 4 - Beta", 31 | "License :: OSI Approved :: MIT License", 32 | "Programming Language :: Python", 33 | "Programming Language :: Python :: 3.5", 34 | "Programming Language :: Python :: 3.6", 35 | "Programming Language :: Python :: 3.7", 36 | "Topic :: Scientific/Engineering", 37 | ], 38 | install_requires=[ 39 | "numpy>=1.6.0", 40 | "scipy>=1.0", 41 | "pandas>=0.23.0", 42 | "matplotlib>=3.0", 43 | "bottleneck>=1.0", 44 | "autograd>=1.2", 45 | ], 46 | package_data={"lifelines": ["../README.md", "../README.txt", "../LICENSE", "../MANIFEST.in", "datasets/*"]}, 47 | ) 48 | -------------------------------------------------------------------------------- /experiments/left_censoring_experiments.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | import numpy as np 3 | import scipy 4 | from matplotlib import pyplot as plt 5 | from lifelines import WeibullFitter, KaplanMeierFitter, LogNormalFitter, LogLogisticFitter 6 | from lifelines.plotting import left_censorship_cdf_plot, qq_plot 7 | 8 | plt.style.use("bmh") 9 | 10 | 11 | N = 2500 12 | 13 | T_actual = scipy.stats.fisk(8, 0, 1).rvs(N) 14 | 15 | MIN_0 = 
np.percentile(T_actual, 5) 16 | MIN_1 = np.percentile(T_actual, 10) 17 | MIN_2 = np.percentile(T_actual, 30) 18 | MIN_3 = np.percentile(T_actual, 50) 19 | 20 | T = T_actual.copy() 21 | ix = np.random.randint(4, size=N) 22 | 23 | T = np.where(ix == 0, np.maximum(T, MIN_0), T) 24 | T = np.where(ix == 1, np.maximum(T, MIN_1), T) 25 | T = np.where(ix == 2, np.maximum(T, MIN_2), T) 26 | T = np.where(ix == 3, np.maximum(T, MIN_3), T) 27 | E = T_actual == T 28 | 29 | fig, axes = plt.subplots(2, 2, figsize=(9, 5)) 30 | axes = axes.reshape(4) 31 | 32 | for i, model in enumerate([WeibullFitter(), KaplanMeierFitter(), LogNormalFitter(), LogLogisticFitter()]): 33 | if isinstance(model, KaplanMeierFitter): 34 | model.fit(T, E, left_censorship=True, label=model.__class__.__name__) 35 | else: 36 | model.fit(T, E, left_censorship=True, label=model.__class__.__name__) 37 | 38 | model.plot_cumulative_density(ax=axes[i]) 39 | plt.tight_layout() 40 | 41 | for i, model in enumerate([WeibullFitter(), LogNormalFitter(), LogLogisticFitter()]): 42 | model.fit(T, E, left_censorship=True) 43 | fig, axes = plt.subplots(2, 1, figsize=(8, 6)) 44 | 45 | left_censorship_cdf_plot(model, ax=axes[0]) 46 | qq_plot(model, ax=axes[1]) 47 | 48 | 49 | plt.show() 50 | -------------------------------------------------------------------------------- /lifelines/__init__.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | # pylint: skip-file 3 | 4 | from lifelines.fitters.weibull_fitter import WeibullFitter 5 | from lifelines.fitters.exponential_fitter import ExponentialFitter 6 | from lifelines.fitters.nelson_aalen_fitter import NelsonAalenFitter 7 | from lifelines.fitters.kaplan_meier_fitter import KaplanMeierFitter 8 | from lifelines.fitters.breslow_fleming_harrington_fitter import BreslowFlemingHarringtonFitter 9 | from lifelines.fitters.coxph_fitter import CoxPHFitter 10 | from lifelines.fitters.cox_time_varying_fitter import CoxTimeVaryingFitter 11 | from lifelines.fitters.aalen_additive_fitter import AalenAdditiveFitter 12 | from lifelines.fitters.aalen_johansen_fitter import AalenJohansenFitter 13 | from lifelines.fitters.log_normal_fitter import LogNormalFitter 14 | from lifelines.fitters.log_logistic_fitter import LogLogisticFitter 15 | from lifelines.fitters.piecewise_exponential_fitter import PiecewiseExponentialFitter 16 | from lifelines.fitters.weibull_aft_fitter import WeibullAFTFitter 17 | from lifelines.fitters.log_logistic_aft_fitter import LogLogisticAFTFitter 18 | from lifelines.fitters.log_normal_aft_fitter import LogNormalAFTFitter 19 | 20 | 21 | from lifelines.version import __version__ 22 | 23 | __all__ = [ 24 | "__version__", 25 | "KaplanMeierFitter", 26 | "NelsonAalenFitter", 27 | "AalenAdditiveFitter", 28 | "BreslowFlemingHarringtonFitter", 29 | "CoxPHFitter", 30 | "WeibullFitter", 31 | "ExponentialFitter", 32 | "CoxTimeVaryingFitter", 33 | "AalenJohansenFitter", 34 | "LogNormalFitter", 35 | "LogLogisticFitter", 36 | "WeibullAFTFitter", 37 | "LogLogisticAFTFitter", 38 | "LogNormalAFTFitter", 39 | "PiecewiseExponentialFitter", 40 | ] 41 | -------------------------------------------------------------------------------- /lifelines/datasets/larynx.csv: -------------------------------------------------------------------------------- 1 | time,age,death,Stage II,Stage III,Stage IV 2 | 0.6,77,1,0,0,0 3 | 1.3,53,1,0,0,0 4 | 2.4,45,1,0,0,0 5 | 2.5,57,0,0,0,0 6 | 3.2,58,1,0,0,0 7 | 3.2,51,0,0,0,0 8 | 3.3,76,1,0,0,0 9 | 3.3,63,0,0,0,0 10 | 3.5,43,1,0,0,0 
11 | 3.5,60,1,0,0,0 12 | 4.0,52,1,0,0,0 13 | 4.0,63,1,0,0,0 14 | 4.3,86,1,0,0,0 15 | 4.5,48,0,0,0,0 16 | 4.5,68,0,0,0,0 17 | 5.3,81,1,0,0,0 18 | 5.5,70,0,0,0,0 19 | 5.9,58,0,0,0,0 20 | 5.9,47,0,0,0,0 21 | 6.0,75,1,0,0,0 22 | 6.1,77,0,0,0,0 23 | 6.2,64,0,0,0,0 24 | 6.4,77,1,0,0,0 25 | 6.5,67,1,0,0,0 26 | 6.5,79,0,0,0,0 27 | 6.7,61,0,0,0,0 28 | 7.0,66,0,0,0,0 29 | 7.4,68,1,0,0,0 30 | 7.4,73,0,0,0,0 31 | 8.1,56,0,0,0,0 32 | 8.1,73,0,0,0,0 33 | 9.6,58,0,0,0,0 34 | 10.7,68,0,0,0,0 35 | 0.2,86,1,1,0,0 36 | 1.8,64,1,1,0,0 37 | 2.0,63,1,1,0,0 38 | 2.2,71,0,1,0,0 39 | 2.6,67,0,1,0,0 40 | 3.3,51,0,1,0,0 41 | 3.6,70,1,1,0,0 42 | 3.6,72,0,1,0,0 43 | 4.0,81,1,1,0,0 44 | 4.3,47,0,1,0,0 45 | 4.3,64,0,1,0,0 46 | 5.0,66,0,1,0,0 47 | 6.2,74,1,1,0,0 48 | 7.0,62,1,1,0,0 49 | 7.5,50,0,1,0,0 50 | 7.6,53,0,1,0,0 51 | 9.3,61,0,1,0,0 52 | 0.3,49,1,0,1,0 53 | 0.3,71,1,0,1,0 54 | 0.5,57,1,0,1,0 55 | 0.7,79,1,0,1,0 56 | 0.8,82,1,0,1,0 57 | 1.0,49,1,0,1,0 58 | 1.3,60,1,0,1,0 59 | 1.6,64,1,0,1,0 60 | 1.8,74,1,0,1,0 61 | 1.9,72,1,0,1,0 62 | 1.9,53,1,0,1,0 63 | 3.2,54,1,0,1,0 64 | 3.5,81,1,0,1,0 65 | 3.7,52,0,0,1,0 66 | 4.5,66,0,0,1,0 67 | 4.8,54,0,0,1,0 68 | 4.8,63,0,0,1,0 69 | 5.0,59,1,0,1,0 70 | 5.0,49,0,0,1,0 71 | 5.1,69,0,0,1,0 72 | 6.3,70,1,0,1,0 73 | 6.4,65,1,0,1,0 74 | 6.5,65,0,0,1,0 75 | 7.8,68,1,0,1,0 76 | 8.0,78,0,0,1,0 77 | 9.3,69,0,0,1,0 78 | 10.1,51,0,0,1,0 79 | 0.1,65,1,0,0,1 80 | 0.3,71,1,0,0,1 81 | 0.4,76,1,0,0,1 82 | 0.8,65,1,0,0,1 83 | 0.8,78,1,0,0,1 84 | 1.0,41,1,0,0,1 85 | 1.5,68,1,0,0,1 86 | 2.0,69,1,0,0,1 87 | 2.3,62,1,0,0,1 88 | 2.9,74,0,0,0,1 89 | 3.6,71,1,0,0,1 90 | 3.8,84,1,0,0,1 91 | 4.3,48,0,0,0,1 92 | -------------------------------------------------------------------------------- /perf_tests/batch_vs_single.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | from time import time 3 | import pandas as pd 4 | import numpy as np 5 | from lifelines.datasets import load_rossi 6 | from lifelines import CoxPHFitter 7 | import statsmodels.api as sm 8 | 9 | # This compares the batch algorithm (in CTV) vs the single iteration algorithm (original in CPH) 10 | # N vs (% ties == unique(T) / N) 11 | 12 | 13 | ROSSI_ROWS = 432 14 | results = {} 15 | 16 | 17 | for n_copies in [1, 2, 4, 6, 8, 10, 13, 17, 20, 25]: 18 | 19 | # lower percents means more ties. 
20 | # original rossi dataset has 0.113 21 | for fraction in np.linspace(0.01, 0.99, 15): 22 | print(n_copies, fraction) 23 | 24 | df = pd.concat([load_rossi()] * n_copies) 25 | n_unique_durations = int(df.shape[0] * fraction) + 1 26 | unique_durations = np.round(np.random.exponential(10, size=n_unique_durations), 5) 27 | 28 | df["week"] = np.tile(unique_durations, int(np.ceil(1 / fraction)))[: df.shape[0]] 29 | 30 | batch_results = [] 31 | for _ in range(3): 32 | cph_batch = CoxPHFitter() 33 | start_time = time() 34 | cph_batch.fit(df, "week", "arrest", batch_mode=True) 35 | batch_results.append(time() - start_time) 36 | 37 | single_results = [] 38 | for _ in range(3): 39 | cph_single = CoxPHFitter() 40 | start_time = time() 41 | cph_single.fit(df, "week", "arrest", batch_mode=False) 42 | single_results.append(time() - start_time) 43 | 44 | batch_time = min(batch_results) 45 | single_time = min(single_results) 46 | print({"batch": batch_time, "single": single_time}) 47 | results[(n_copies * ROSSI_ROWS, fraction)] = {"batch": batch_time, "single": single_time} 48 | 49 | results = pd.DataFrame(results).T.sort_index() 50 | results = results.reset_index() 51 | results = results.rename(columns={"level_0": "N", "level_1": "frac"}) 52 | results["ratio"] = results["batch"] / results["single"] 53 | 54 | print(results) 55 | results.to_csv("perf_results.csv", index=False) 56 | 57 | 58 | results["N * frac"] = results["N"] * results["frac"] 59 | 60 | X = results[["N", "frac", "N * frac"]] 61 | X = sm.add_constant(X) 62 | 63 | Y = results["ratio"] 64 | 65 | 66 | model = sm.OLS(Y, X).fit() 67 | print(model.summary()) 68 | print(model.params) 69 | -------------------------------------------------------------------------------- /lifelines/datasets/multicenter_aids_cohort.tsv: -------------------------------------------------------------------------------- 1 | i AIDSY W T D 2 | 1 1990.425 4.575 7.575 0 3 | 2 1991.250 3.750 6.750 0 4 | 3 1992.014 2.986 5.986 0 5 | 4 1992.030 2.970 5.970 0 6 | 5 1992.072 2.928 5.928 0 7 | 6 1992.220 2.780 4.688 1 8 | 7 1992.374 2.626 5.626 0 9 | 8 1992.389 2.611 5.611 0 10 | 9 1992.450 2.550 5.550 0 11 | 10 1992.653 2.347 5.347 0 12 | 11 1992.825 2.175 3.842 0 13 | 12 1992.906 2.094 3.655 1 14 | 13 1992.911 2.089 3.062 1 15 | 14 1992.958 2.042 5.042 0 16 | 15 1993.264 1.736 4.653 0 17 | 16 1993.384 1.616 2.729 1 18 | 17 1993.436 1.564 4.564 0 19 | 18 1993.439 1.561 2.897 1 20 | 19 1993.444 1.556 4.556 0 21 | 20 1993.503 1.497 2.024 1 22 | 21 1993.533 1.467 2.400 1 23 | 22 1993.637 1.363 3.043 1 24 | 23 1993.700 1.300 4.300 0 25 | 24 1994.081 0.919 1.169 1 26 | 25 1994.137 0.863 3.863 0 27 | 26 1994.189 0.811 3.811 0 28 | 27 1994.212 0.788 3.788 0 29 | 28 1994.228 0.772 3.772 0 30 | 29 1994.253 0.747 1.894 1 31 | 30 1994.358 0.642 1.951 1 32 | 31 1994.538 0.462 3.462 0 33 | 32 1994.664 0.336 3.336 0 34 | 33 1994.708 0.292 1.125 0 35 | 34 1994.734 0.266 1.258 1 36 | 35 1994.742 0.258 3.258 0 37 | 36 1994.798 0.202 3.202 0 38 | 37 1994.814 0.186 3.186 0 39 | 38 1994.836 0.164 0.973 1 40 | 39 1994.872 0.128 3.128 0 41 | 40 1994.903 0.097 1.794 1 42 | 41 1994.933 0.067 0.962 1 43 | 42 1994.950 0.050 1.255 1 44 | 43 1995.059 0.000 2.941 0 45 | 44 1995.070 0.000 1.619 1 46 | 45 1995.103 0.000 2.897 0 47 | 46 1995.169 0.000 1.619 1 48 | 47 1995.178 0.000 2.456 1 49 | 48 1995.189 0.000 1.752 1 50 | 49 1995.202 0.000 2.798 0 51 | 50 1995.231 0.000 2.769 0 52 | 51 1995.239 0.000 0.791 1 53 | 52 1995.247 0.000 2.753 0 54 | 53 1995.280 0.000 2.720 0 55 | 54 1995.286 0.000 1.881 0 56 | 55 
1995.286 0.000 2.714 0 57 | 56 1995.309 0.000 1.322 1 58 | 57 1995.342 0.000 2.658 0 59 | 58 1995.384 0.000 1.216 1 60 | 59 1995.478 0.000 0.269 1 61 | 60 1995.481 0.000 2.500 1 62 | 61 1995.664 0.000 2.336 0 63 | 62 1995.869 0.000 2.131 0 64 | 63 1995.897 0.000 2.103 0 65 | 64 1995.914 0.000 0.086 0 66 | 65 1995.936 0.000 2.064 0 67 | 66 1995.941 0.000 2.059 0 68 | 67 1996.027 0.000 1.107 1 69 | 68 1996.350 0.000 0.067 0 70 | 69 1996.384 0.000 1.616 0 71 | 70 1996.486 0.000 1.431 0 72 | 71 1996.530 0.000 1.470 0 73 | 72 1996.572 0.000 0.820 1 74 | 73 1997.011 0.000 0.989 0 75 | 74 1997.422 0.000 0.578 0 76 | 75 1997.511 0.000 0.489 0 77 | 76 1997.597 0.000 0.403 0 78 | 77 1997.650 0.000 0.350 0 79 | 78 1997.847 0.000 0.153 0 80 | -------------------------------------------------------------------------------- /lifelines/datasets/CuZn-LeftCensoredDataset.csv: -------------------------------------------------------------------------------- 1 | E,T,group 2 | 0,1.0,alluvial_fan 3 | 0,1.0,alluvial_fan 4 | 0,1.0,alluvial_fan 5 | 0,1.0,alluvial_fan 6 | 1,1.0,alluvial_fan 7 | 1,1.0,alluvial_fan 8 | 1,1.0,alluvial_fan 9 | 1,1.0,alluvial_fan 10 | 1,1.0,alluvial_fan 11 | 1,2.0,alluvial_fan 12 | 1,2.0,alluvial_fan 13 | 1,2.0,alluvial_fan 14 | 1,2.0,alluvial_fan 15 | 1,2.0,alluvial_fan 16 | 1,2.0,alluvial_fan 17 | 1,2.0,alluvial_fan 18 | 1,2.0,alluvial_fan 19 | 1,2.0,alluvial_fan 20 | 1,2.0,alluvial_fan 21 | 1,2.0,alluvial_fan 22 | 1,2.0,alluvial_fan 23 | 1,2.0,alluvial_fan 24 | 1,2.0,alluvial_fan 25 | 1,2.0,alluvial_fan 26 | 1,2.0,alluvial_fan 27 | 1,2.0,alluvial_fan 28 | 1,2.0,alluvial_fan 29 | 1,2.0,alluvial_fan 30 | 1,2.0,alluvial_fan 31 | 1,2.0,alluvial_fan 32 | 1,3.0,alluvial_fan 33 | 1,3.0,alluvial_fan 34 | 1,3.0,alluvial_fan 35 | 1,3.0,alluvial_fan 36 | 1,3.0,alluvial_fan 37 | 1,3.0,alluvial_fan 38 | 1,4.0,alluvial_fan 39 | 1,4.0,alluvial_fan 40 | 1,4.0,alluvial_fan 41 | 0,5.0,alluvial_fan 42 | 0,5.0,alluvial_fan 43 | 0,5.0,alluvial_fan 44 | 0,5.0,alluvial_fan 45 | 0,5.0,alluvial_fan 46 | 0,5.0,alluvial_fan 47 | 0,5.0,alluvial_fan 48 | 0,5.0,alluvial_fan 49 | 1,5.0,alluvial_fan 50 | 1,5.0,alluvial_fan 51 | 1,5.0,alluvial_fan 52 | 1,7.0,alluvial_fan 53 | 1,7.0,alluvial_fan 54 | 1,7.0,alluvial_fan 55 | 1,8.0,alluvial_fan 56 | 1,9.0,alluvial_fan 57 | 0,1.0,basin_trough 58 | 0,1.0,basin_trough 59 | 1,1.0,basin_trough 60 | 1,1.0,basin_trough 61 | 1,1.0,basin_trough 62 | 1,1.0,basin_trough 63 | 1,1.0,basin_trough 64 | 1,1.0,basin_trough 65 | 1,1.0,basin_trough 66 | 0,2.0,basin_trough 67 | 0,2.0,basin_trough 68 | 1,2.0,basin_trough 69 | 1,2.0,basin_trough 70 | 1,2.0,basin_trough 71 | 1,2.0,basin_trough 72 | 1,3.0,basin_trough 73 | 1,3.0,basin_trough 74 | 1,3.0,basin_trough 75 | 1,3.0,basin_trough 76 | 1,3.0,basin_trough 77 | 1,3.0,basin_trough 78 | 1,3.0,basin_trough 79 | 1,3.0,basin_trough 80 | 1,4.0,basin_trough 81 | 1,4.0,basin_trough 82 | 1,4.0,basin_trough 83 | 1,4.0,basin_trough 84 | 1,4.0,basin_trough 85 | 0,5.0,basin_trough 86 | 0,5.0,basin_trough 87 | 0,5.0,basin_trough 88 | 0,5.0,basin_trough 89 | 0,5.0,basin_trough 90 | 1,5.0,basin_trough 91 | 1,6.0,basin_trough 92 | 1,6.0,basin_trough 93 | 1,8.0,basin_trough 94 | 1,9.0,basin_trough 95 | 1,9.0,basin_trough 96 | 0,10.0,basin_trough 97 | 0,10.0,basin_trough 98 | 0,10.0,basin_trough 99 | 0,10.0,basin_trough 100 | 1,12.0,basin_trough 101 | 1,14.0,basin_trough 102 | 0,15.0,basin_trough 103 | 1,15.0,basin_trough 104 | 1,17.0,basin_trough 105 | 1,23.0,basin_trough 106 | 
-------------------------------------------------------------------------------- /lifelines/utils/lowess.py: -------------------------------------------------------------------------------- 1 | """ 2 | This module implements the Lowess function for nonparametric regression. 3 | Functions: 4 | lowess Fit a smooth nonparametric regression curve to a scatterplot. 5 | For more information, see 6 | William S. Cleveland: "Robust locally weighted regression and smoothing 7 | scatterplots", Journal of the American Statistical Association, December 1979, 8 | volume 74, number 368, pp. 829-836. 9 | William S. Cleveland and Susan J. Devlin: "Locally weighted regression: An 10 | approach to regression analysis by local fitting", Journal of the American 11 | Statistical Association, September 1988, volume 83, number 403, pp. 596-610. 12 | """ 13 | 14 | # Authors: Alexandre Gramfort 15 | # 16 | # License: BSD (3-clause) 17 | 18 | 19 | # Slight updates in lifelines 0.16.0, 2018 20 | 21 | from math import ceil 22 | import numpy as np 23 | from scipy import linalg 24 | 25 | 26 | def lowess(x, y, f=2.0 / 3.0, iterations=3): 27 | """lowess(x, y, f=2./3., iter=3) -> yest 28 | Lowess smoother: Robust locally weighted regression. 29 | The lowess function fits a nonparametric regression curve to a scatterplot. 30 | The arrays x and y contain an equal number of elements; each pair 31 | (x[i], y[i]) defines a data point in the scatterplot. The function returns 32 | the estimated (smooth) values of y. 33 | The smoothing span is given by f. A larger value for f will result in a 34 | smoother curve. The number of robustifying iterations is given by iter. The 35 | function will run faster with a smaller number of iterations. 36 | """ 37 | n = len(x) 38 | r = int(ceil(f * n)) 39 | h = [np.sort(np.abs(x - x[i]))[r] for i in range(n)] 40 | w = np.clip(np.abs((x[:, None] - x[None, :]) / h), 0.0, 1.0) 41 | w = (1 - w ** 3) ** 3 42 | yest = np.zeros(n) 43 | delta = np.ones(n) 44 | for _ in range(iterations): 45 | for i in range(n): 46 | weights = delta * w[:, i] 47 | b = np.array([np.sum(weights * y), np.sum(weights * y * x)]) 48 | A = np.array([[np.sum(weights), np.sum(weights * x)], [np.sum(weights * x), np.sum(weights * x * x)]]) 49 | # I think it is safe to assume this. 50 | # pylint: disable=unexpected-keyword-arg 51 | beta = linalg.solve(A, b, assume_a="pos", check_finite=False) 52 | yest[i] = beta[0] + beta[1] * x[i] 53 | 54 | residuals = y - yest 55 | s = np.median(np.abs(residuals)) 56 | delta = np.clip(residuals / (6.0 * s), -1, 1) 57 | delta = (1 - delta ** 2) ** 2 58 | 59 | return yest 60 | -------------------------------------------------------------------------------- /CONTRIBUTING.md: -------------------------------------------------------------------------------- 1 | ## Contributing to lifelines 2 | 3 | 4 | ### Questions about survival analysis? 5 | If you are using lifelines for survival analysis and have a question about "how do I do X?" or "what does Y do?", the best place to ask that is either in our [gitter channel](https://gitter.im/python-lifelines/Lobby) or at [stats.stackexchange.com](https://stats.stackexchange.com/). 6 | 7 | 8 | ### Submitting bugs or other errors observed 9 | 10 | We appreciate all bug reports submitted, as this will help the entire community get a better product. Please open up an issue in the Github Repository. If possible, please provide a code snippet, and what version of lifelines you are using. 
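For example, a minimal snippet for capturing that version string (assuming a standard install, where the top-level package exposes `__version__`):

    import lifelines
    print(lifelines.__version__)  # paste the printed version into the issue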
11 | 12 | 13 | ### Submitting new feature requests 14 | 15 | Please open up an issue in the Github Repository with as much context as possible about the feature you would like to see. It is also useful to link to other libraries/software that have that feature. 16 | 17 | 18 | ### Submitting code, or other changes 19 | 20 | If you are interested in contributing to lifelines (and we thank you for the interest!), we recommend first opening up an issue in the GitHub repository to discuss the changes. From there, we can together plan how to execute the changes. See the Development section below for how to set up a local environment. 21 | 22 | ## Development 23 | 24 | ### Setting up a lifelines development environment 25 | 26 | 1. From the root directory of `lifelines` activate your [virtual environment](https://realpython.com/python-virtual-environments-a-primer/) (if you plan to use one). 27 | 2. Install the development requirements and [`pre-commit`](https://pre-commit.com) hooks. If you are on Mac, Linux, or [Windows `WSL`](https://docs.microsoft.com/en-us/windows/wsl/faq) you can use the provided [`Makefile`](https://github.com/CamDavidsonPilon/lifelines/blob/master/Makefile). Just type `make` into the console and you're ready to start developing. This will also install the dev-requirements. 28 | 29 | ### Formatting 30 | 31 | `lifelines` uses the [`black`](https://github.com/ambv/black) python formatter. 32 | There are 3 different ways to format your code. 33 | 1. Use the [`Makefile`](https://github.com/CamDavidsonPilon/lifelines/blob/master/Makefile). 34 | * `make lint` 35 | 2. Call `black` directly and pass the correct line length. 36 | * `black . -l 120` 37 | 3. Have your code formatted automatically during commit with the `pre-commit` hook. 38 | * stage and commit your unformatted changes: `git commit -m "your_commit_message"` 39 | * Code that needs to be formatted will "fail" the commit hooks and be formatted for you. 40 | * Stage the newly formatted python code: `git add *.py` 41 | * Recall your original commit command and commit again: `git commit -m "your_commit_message"` 42 | 43 | ### Running the tests 44 | 45 | You can optionally run the test suite after install with 46 | 47 | py.test 48 | -------------------------------------------------------------------------------- /docs/index.rst: -------------------------------------------------------------------------------- 1 | .. lifelines documentation master file, created by 2 | sphinx-quickstart on Sun Feb 2 17:10:21 2014. 3 | You can adapt this file completely to your liking, but it should at least 4 | contain the root `toctree` directive. 5 | 6 | .. image:: http://i.imgur.com/EOowdSD.png 7 | 8 | ------------------------------------- 9 | 10 | 11 | lifelines 12 | ===================================== 13 | 14 | *lifelines* is an implementation of survival analysis in Python. What 15 | benefits does *lifelines* offer over other survival analysis 16 | implementations? 17 | 18 | - built on top of Pandas 19 | - internal plotting methods 20 | - simple and intuitive API 21 | - only focus is survival analysis 22 | 23 | 24 | Contents: 25 | ============ 26 | 27 | .. toctree:: 28 | :maxdepth: 1 29 | :caption: Quickstart & Intro 30 | 31 | Quickstart 32 | Survival Analysis intro 33 | 34 | ..
toctree:: 35 | :maxdepth: 1 36 | :caption: Univariate Models 37 | 38 | Survival analysis with lifelines 39 | jupyter_notebooks/Piecewise Exponential Models and Creating Custom Models.ipynb 40 | jupyter_notebooks/Modelling time-lagged conversion rates.ipynb 41 | 42 | .. toctree:: 43 | :maxdepth: 1 44 | :caption: Regression Models 45 | 46 | Survival Regression 47 | Time varying survival regression 48 | jupyter_notebooks/Proportional hazard assumption.ipynb 49 | jupyter_notebooks/Cox residuals.ipynb 50 | 51 | .. toctree:: 52 | :maxdepth: 1 53 | :caption: Detailed documentation 54 | 55 | Examples 56 | References 57 | 58 | .. toctree:: 59 | :maxdepth: 1 60 | :caption: About lifelines 61 | 62 | Changelog 63 | Citing lifelines 64 | 65 | .. toctree:: 66 | :maxdepth: 1 67 | :caption: Questions? Suggestions? 68 | 69 | Gitter channel 70 | Create a GitHub issue 71 | Development blog 72 | 73 | Installation 74 | ------------------------------ 75 | 76 | 77 | .. code-block:: console 78 | 79 | pip install lifelines 80 | 81 | 82 | Source code and issue tracker 83 | ------------------------------ 84 | 85 | Available on Github, `CamDavidsonPilon/lifelines `_. 86 | Please report bugs, issues and feature extensions there. We also have `Gitter channel `_ available to discuss survival analysis and *lifelines*: 87 | 88 | Citing *lifelines* 89 | ------------------------------ 90 | 91 | The following link will bring you to a page where you can find the latest citation for *lifelines*: 92 | 93 | `Citation for lifelines `_ 94 | 95 | 96 | Indices and tables 97 | ================== 98 | 99 | * :ref:`genindex` 100 | * :ref:`modindex` 101 | * :ref:`search` 102 | -------------------------------------------------------------------------------- /tests/utils/test_concordance.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | 3 | import pytest 4 | import numpy as np 5 | import pandas as pd 6 | 7 | from lifelines import CoxPHFitter 8 | from lifelines.datasets import load_rossi 9 | 10 | from lifelines.utils.concordance import concordance_index 11 | from lifelines.utils.concordance import concordance_index as fast_cindex 12 | from lifelines.utils.concordance import naive_concordance_index as slow_cindex 13 | 14 | 15 | def test_concordance_index_returns_same_after_shifting(): 16 | T = np.array([1, 2, 3, 4, 5, 6]) 17 | T_ = np.array([2, 1, 4, 6, 5, 3]) 18 | assert ( 19 | concordance_index(T, T_) 20 | == concordance_index(T - 5, T_ - 5) 21 | == concordance_index(T, T_ - 5) 22 | == concordance_index(T - 5, T_) 23 | ) 24 | 25 | 26 | def test_both_concordance_index_function_deal_with_ties_the_same_way(): 27 | actual_times = np.array([1, 1, 2]) 28 | predicted_times = np.array([1, 2, 3]) 29 | obs = np.ones(3) 30 | assert fast_cindex(actual_times, predicted_times, obs) == slow_cindex(actual_times, predicted_times, obs) == 1.0 31 | 32 | 33 | def test_both_concordance_index_with_only_censoring_fails_gracefully(): 34 | actual_times = np.array([1, 2, 3]) 35 | predicted_times = np.array([1, 2, 3]) 36 | obs = np.zeros(3) 37 | with pytest.raises(ZeroDivisionError, match="admissable pairs"): 38 | fast_cindex(actual_times, predicted_times, obs) 39 | 40 | with pytest.raises(ZeroDivisionError, match="admissable pairs"): 41 | slow_cindex(actual_times, predicted_times, obs) 42 | 43 | 44 | def test_concordance_index_function_exits(): 45 | N = 10 * 1000 46 | actual_times = np.random.exponential(1, size=N) 47 | predicted_times = np.random.exponential(1, size=N) 48 | obs = np.ones(N) 49 | 
assert fast_cindex(actual_times, predicted_times, obs) 50 | 51 | 52 | def test_concordance_index_will_not_overflow(): 53 | a = np.arange(65536) 54 | assert concordance_index(a, a) == 1.0 55 | b = np.arange(65537) 56 | assert concordance_index(b, b) == 1.0 57 | assert concordance_index(b, b[::-1]) == 0.0 58 | 59 | 60 | def test_concordance_index_fast_is_same_as_slow(): 61 | size = 100 62 | T = np.random.normal(size=size) 63 | P = np.random.normal(size=size) 64 | C = np.random.choice([0, 1], size=size) 65 | Z = np.zeros_like(T) 66 | 67 | # Hard to imagine these failing 68 | assert slow_cindex(T, Z, C) == fast_cindex(T, Z, C) 69 | assert slow_cindex(T, T, C) == fast_cindex(T, T, C) 70 | # This is the real test though 71 | assert slow_cindex(T, P, C) == fast_cindex(T, P, C) 72 | 73 | cp = CoxPHFitter() 74 | df = load_rossi() 75 | cp.fit(df, duration_col="week", event_col="arrest") 76 | 77 | T = cp.durations.values.ravel() 78 | P = -cp.predict_partial_hazard(df[df.columns.difference(["week", "arrest"])]).values.ravel() 79 | 80 | E = cp.event_observed.values.ravel() 81 | 82 | assert slow_cindex(T, P, E) == fast_cindex(T, P, E) 83 | -------------------------------------------------------------------------------- /lifelines/datasets/dfcv_dataset.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | import pandas as pd 3 | from lifelines.utils import add_covariate_to_timeline 4 | from lifelines.utils import to_long_format 5 | 6 | df = pd.DataFrame( 7 | [ 8 | [1, 3, True, 1], 9 | [6, 4, False, 0], 10 | [3, 5, True, 1], 11 | [2, 5, False, 1], 12 | [4, 6, True, 1], 13 | [7, 7, True, 0], 14 | [8, 8, False, 0], 15 | [5, 8, False, 1], 16 | [9, 9, True, 0], 17 | [10, 10, True, 0], 18 | ], 19 | columns=["id", "time", "event", "group"], 20 | ) 21 | 22 | 23 | df = to_long_format(df, "time") 24 | 25 | cv = pd.DataFrame.from_records( 26 | [ 27 | {"id": 1, "z": 0, "time": 0}, 28 | {"id": 6, "z": 1, "time": 0}, 29 | {"id": 3, "z": 1, "time": 0}, 30 | {"id": 2, "z": 0, "time": 0}, 31 | {"id": 4, "z": 0, "time": 0}, 32 | {"id": 7, "z": 0, "time": 0}, 33 | {"id": 8, "z": 0, "time": 0}, 34 | {"id": 5, "z": 0, "time": 0}, 35 | {"id": 9, "z": 0, "time": 0}, 36 | {"id": 10, "z": 0, "time": 0}, 37 | {"id": 1, "z": 0, "time": 3}, 38 | {"id": 6, "z": 1, "time": 3}, 39 | {"id": 3, "z": 1, "time": 3}, 40 | {"id": 2, "z": 0, "time": 3}, 41 | {"id": 4, "z": 0, "time": 3}, 42 | {"id": 7, "z": 0, "time": 3}, 43 | {"id": 8, "z": 0, "time": 3}, 44 | {"id": 5, "z": 0, "time": 3}, 45 | {"id": 9, "z": 0, "time": 3}, 46 | {"id": 10, "z": 1, "time": 3}, 47 | {"id": 6, "z": 1, "time": 4}, 48 | {"id": 3, "z": 1, "time": 4}, 49 | {"id": 2, "z": 0, "time": 4}, 50 | {"id": 4, "z": 0, "time": 4}, 51 | {"id": 7, "z": 0, "time": 4}, 52 | {"id": 8, "z": 0, "time": 4}, 53 | {"id": 5, "z": 0, "time": 4}, 54 | {"id": 9, "z": 0, "time": 4}, 55 | {"id": 10, "z": 1, "time": 4}, 56 | {"id": 3, "z": 1, "time": 5}, 57 | {"id": 2, "z": 0, "time": 5}, 58 | {"id": 4, "z": 0, "time": 5}, 59 | {"id": 7, "z": 1, "time": 5}, 60 | {"id": 8, "z": 0, "time": 5}, 61 | {"id": 5, "z": 0, "time": 5}, 62 | {"id": 9, "z": 1, "time": 5}, 63 | {"id": 10, "z": 1, "time": 5}, 64 | {"id": 4, "z": 0, "time": 6}, 65 | {"id": 7, "z": 1, "time": 6}, 66 | {"id": 8, "z": 0, "time": 6}, 67 | {"id": 5, "z": 1, "time": 6}, 68 | {"id": 9, "z": 1, "time": 6}, 69 | {"id": 10, "z": 1, "time": 6}, 70 | {"id": 7, "z": 1, "time": 7}, 71 | {"id": 8, "z": 0, "time": 7}, 72 | {"id": 5, "z": 1, "time": 7}, 73 | {"id": 9, "z": 1, 
"time": 7}, 74 | {"id": 10, "z": 1, "time": 7}, 75 | {"id": 8, "z": 0, "time": 8}, 76 | {"id": 5, "z": 1, "time": 8}, 77 | {"id": 9, "z": 1, "time": 8}, 78 | {"id": 10, "z": 1, "time": 8}, 79 | {"id": 9, "z": 1, "time": 9}, 80 | {"id": 10, "z": 1, "time": 9}, 81 | ] 82 | ) 83 | 84 | dfcv = add_covariate_to_timeline(df, cv, "id", "time", "event", add_enum=False) 85 | -------------------------------------------------------------------------------- /lifelines/fitters/exponential_fitter.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | 3 | 4 | import numpy as np 5 | from lifelines.fitters import KnownModelParametericUnivariateFitter 6 | 7 | 8 | class ExponentialFitter(KnownModelParametericUnivariateFitter): 9 | r""" 10 | This class implements an Exponential model for univariate data. The model has parameterized 11 | form: 12 | 13 | .. math:: S(t) = \exp\left(\frac{-t}{\lambda}\right), \lambda >0 14 | 15 | which implies the cumulative hazard rate is 16 | 17 | .. math:: H(t) = \frac{t}{\lambda} 18 | 19 | and the hazard rate is: 20 | 21 | .. math:: h(t) = \frac{1}{\lambda} 22 | 23 | After calling the `.fit` method, you have access to properties like: ``survival_function_``, ``lambda_``, ``cumulative_hazard_`` 24 | A summary of the fit is available with the method ``print_summary()`` 25 | 26 | Parameters 27 | ----------- 28 | alpha: float, optional (default=0.05) 29 | the level in the confidence intervals. 30 | 31 | Important 32 | ---------- 33 | The parameterization of this model changed in lifelines 0.19.0. Previously, the cumulative hazard looked like 34 | :math:`\lambda t`. The parameterization is now the reciprocal of :math:`\lambda`. 35 | 36 | Attributes 37 | ---------- 38 | cumulative_hazard_ : DataFrame 39 | The estimated cumulative hazard (with custom timeline if provided) 40 | confidence_interval_cumulative_hazard_ : DataFrame 41 | The lower and upper confidence intervals for the cumulative hazard 42 | hazard_ : DataFrame 43 | The estimated hazard (with custom timeline if provided) 44 | confidence_interval_hazard_ : DataFrame 45 | The lower and upper confidence intervals for the hazard 46 | survival_function_ : DataFrame 47 | The estimated survival function (with custom timeline if provided) 48 | confidence_interval_survival_function_ : DataFrame 49 | The lower and upper confidence intervals for the survival function 50 | variance_matrix_ : numpy array 51 | The variance matrix of the coefficients 52 | median_: float 53 | The median time to event 54 | lambda_: float 55 | The fitted parameter in the model 56 | durations: array 57 | The durations provided 58 | event_observed: array 59 | The event_observed variable provided 60 | timeline: array 61 | The time line to use for plotting and indexing 62 | entry: array or None 63 | The entry array provided, or None 64 | cumumlative_density_ : DataFrame 65 | The estimated cumulative density function (with custom timeline if provided) 66 | confidence_interval_cumumlative_density_ : DataFrame 67 | The lower and upper confidence intervals for the cumulative density 68 | """ 69 | 70 | _fitted_parameter_names = ["lambda_"] 71 | 72 | @property 73 | def median_(self): 74 | return np.log(2) / self.lambda_ 75 | 76 | def _cumulative_hazard(self, params, times): 77 | lambda_ = params[0] 78 | return times / lambda_ 79 | -------------------------------------------------------------------------------- /lifelines/datasets/waltons_dataset.csv: 
-------------------------------------------------------------------------------- 1 | T,E,group 2 | 6.0,1,miR-137 3 | 13.0,1,miR-137 4 | 13.0,1,miR-137 5 | 13.0,1,miR-137 6 | 19.0,1,miR-137 7 | 19.0,1,miR-137 8 | 19.0,1,miR-137 9 | 26.0,1,miR-137 10 | 26.0,1,miR-137 11 | 26.0,1,miR-137 12 | 26.0,1,miR-137 13 | 26.0,1,miR-137 14 | 33.0,1,miR-137 15 | 33.0,1,miR-137 16 | 47.0,1,miR-137 17 | 62.0,1,miR-137 18 | 62.0,1,miR-137 19 | 9.0,1,miR-137 20 | 9.0,1,miR-137 21 | 9.0,1,miR-137 22 | 15.0,1,miR-137 23 | 15.0,1,miR-137 24 | 22.0,1,miR-137 25 | 22.0,1,miR-137 26 | 22.0,1,miR-137 27 | 22.0,1,miR-137 28 | 29.0,1,miR-137 29 | 29.0,1,miR-137 30 | 29.0,1,miR-137 31 | 29.0,1,miR-137 32 | 29.0,1,miR-137 33 | 36.0,1,miR-137 34 | 36.0,1,miR-137 35 | 43.0,1,miR-137 36 | 33.0,1,control 37 | 54.0,1,control 38 | 54.0,1,control 39 | 61.0,1,control 40 | 61.0,1,control 41 | 61.0,0,control 42 | 61.0,1,control 43 | 61.0,0,control 44 | 61.0,1,control 45 | 61.0,1,control 46 | 61.0,1,control 47 | 61.0,1,control 48 | 61.0,1,control 49 | 61.0,1,control 50 | 69.0,1,control 51 | 69.0,1,control 52 | 69.0,1,control 53 | 69.0,1,control 54 | 69.0,1,control 55 | 69.0,1,control 56 | 69.0,0,control 57 | 69.0,1,control 58 | 69.0,1,control 59 | 69.0,1,control 60 | 69.0,1,control 61 | 32.0,1,control 62 | 53.0,1,control 63 | 53.0,1,control 64 | 60.0,1,control 65 | 60.0,1,control 66 | 60.0,1,control 67 | 60.0,1,control 68 | 60.0,1,control 69 | 68.0,1,control 70 | 68.0,1,control 71 | 68.0,1,control 72 | 68.0,1,control 73 | 68.0,0,control 74 | 68.0,1,control 75 | 68.0,1,control 76 | 68.0,1,control 77 | 68.0,1,control 78 | 68.0,1,control 79 | 75.0,1,control 80 | 17.0,1,control 81 | 51.0,1,control 82 | 51.0,1,control 83 | 51.0,1,control 84 | 58.0,1,control 85 | 58.0,1,control 86 | 58.0,1,control 87 | 58.0,1,control 88 | 66.0,1,control 89 | 66.0,1,control 90 | 7.0,1,control 91 | 7.0,0,control 92 | 41.0,1,control 93 | 41.0,1,control 94 | 41.0,1,control 95 | 41.0,1,control 96 | 41.0,1,control 97 | 41.0,1,control 98 | 41.0,1,control 99 | 48.0,1,control 100 | 48.0,1,control 101 | 48.0,1,control 102 | 48.0,1,control 103 | 48.0,1,control 104 | 48.0,1,control 105 | 48.0,1,control 106 | 48.0,1,control 107 | 56.0,1,control 108 | 56.0,1,control 109 | 56.0,1,control 110 | 56.0,1,control 111 | 56.0,1,control 112 | 56.0,1,control 113 | 56.0,1,control 114 | 56.0,1,control 115 | 56.0,1,control 116 | 56.0,1,control 117 | 56.0,1,control 118 | 56.0,1,control 119 | 56.0,1,control 120 | 56.0,1,control 121 | 56.0,1,control 122 | 56.0,1,control 123 | 56.0,1,control 124 | 56.0,1,control 125 | 63.0,1,control 126 | 63.0,1,control 127 | 63.0,1,control 128 | 63.0,1,control 129 | 63.0,1,control 130 | 63.0,1,control 131 | 63.0,1,control 132 | 63.0,1,control 133 | 63.0,1,control 134 | 69.0,1,control 135 | 69.0,1,control 136 | 38.0,1,control 137 | 38.0,1,control 138 | 45.0,1,control 139 | 45.0,1,control 140 | 45.0,1,control 141 | 45.0,1,control 142 | 45.0,1,control 143 | 45.0,1,control 144 | 45.0,1,control 145 | 45.0,1,control 146 | 45.0,0,control 147 | 45.0,1,control 148 | 53.0,1,control 149 | 53.0,1,control 150 | 53.0,1,control 151 | 53.0,1,control 152 | 53.0,1,control 153 | 60.0,1,control 154 | 60.0,0,control 155 | 60.0,1,control 156 | 60.0,1,control 157 | 60.0,1,control 158 | 60.0,1,control 159 | 60.0,1,control 160 | 60.0,1,control 161 | 60.0,1,control 162 | 60.0,1,control 163 | 60.0,1,control 164 | 66.0,1,control 165 | -------------------------------------------------------------------------------- /lifelines/utils/gamma.py: 
-------------------------------------------------------------------------------- 1 | """ 2 | MIT License 3 | 4 | Copyright (c) 2018 Better 5 | 6 | Permission is hereby granted, free of charge, to any person obtaining a copy 7 | of this software and associated documentation files (the "Software"), to deal 8 | in the Software without restriction, including without limitation the rights 9 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 10 | copies of the Software, and to permit persons to whom the Software is 11 | furnished to do so, subject to the following conditions: 12 | 13 | The above copyright notice and this permission notice shall be included in all 14 | copies or substantial portions of the Software. 15 | 16 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 17 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 18 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 19 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 20 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 21 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 22 | SOFTWARE. 23 | 24 | Edited in 2019, Cameron Davidson-Pilon 25 | """ 26 | from autograd.extend import primitive, defvjp 27 | from autograd.numpy.numpy_vjps import unbroadcast_f # This is not documented 28 | from scipy.special import gammainc as gammainc_orig 29 | 30 | 31 | @primitive 32 | def gammainc(k, x): 33 | """ Lower regularized incomplete gamma function. 34 | We rely on `scipy.special.gammainc 35 | `_ 36 | for this. However, there is a number of issues using this function 37 | together with `autograd `_: 38 | 1. It doesn't let you take the gradient with respect to k 39 | 2. The gradient with respect to x is really slow 40 | As a really stupid workaround, because we don't need the numbers to 41 | be 100% exact, we just approximate the gradient. 42 | Side note 1: if you truly want to compute the correct derivative, see the 43 | `Wikipedia articule about the Incomplete gamma function 44 | `_ 45 | where the T(3, s, x) function can be implemented as 46 | .. code-block:: python 47 | def T3(s, x): 48 | return mpmath.meijerg(a_s=([], [0, 0]), b_s=([s-1, -1, -1], []), z=x) 49 | I wasted a few hours on this but sadly it turns out to be extremely slow. 
50 | Side note 2: TensorFlow actually has a `similar bug 51 | `_ 52 | """ 53 | return gammainc_orig(k, x) 54 | 55 | 56 | @primitive 57 | def gammainc2(k, x): 58 | return gammainc_orig(k, x) 59 | 60 | 61 | G_EPS = 1e-8 62 | 63 | defvjp( 64 | gammainc2, 65 | lambda ans, k, x: unbroadcast_f( 66 | k, lambda g: g * (gammainc_orig(k + G_EPS, x) - 2 * ans + gammainc_orig(k - G_EPS, x)) / G_EPS ** 2 67 | ), 68 | lambda ans, k, x: unbroadcast_f( 69 | x, lambda g: g * (gammainc_orig(k, x + G_EPS) - 2 * ans + gammainc_orig(k, x - G_EPS)) / G_EPS ** 2 70 | ), 71 | ) 72 | 73 | defvjp( 74 | gammainc, 75 | lambda ans, k, x: unbroadcast_f(k, lambda g: g * (gammainc2(k + G_EPS, x) - ans) / G_EPS), 76 | lambda ans, k, x: unbroadcast_f(x, lambda g: g * (gammainc2(k, x + G_EPS) - ans) / G_EPS), 77 | ) 78 | -------------------------------------------------------------------------------- /lifelines/fitters/log_normal_fitter.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | 3 | 4 | import autograd.numpy as np 5 | from autograd.scipy.stats import norm 6 | from lifelines.fitters import KnownModelParametericUnivariateFitter 7 | from lifelines.utils.logsf import logsf 8 | 9 | 10 | class LogNormalFitter(KnownModelParametericUnivariateFitter): 11 | r""" 12 | This class implements a Log Normal model for univariate data. The model has parameterized 13 | form: 14 | 15 | .. math:: S(t) = 1 - \Phi((\log(t) - \mu)/\sigma), \sigma >0 16 | 17 | where :math:`\Phi` is the CDF of a standard normal random variable. 18 | This implies the cumulative hazard rate is 19 | 20 | .. math:: H(t) = -\log(1 - \Phi((\log(t) - \mu)/\sigma)) 21 | 22 | After calling the `.fit` method, you have access to properties like: ``survival_function_``, ``mu_``, ``sigma_``. 23 | A summary of the fit is available with the method ``print_summary()``. 24 | 25 | Parameters 26 | ----------- 27 | alpha: float, optional (default=0.05) 28 | the level in the confidence intervals.
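(A usage sketch mirroring the Examples sections of the Weibull and log-logistic fitters elsewhere in this package; it assumes the same ``fit``/``plot`` API and the Waltons dataset those examples use.)

Examples
--------

>>> from lifelines import LogNormalFitter
>>> from lifelines.datasets import load_waltons
>>> waltons = load_waltons()
>>> lnf = LogNormalFitter()
>>> lnf.fit(waltons['T'], waltons['E'])
>>> lnf.plot()
>>> print(lnf.mu_)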
29 | 30 | 31 | Attributes 32 | ---------- 33 | cumulative_hazard_ : DataFrame 34 | The estimated cumulative hazard (with custom timeline if provided) 35 | confidence_interval_cumulative_hazard_ : DataFrame 36 | The lower and upper confidence intervals for the cumulative hazard 37 | hazard_ : DataFrame 38 | The estimated hazard (with custom timeline if provided) 39 | confidence_interval_hazard_ : DataFrame 40 | The lower and upper confidence intervals for the hazard 41 | survival_function_ : DataFrame 42 | The estimated survival function (with custom timeline if provided) 43 | confidence_interval_survival_function_ : DataFrame 44 | The lower and upper confidence intervals for the survival function 45 | cumumlative_density_ : DataFrame 46 | The estimated cumulative density function (with custom timeline if provided) 47 | confidence_interval_cumumlative_density_ : DataFrame 48 | The lower and upper confidence intervals for the cumulative density 49 | variance_matrix_ : numpy array 50 | The variance matrix of the coefficients 51 | median_: float 52 | The median time to event 53 | mu_: float 54 | The fitted parameter in the model 55 | sigma_: float 56 | The fitted parameter in the model 57 | durations: array 58 | The durations provided 59 | event_observed: array 60 | The event_observed variable provided 61 | timeline: array 62 | The time line to use for plotting and indexing 63 | entry: array or None 64 | The entry array provided, or None 65 | """ 66 | 67 | _fitted_parameter_names = ["mu_", "sigma_"] 68 | _bounds = [(None, None), (0, None)] 69 | 70 | @property 71 | def median_(self): 72 | return np.exp(self.mu_) 73 | 74 | def _cumulative_hazard(self, params, times): 75 | mu_, sigma_ = params 76 | Z = (np.log(times) - mu_) / sigma_ 77 | return -logsf(Z) 78 | 79 | def _log_hazard(self, params, times): 80 | mu_, sigma_ = params 81 | Z = (np.log(times) - mu_) / sigma_ 82 | return norm.logpdf(Z, loc=0, scale=1) - np.log(sigma_) - np.log(times) - logsf(Z) 83 | 84 | def _log_1m_sf(self, params, times): 85 | mu_, sigma_ = params 86 | Z = (np.log(times) - mu_) / sigma_ 87 | return norm.logcdf(Z, loc=0, scale=1) 88 | -------------------------------------------------------------------------------- /docs/lifelines.fitters.rst: -------------------------------------------------------------------------------- 1 | lifelines.fitters 2 | ================= 3 | 4 | 5 | lifelines.fitters.aalen\_additive\_fitter module 6 | ------------------------------------------------ 7 | 8 | .. automodule:: lifelines.fitters.aalen_additive_fitter 9 | :members: 10 | :undoc-members: 11 | 12 | lifelines.fitters.aalen\_johansen\_fitter module 13 | ------------------------------------------------ 14 | 15 | .. automodule:: lifelines.fitters.aalen_johansen_fitter 16 | :members: 17 | :undoc-members: 18 | 19 | lifelines.fitters.breslow\_fleming\_harrington\_fitter module 20 | ------------------------------------------------------------- 21 | 22 | .. automodule:: lifelines.fitters.breslow_fleming_harrington_fitter 23 | :members: 24 | :undoc-members: 25 | 26 | lifelines.fitters.cox\_time\_varying\_fitter module 27 | --------------------------------------------------- 28 | 29 | .. automodule:: lifelines.fitters.cox_time_varying_fitter 30 | :members: 31 | :undoc-members: 32 | 33 | lifelines.fitters.coxph\_fitter module 34 | -------------------------------------- 35 | 36 | .. 
automodule:: lifelines.fitters.coxph_fitter 37 | :members: 38 | :undoc-members: 39 | 40 | lifelines.fitters.exponential\_fitter module 41 | -------------------------------------------- 42 | 43 | .. automodule:: lifelines.fitters.exponential_fitter 44 | :members: 45 | :undoc-members: 46 | 47 | lifelines.fitters.kaplan\_meier\_fitter module 48 | ---------------------------------------------- 49 | 50 | .. automodule:: lifelines.fitters.kaplan_meier_fitter 51 | :members: 52 | :undoc-members: 53 | 54 | lifelines.fitters.log\_logistic\_fitter module 55 | ---------------------------------------------- 56 | 57 | .. automodule:: lifelines.fitters.log_logistic_fitter 58 | :members: 59 | :undoc-members: 60 | 61 | lifelines.fitters.log\_normal\_fitter module 62 | -------------------------------------------- 63 | 64 | .. automodule:: lifelines.fitters.log_normal_fitter 65 | :members: 66 | :undoc-members: 67 | 68 | lifelines.fitters.nelson\_aalen\_fitter module 69 | ---------------------------------------------- 70 | 71 | .. automodule:: lifelines.fitters.nelson_aalen_fitter 72 | :members: 73 | :undoc-members: 74 | 75 | lifelines.fitters.piecewise\_exponential\_fitter module 76 | ------------------------------------------------------- 77 | 78 | .. automodule:: lifelines.fitters.piecewise_exponential_fitter 79 | :members: 80 | :undoc-members: 81 | 82 | 83 | 84 | lifelines.fitters.weibull\_fitter module 85 | ------------------------------------------ 86 | 87 | .. automodule:: lifelines.fitters.weibull_fitter 88 | :members: 89 | :undoc-members: 90 | 91 | 92 | lifelines.fitters.weibull\_aft\_fitter module 93 | ------------------------------------------------- 94 | 95 | .. automodule:: lifelines.fitters.weibull_aft_fitter 96 | :members: 97 | :undoc-members: 98 | 99 | lifelines.fitters.log\_normal\_aft\_fitter module 100 | --------------------------------------------------- 101 | 102 | .. automodule:: lifelines.fitters.log_normal_aft_fitter 103 | :members: 104 | :undoc-members: 105 | 106 | lifelines.fitters.log\_logistic\_aft\_fitter module 107 | ----------------------------------------------------- 108 | 109 | .. automodule:: lifelines.fitters.log_logistic_aft_fitter 110 | :members: 111 | :undoc-members: 112 | 113 | 114 | 115 | .. automodule:: lifelines.fitters 116 | :members: 117 | :undoc-members: 118 | -------------------------------------------------------------------------------- /lifelines/fitters/log_logistic_fitter.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | import autograd.numpy as np 3 | 4 | from lifelines.fitters import KnownModelParametericUnivariateFitter 5 | 6 | 7 | class LogLogisticFitter(KnownModelParametericUnivariateFitter): 8 | 9 | r""" 10 | This class implements a Log-Logistic model for univariate data. The model has parameterized 11 | form: 12 | 13 | .. math:: S(t) = \left(1 + \left(\frac{t}{\alpha}\right)^{\beta}\right)^{-1}, \alpha > 0, \beta > 0, 14 | 15 | and the hazard rate is: 16 | 17 | .. math:: h(t) = \frac{\left(\frac{\beta}{\alpha}\right)\left(\frac{t}{\alpha}\right) ^ {\beta-1}}{\left(1 + \left(\frac{t}{\alpha}\right)^{\beta}\right)} 18 | 19 | and the cumulative hazard is: 20 | 21 | .. math:: H(t) = \log\left(\left(\frac{t}{\alpha}\right) ^ {\beta} + 1\right) 22 | 23 | After calling the `.fit` method, you have access to properties like: ``cumulative_hazard_``, ``plot``, ``survival_function_``, ``alpha_`` and ``beta_``. 
24 | A summary of the fit is available with the method 'print_summary()' 25 | 26 | Parameters 27 | ----------- 28 | alpha: float, optional (default=0.05) 29 | the level in the confidence intervals. 30 | 31 | Examples 32 | -------- 33 | 34 | >>> from lifelines import LogLogisticFitter 35 | >>> from lifelines.datasets import load_waltons 36 | >>> waltons = load_waltons() 37 | >>> llf = LogLogisticFitter() 38 | >>> llf.fit(waltons['T'], waltons['E']) 39 | >>> llf.plot() 40 | >>> print(llf.alpha_) 41 | 42 | Attributes 43 | ---------- 44 | cumulative_hazard_ : DataFrame 45 | The estimated cumulative hazard (with custom timeline if provided) 46 | confidence_interval_cumulative_hazard_ : DataFrame 47 | The lower and upper confidence intervals for the cumulative hazard 48 | hazard_ : DataFrame 49 | The estimated hazard (with custom timeline if provided) 50 | confidence_interval_hazard_ : DataFrame 51 | The lower and upper confidence intervals for the hazard 52 | survival_function_ : DataFrame 53 | The estimated survival function (with custom timeline if provided) 54 | confidence_interval_survival_function_ : DataFrame 55 | The lower and upper confidence intervals for the survival function 56 | cumumlative_density_ : DataFrame 57 | The estimated cumulative density function (with custom timeline if provided) 58 | confidence_interval_cumumlative_density_ : DataFrame 59 | The lower and upper confidence intervals for the cumulative density 60 | variance_matrix_ : numpy array 61 | The variance matrix of the coefficients 62 | median_: float 63 | The median time to event 64 | alpha_: float 65 | The fitted parameter in the model 66 | beta_: float 67 | The fitted parameter in the model 68 | durations: array 69 | The durations provided 70 | event_observed: array 71 | The event_observed variable provided 72 | timeline: array 73 | The time line to use for plotting and indexing 74 | entry: array or None 75 | The entry array provided, or None 76 | """ 77 | _fitted_parameter_names = ["alpha_", "beta_"] 78 | 79 | @property 80 | def median_(self): 81 | return self.alpha_ 82 | 83 | def _cumulative_hazard(self, params, times): 84 | alpha_, beta_ = params 85 | return np.log1p((times / alpha_) ** beta_) 86 | 87 | def _log_1m_sf(self, params, times): 88 | alpha_, beta_ = params 89 | return -np.log1p((times / alpha_) ** -beta_) 90 | -------------------------------------------------------------------------------- /lifelines/fitters/weibull_fitter.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | import autograd.numpy as np 3 | 4 | from lifelines.fitters import KnownModelParametericUnivariateFitter 5 | 6 | 7 | class WeibullFitter(KnownModelParametericUnivariateFitter): 8 | 9 | r""" 10 | 11 | This class implements a Weibull model for univariate data. The model has parameterized 12 | form: 13 | 14 | .. math:: S(t) = \exp\left(-\left(\frac{t}{\lambda}\right)^\rho\right), \lambda > 0, \rho > 0, 15 | 16 | which implies the cumulative hazard rate is 17 | 18 | .. math:: H(t) = \left(\frac{t}{\lambda}\right)^\rho, 19 | 20 | and the hazard rate is: 21 | 22 | .. math:: h(t) = \frac{\rho}{\lambda}\left(\frac{t}{\lambda}\right)^{\rho-1} 23 | 24 | After calling the `.fit` method, you have access to properties like: ``cumulative_hazard_``, ``survival_function_``, ``lambda_`` and ``rho_``. 25 | A summary of the fit is available with the method ``print_summary()``. 
26 | 27 | Parameters 28 | ----------- 29 | alpha: float, optional (default=0.05) 30 | the level in the confidence intervals. 31 | 32 | Important 33 | ---------- 34 | The parameterization of this model changed in lifelines 0.19.0. Previously, the cumulative hazard looked like 35 | :math:`(\lambda t)^\rho`. The parameterization is now the reciprocal of :math:`\lambda`. 36 | 37 | Examples 38 | -------- 39 | 40 | >>> from lifelines import WeibullFitter 41 | >>> from lifelines.datasets import load_waltons 42 | >>> waltons = load_waltons() 43 | >>> wbf = WeibullFitter() 44 | >>> wbf.fit(waltons['T'], waltons['E']) 45 | >>> wbf.plot() 46 | >>> print(wbf.lambda_) 47 | 48 | Attributes 49 | ---------- 50 | cumulative_hazard_ : DataFrame 51 | The estimated cumulative hazard (with custom timeline if provided) 52 | confidence_interval_cumulative_hazard_ : DataFrame 53 | The lower and upper confidence intervals for the cumulative hazard 54 | hazard_ : DataFrame 55 | The estimated hazard (with custom timeline if provided) 56 | confidence_interval_hazard_ : DataFrame 57 | The lower and upper confidence intervals for the hazard 58 | survival_function_ : DataFrame 59 | The estimated survival function (with custom timeline if provided) 60 | confidence_interval_survival_function_ : DataFrame 61 | The lower and upper confidence intervals for the survival function 62 | cumumlative_density_ : DataFrame 63 | The estimated cumulative density function (with custom timeline if provided) 64 | confidence_interval_cumumlative_density_ : DataFrame 65 | The lower and upper confidence intervals for the cumulative density 66 | variance_matrix_ : numpy array 67 | The variance matrix of the coefficients 68 | median_: float 69 | The median time to event 70 | lambda_: float 71 | The fitted parameter in the model 72 | rho_: float 73 | The fitted parameter in the model 74 | durations: array 75 | The durations provided 76 | event_observed: array 77 | The event_observed variable provided 78 | timeline: array 79 | The time line to use for plotting and indexing 80 | entry: array or None 81 | The entry array provided, or None 82 | """ 83 | 84 | _fitted_parameter_names = ["lambda_", "rho_"] 85 | 86 | def _cumulative_hazard(self, params, times): 87 | lambda_, rho_ = params 88 | return (times / lambda_) ** rho_ 89 | 90 | @property 91 | def median_(self): 92 | return self.lambda_ * (np.log(2) ** (1.0 / self.rho_)) 93 | -------------------------------------------------------------------------------- /lifelines/fitters/breslow_fleming_harrington_fitter.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | 3 | 4 | import numpy as np 5 | import pandas as pd 6 | 7 | from lifelines.fitters import UnivariateFitter 8 | from lifelines import NelsonAalenFitter 9 | from lifelines.utils import _to_array, coalesce, CensoringType 10 | 11 | 12 | class BreslowFlemingHarringtonFitter(UnivariateFitter): 13 | 14 | """ 15 | Class for fitting the Breslow-Fleming-Harrington estimate for the survival function. This estimator 16 | is a biased estimator of the survival function, but it is more stable when the population is small and 17 | there are too few early truncation times: it may happen that the number of patients at risk and 18 | the number of deaths are the same. 19 | 20 | Mathematically, the NAF estimator is the negative logarithm of the BFH estimator.
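Written out in the ``.. math::`` notation the other fitter docstrings use (a restatement of the sentence above; :math:`\hat{H}_{NA}` denotes the Nelson-Aalen cumulative hazard estimate and :math:`\hat{S}_{BFH}` the BFH survival estimate — symbols chosen here for illustration):

.. math:: \hat{S}_{BFH}(t) = \exp\left(-\hat{H}_{NA}(t)\right) \quad\Longleftrightarrow\quad \hat{H}_{NA}(t) = -\log \hat{S}_{BFH}(t)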
21 | 22 | BreslowFlemingHarringtonFitter(alpha=0.05) 23 | 24 | Parameters 25 | ---------- 26 | alpha: float, optional (default=0.05) 27 | The alpha value associated with the confidence intervals. 28 | 29 | """ 30 | 31 | def fit( 32 | self, 33 | durations, 34 | event_observed=None, 35 | timeline=None, 36 | entry=None, 37 | label="BFH_estimate", 38 | alpha=None, 39 | ci_labels=None, 40 | ): # pylint: disable=too-many-arguments 41 | """ 42 | Parameters 43 | ---------- 44 | durations: an array, or pd.Series, of length n 45 | duration subject was observed for 46 | timeline: 47 | return the best estimate at the values in timeline (positively increasing) 48 | event_observed: an array, or pd.Series, of length n 49 | True if the death was observed, False if the event was lost (right-censored). Defaults to all True if event_observed is None 50 | entry: an array, or pd.Series, of length n 51 | relative time when a subject entered the study. This is 52 | useful for left-truncated observations, i.e. the birth event was not observed. 53 | If None, defaults to all 0 (all birth events observed). 54 | label: string 55 | a string to name the column of the estimate. 56 | alpha: float, optional (default=0.05) 57 | the alpha value in the confidence intervals. Overrides the initializing 58 | alpha for this call to fit only. 59 | ci_labels: iterable 60 | add custom column names to the generated confidence intervals as a length-2 list: [<lower-bound name>, <upper-bound name>]. Default: