├── .gitignore ├── .gitmodules ├── .idea ├── .gitignore ├── clinical-longformer.iml ├── inspectionProfiles │ └── profiles_settings.xml ├── misc.xml ├── modules.xml └── vcs.xml ├── LICENSE ├── README.md ├── Written Submission.pdf ├── classifier_pipeline ├── README.md ├── __pycache__ │ ├── classifier.cpython-37.pyc │ ├── classifier.cpython-38.pyc │ ├── classifier_longformer.cpython-37.pyc │ ├── classifier_longformer.cpython-38.pyc │ ├── classifier_multilabel.cpython-37.pyc │ ├── classifier_one_label.cpython-37.pyc │ ├── classifier_one_label.cpython-38.pyc │ ├── tokenizer.cpython-37.pyc │ ├── tokenizer.cpython-38.pyc │ ├── utils.cpython-37.pyc │ └── utils.cpython-38.pyc ├── classifier_one_label.py ├── interact.py ├── requirements.txt ├── tokenizer.py ├── training_onelabel.py └── utils.py ├── classifier_pipeline_medNLI ├── __pycache__ │ ├── mednli_classifier.cpython-37.pyc │ ├── mednli_data_utils.cpython-37.pyc │ ├── tokenizer.cpython-37.pyc │ └── utils.cpython-37.pyc ├── experiments_mednli │ ├── allenai │ │ └── biomed_roberta_base │ │ │ ├── allen_confusion_matrix.npy │ │ │ ├── allen_confusion_mtx.png │ │ │ └── version_04-12-2020--13-10-52 │ │ │ ├── allenai_hparams.yaml │ │ │ ├── events.out.tfevents.1607087458.55d001092ee9.1345.0 │ │ │ └── trial.txt │ ├── bert-base-uncased │ │ ├── bert_confusion_matrix.npy │ │ └── bert_confusion_mtx.png │ ├── emilyalsentzer │ │ └── Bio_ClinicalBERT │ │ │ ├── emily_confusion_matrix.npy │ │ │ ├── emily_confusion_mtx.png │ │ │ └── version_04-12-2020--13-10-52 │ │ │ └── hparams.yaml │ └── simonlevine │ │ └── biomed_roberta_base-4096-speedfix │ │ ├── longformer_confusion_matrix.npy │ │ ├── longformer_confusion_mtx.png │ │ └── version_04-12-2020--13-28-13 │ │ └── hparams.yaml ├── mednli_classifier.py ├── mednli_data_utils.py ├── mednli_training.py ├── mnli_testing.ipynb ├── requirements.txt ├── tokenizer.py └── utils.py ├── data ├── .DS_Store ├── .gitignore ├── annotation_task_sample ├── mednli │ ├── LICENSE.txt │ ├── README.txt │ ├── SHA256SUMS.txt │ ├── mli_dev_v1.jsonl │ ├── mli_test_v1.jsonl │ └── mli_train_v1.jsonl └── physionet.org │ └── files │ └── mimiciii │ ├── .DS_Store │ └── 1.4 │ └── .DS_Store ├── experiments ├── allenai │ └── biomed_roberta_base │ │ └── version_11-11-2020--19-37-30 │ │ ├── events.out.tfevents.1605123452.nvidia-ngc-image-2-vm.9468.0 │ │ └── hparams.yaml ├── bert-base-uncased │ └── version_11-11-2020--16-50-04 │ │ ├── events.out.tfevents.1605113407.nvidia-ngc-image-2-vm.5935.0 │ │ └── hparams.yaml ├── emilyalsentzer │ └── Bio_ClinicalBERT │ │ └── version_11-11-2020--18-13-49 │ │ ├── events.out.tfevents.1605118432.nvidia-ngc-image-2-vm.7703.0 │ │ └── hparams.yaml └── simonlevine │ ├── .DS_Store │ └── bioclinical-roberta-long │ ├── CM_updated.npy │ ├── test_confusion_matrices.npy │ └── version_11-11-2020--23-49-14 │ ├── events.out.tfevents.1605138556.nvidia-ngc-image-2-vm.13914.0 │ └── hparams.yaml ├── longformer_gen ├── .DS_Store ├── convert_model_to_long.ipynb ├── prepare_notes_longformer_mlm.py ├── pretrain_roberta.py ├── pretrain_roberta_long.py └── roberta_to_longformer.py ├── medNLI ├── med_nli_classifier_lit.py ├── run_medMLI.sh ├── run_mednli_classify.py └── testing_for_med_nli.ipynb ├── papers ├── .DS_Store ├── 1-s2.0-S0169260719311745-main.pdf ├── 1908.10419v1.pdf ├── 2004.02288.pdf ├── 2005.08622.pdf ├── Deep_neural_network_for_hierarchical_ext.pdf ├── centerloss_WenECCV16.pdf └── sound_event_classification_using_ontology_based_neural_networks (1).pdf ├── params.yaml ├── phenotype_annotation ├── annot_classifier.py ├── interact.py ├── tokenizer.py └── training_onelabel.py ├── plots ├── .DS_Store ├── legend.png ├── testres.png ├── tloss.png ├── train_loss.png ├── train_loss.svg ├── train_loss_labeled.png ├── vacc.png ├── val_acc_weighted.png ├── val_acc_weighted.svg ├── val_loss.png ├── val_loss.svg ├── val_prec.png ├── val_prec.svg ├── valloss.png ├── valres.png ├── wacc.png └── wprec.png ├── preprocessing_pipeline ├── __pycache__ │ ├── format_data_for_training.cpython-37.pyc │ └── format_data_for_training.cpython-38.pyc ├── format_data_for_training.py ├── format_notes.py └── mimicxr2mimicivICD (1).ipynb ├── results.rtf └── shell ├── do_all_icd_tasks.sh ├── elongate_roberta.sh ├── format_mimic_for_ICD_classifier.sh ├── run_icd_classifier.sh └── split_data_and_run_mlm_training.sh /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/.gitignore -------------------------------------------------------------------------------- /.gitmodules: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/.gitmodules -------------------------------------------------------------------------------- /.idea/.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/.idea/.gitignore -------------------------------------------------------------------------------- /.idea/clinical-longformer.iml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/.idea/clinical-longformer.iml -------------------------------------------------------------------------------- /.idea/inspectionProfiles/profiles_settings.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/.idea/inspectionProfiles/profiles_settings.xml -------------------------------------------------------------------------------- /.idea/misc.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/.idea/misc.xml -------------------------------------------------------------------------------- /.idea/modules.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/.idea/modules.xml -------------------------------------------------------------------------------- /.idea/vcs.xml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/.idea/vcs.xml -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/README.md -------------------------------------------------------------------------------- /Written Submission.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/Written Submission.pdf -------------------------------------------------------------------------------- /classifier_pipeline/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline/README.md -------------------------------------------------------------------------------- /classifier_pipeline/__pycache__/classifier.cpython-37.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline/__pycache__/classifier.cpython-37.pyc -------------------------------------------------------------------------------- /classifier_pipeline/__pycache__/classifier.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline/__pycache__/classifier.cpython-38.pyc -------------------------------------------------------------------------------- /classifier_pipeline/__pycache__/classifier_longformer.cpython-37.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline/__pycache__/classifier_longformer.cpython-37.pyc -------------------------------------------------------------------------------- /classifier_pipeline/__pycache__/classifier_longformer.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline/__pycache__/classifier_longformer.cpython-38.pyc -------------------------------------------------------------------------------- /classifier_pipeline/__pycache__/classifier_multilabel.cpython-37.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline/__pycache__/classifier_multilabel.cpython-37.pyc -------------------------------------------------------------------------------- /classifier_pipeline/__pycache__/classifier_one_label.cpython-37.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline/__pycache__/classifier_one_label.cpython-37.pyc -------------------------------------------------------------------------------- /classifier_pipeline/__pycache__/classifier_one_label.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline/__pycache__/classifier_one_label.cpython-38.pyc -------------------------------------------------------------------------------- /classifier_pipeline/__pycache__/tokenizer.cpython-37.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline/__pycache__/tokenizer.cpython-37.pyc -------------------------------------------------------------------------------- /classifier_pipeline/__pycache__/tokenizer.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline/__pycache__/tokenizer.cpython-38.pyc -------------------------------------------------------------------------------- /classifier_pipeline/__pycache__/utils.cpython-37.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline/__pycache__/utils.cpython-37.pyc -------------------------------------------------------------------------------- /classifier_pipeline/__pycache__/utils.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline/__pycache__/utils.cpython-38.pyc -------------------------------------------------------------------------------- /classifier_pipeline/classifier_one_label.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline/classifier_one_label.py -------------------------------------------------------------------------------- /classifier_pipeline/interact.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline/interact.py -------------------------------------------------------------------------------- /classifier_pipeline/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline/requirements.txt -------------------------------------------------------------------------------- /classifier_pipeline/tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline/tokenizer.py -------------------------------------------------------------------------------- /classifier_pipeline/training_onelabel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline/training_onelabel.py -------------------------------------------------------------------------------- /classifier_pipeline/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline/utils.py -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/__pycache__/mednli_classifier.cpython-37.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline_medNLI/__pycache__/mednli_classifier.cpython-37.pyc -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/__pycache__/mednli_data_utils.cpython-37.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline_medNLI/__pycache__/mednli_data_utils.cpython-37.pyc -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/__pycache__/tokenizer.cpython-37.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline_medNLI/__pycache__/tokenizer.cpython-37.pyc -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/__pycache__/utils.cpython-37.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline_medNLI/__pycache__/utils.cpython-37.pyc -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/experiments_mednli/allenai/biomed_roberta_base/allen_confusion_matrix.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline_medNLI/experiments_mednli/allenai/biomed_roberta_base/allen_confusion_matrix.npy -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/experiments_mednli/allenai/biomed_roberta_base/allen_confusion_mtx.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline_medNLI/experiments_mednli/allenai/biomed_roberta_base/allen_confusion_mtx.png -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/experiments_mednli/allenai/biomed_roberta_base/version_04-12-2020--13-10-52/allenai_hparams.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline_medNLI/experiments_mednli/allenai/biomed_roberta_base/version_04-12-2020--13-10-52/allenai_hparams.yaml -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/experiments_mednli/allenai/biomed_roberta_base/version_04-12-2020--13-10-52/events.out.tfevents.1607087458.55d001092ee9.1345.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline_medNLI/experiments_mednli/allenai/biomed_roberta_base/version_04-12-2020--13-10-52/events.out.tfevents.1607087458.55d001092ee9.1345.0 -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/experiments_mednli/allenai/biomed_roberta_base/version_04-12-2020--13-10-52/trial.txt: -------------------------------------------------------------------------------- 1 | blah 2 | -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/experiments_mednli/bert-base-uncased/bert_confusion_matrix.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline_medNLI/experiments_mednli/bert-base-uncased/bert_confusion_matrix.npy -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/experiments_mednli/bert-base-uncased/bert_confusion_mtx.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline_medNLI/experiments_mednli/bert-base-uncased/bert_confusion_mtx.png -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/experiments_mednli/emilyalsentzer/Bio_ClinicalBERT/emily_confusion_matrix.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline_medNLI/experiments_mednli/emilyalsentzer/Bio_ClinicalBERT/emily_confusion_matrix.npy -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/experiments_mednli/emilyalsentzer/Bio_ClinicalBERT/emily_confusion_mtx.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline_medNLI/experiments_mednli/emilyalsentzer/Bio_ClinicalBERT/emily_confusion_mtx.png -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/experiments_mednli/emilyalsentzer/Bio_ClinicalBERT/version_04-12-2020--13-10-52/hparams.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline_medNLI/experiments_mednli/emilyalsentzer/Bio_ClinicalBERT/version_04-12-2020--13-10-52/hparams.yaml -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/experiments_mednli/simonlevine/biomed_roberta_base-4096-speedfix/longformer_confusion_matrix.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline_medNLI/experiments_mednli/simonlevine/biomed_roberta_base-4096-speedfix/longformer_confusion_matrix.npy -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/experiments_mednli/simonlevine/biomed_roberta_base-4096-speedfix/longformer_confusion_mtx.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline_medNLI/experiments_mednli/simonlevine/biomed_roberta_base-4096-speedfix/longformer_confusion_mtx.png -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/experiments_mednli/simonlevine/biomed_roberta_base-4096-speedfix/version_04-12-2020--13-28-13/hparams.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline_medNLI/experiments_mednli/simonlevine/biomed_roberta_base-4096-speedfix/version_04-12-2020--13-28-13/hparams.yaml -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/mednli_classifier.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline_medNLI/mednli_classifier.py -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/mednli_data_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline_medNLI/mednli_data_utils.py -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/mednli_training.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline_medNLI/mednli_training.py -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/mnli_testing.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline_medNLI/mnli_testing.ipynb -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline_medNLI/requirements.txt -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline_medNLI/tokenizer.py -------------------------------------------------------------------------------- /classifier_pipeline_medNLI/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/classifier_pipeline_medNLI/utils.py -------------------------------------------------------------------------------- /data/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/data/.DS_Store -------------------------------------------------------------------------------- /data/.gitignore: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /data/annotation_task_sample: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/data/annotation_task_sample -------------------------------------------------------------------------------- /data/mednli/LICENSE.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/data/mednli/LICENSE.txt -------------------------------------------------------------------------------- /data/mednli/README.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/data/mednli/README.txt -------------------------------------------------------------------------------- /data/mednli/SHA256SUMS.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/data/mednli/SHA256SUMS.txt -------------------------------------------------------------------------------- /data/mednli/mli_dev_v1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/data/mednli/mli_dev_v1.jsonl -------------------------------------------------------------------------------- /data/mednli/mli_test_v1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/data/mednli/mli_test_v1.jsonl -------------------------------------------------------------------------------- /data/mednli/mli_train_v1.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/data/mednli/mli_train_v1.jsonl -------------------------------------------------------------------------------- /data/physionet.org/files/mimiciii/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/data/physionet.org/files/mimiciii/.DS_Store -------------------------------------------------------------------------------- /data/physionet.org/files/mimiciii/1.4/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/data/physionet.org/files/mimiciii/1.4/.DS_Store -------------------------------------------------------------------------------- /experiments/allenai/biomed_roberta_base/version_11-11-2020--19-37-30/events.out.tfevents.1605123452.nvidia-ngc-image-2-vm.9468.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/experiments/allenai/biomed_roberta_base/version_11-11-2020--19-37-30/events.out.tfevents.1605123452.nvidia-ngc-image-2-vm.9468.0 -------------------------------------------------------------------------------- /experiments/allenai/biomed_roberta_base/version_11-11-2020--19-37-30/hparams.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/experiments/allenai/biomed_roberta_base/version_11-11-2020--19-37-30/hparams.yaml -------------------------------------------------------------------------------- /experiments/bert-base-uncased/version_11-11-2020--16-50-04/events.out.tfevents.1605113407.nvidia-ngc-image-2-vm.5935.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/experiments/bert-base-uncased/version_11-11-2020--16-50-04/events.out.tfevents.1605113407.nvidia-ngc-image-2-vm.5935.0 -------------------------------------------------------------------------------- /experiments/bert-base-uncased/version_11-11-2020--16-50-04/hparams.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/experiments/bert-base-uncased/version_11-11-2020--16-50-04/hparams.yaml -------------------------------------------------------------------------------- /experiments/emilyalsentzer/Bio_ClinicalBERT/version_11-11-2020--18-13-49/events.out.tfevents.1605118432.nvidia-ngc-image-2-vm.7703.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/experiments/emilyalsentzer/Bio_ClinicalBERT/version_11-11-2020--18-13-49/events.out.tfevents.1605118432.nvidia-ngc-image-2-vm.7703.0 -------------------------------------------------------------------------------- /experiments/emilyalsentzer/Bio_ClinicalBERT/version_11-11-2020--18-13-49/hparams.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/experiments/emilyalsentzer/Bio_ClinicalBERT/version_11-11-2020--18-13-49/hparams.yaml -------------------------------------------------------------------------------- /experiments/simonlevine/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/experiments/simonlevine/.DS_Store -------------------------------------------------------------------------------- /experiments/simonlevine/bioclinical-roberta-long/CM_updated.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/experiments/simonlevine/bioclinical-roberta-long/CM_updated.npy -------------------------------------------------------------------------------- /experiments/simonlevine/bioclinical-roberta-long/test_confusion_matrices.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/experiments/simonlevine/bioclinical-roberta-long/test_confusion_matrices.npy -------------------------------------------------------------------------------- /experiments/simonlevine/bioclinical-roberta-long/version_11-11-2020--23-49-14/events.out.tfevents.1605138556.nvidia-ngc-image-2-vm.13914.0: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/experiments/simonlevine/bioclinical-roberta-long/version_11-11-2020--23-49-14/events.out.tfevents.1605138556.nvidia-ngc-image-2-vm.13914.0 -------------------------------------------------------------------------------- /experiments/simonlevine/bioclinical-roberta-long/version_11-11-2020--23-49-14/hparams.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/experiments/simonlevine/bioclinical-roberta-long/version_11-11-2020--23-49-14/hparams.yaml -------------------------------------------------------------------------------- /longformer_gen/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/longformer_gen/.DS_Store -------------------------------------------------------------------------------- /longformer_gen/convert_model_to_long.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/longformer_gen/convert_model_to_long.ipynb -------------------------------------------------------------------------------- /longformer_gen/prepare_notes_longformer_mlm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/longformer_gen/prepare_notes_longformer_mlm.py -------------------------------------------------------------------------------- /longformer_gen/pretrain_roberta.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/longformer_gen/pretrain_roberta.py -------------------------------------------------------------------------------- /longformer_gen/pretrain_roberta_long.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/longformer_gen/pretrain_roberta_long.py -------------------------------------------------------------------------------- /longformer_gen/roberta_to_longformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/longformer_gen/roberta_to_longformer.py -------------------------------------------------------------------------------- /medNLI/med_nli_classifier_lit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/medNLI/med_nli_classifier_lit.py -------------------------------------------------------------------------------- /medNLI/run_medMLI.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/medNLI/run_medMLI.sh -------------------------------------------------------------------------------- /medNLI/run_mednli_classify.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/medNLI/run_mednli_classify.py -------------------------------------------------------------------------------- /medNLI/testing_for_med_nli.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/medNLI/testing_for_med_nli.ipynb -------------------------------------------------------------------------------- /papers/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/papers/.DS_Store -------------------------------------------------------------------------------- /papers/1-s2.0-S0169260719311745-main.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/papers/1-s2.0-S0169260719311745-main.pdf -------------------------------------------------------------------------------- /papers/1908.10419v1.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/papers/1908.10419v1.pdf -------------------------------------------------------------------------------- /papers/2004.02288.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/papers/2004.02288.pdf -------------------------------------------------------------------------------- /papers/2005.08622.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/papers/2005.08622.pdf -------------------------------------------------------------------------------- /papers/Deep_neural_network_for_hierarchical_ext.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/papers/Deep_neural_network_for_hierarchical_ext.pdf -------------------------------------------------------------------------------- /papers/centerloss_WenECCV16.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/papers/centerloss_WenECCV16.pdf -------------------------------------------------------------------------------- /papers/sound_event_classification_using_ontology_based_neural_networks (1).pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/papers/sound_event_classification_using_ontology_based_neural_networks (1).pdf -------------------------------------------------------------------------------- /params.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/params.yaml -------------------------------------------------------------------------------- /phenotype_annotation/annot_classifier.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/phenotype_annotation/annot_classifier.py -------------------------------------------------------------------------------- /phenotype_annotation/interact.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/phenotype_annotation/interact.py -------------------------------------------------------------------------------- /phenotype_annotation/tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/phenotype_annotation/tokenizer.py -------------------------------------------------------------------------------- /phenotype_annotation/training_onelabel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/phenotype_annotation/training_onelabel.py -------------------------------------------------------------------------------- /plots/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/plots/.DS_Store -------------------------------------------------------------------------------- /plots/legend.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/plots/legend.png -------------------------------------------------------------------------------- /plots/testres.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/plots/testres.png -------------------------------------------------------------------------------- /plots/tloss.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/plots/tloss.png -------------------------------------------------------------------------------- /plots/train_loss.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/plots/train_loss.png -------------------------------------------------------------------------------- /plots/train_loss.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/plots/train_loss.svg -------------------------------------------------------------------------------- /plots/train_loss_labeled.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/plots/train_loss_labeled.png -------------------------------------------------------------------------------- /plots/vacc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/plots/vacc.png -------------------------------------------------------------------------------- /plots/val_acc_weighted.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/plots/val_acc_weighted.png -------------------------------------------------------------------------------- /plots/val_acc_weighted.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/plots/val_acc_weighted.svg -------------------------------------------------------------------------------- /plots/val_loss.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/plots/val_loss.png -------------------------------------------------------------------------------- /plots/val_loss.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/plots/val_loss.svg -------------------------------------------------------------------------------- /plots/val_prec.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/plots/val_prec.png -------------------------------------------------------------------------------- /plots/val_prec.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/plots/val_prec.svg -------------------------------------------------------------------------------- /plots/valloss.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/plots/valloss.png -------------------------------------------------------------------------------- /plots/valres.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/plots/valres.png -------------------------------------------------------------------------------- /plots/wacc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/plots/wacc.png -------------------------------------------------------------------------------- /plots/wprec.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/plots/wprec.png -------------------------------------------------------------------------------- /preprocessing_pipeline/__pycache__/format_data_for_training.cpython-37.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/preprocessing_pipeline/__pycache__/format_data_for_training.cpython-37.pyc -------------------------------------------------------------------------------- /preprocessing_pipeline/__pycache__/format_data_for_training.cpython-38.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/preprocessing_pipeline/__pycache__/format_data_for_training.cpython-38.pyc -------------------------------------------------------------------------------- /preprocessing_pipeline/format_data_for_training.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/preprocessing_pipeline/format_data_for_training.py -------------------------------------------------------------------------------- /preprocessing_pipeline/format_notes.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/preprocessing_pipeline/format_notes.py -------------------------------------------------------------------------------- /preprocessing_pipeline/mimicxr2mimicivICD (1).ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/preprocessing_pipeline/mimicxr2mimicivICD (1).ipynb -------------------------------------------------------------------------------- /results.rtf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/results.rtf -------------------------------------------------------------------------------- /shell/do_all_icd_tasks.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/shell/do_all_icd_tasks.sh -------------------------------------------------------------------------------- /shell/elongate_roberta.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/shell/elongate_roberta.sh -------------------------------------------------------------------------------- /shell/format_mimic_for_ICD_classifier.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/shell/format_mimic_for_ICD_classifier.sh -------------------------------------------------------------------------------- /shell/run_icd_classifier.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/shell/run_icd_classifier.sh -------------------------------------------------------------------------------- /shell/split_data_and_run_mlm_training.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/simonlevine/clinical-longformer/HEAD/shell/split_data_and_run_mlm_training.sh --------------------------------------------------------------------------------