├── .gitignore ├── README.md ├── data ├── processed │ ├── hetionet-relations.tsv │ ├── hetionet.tsv │ ├── msi-relations.tsv │ ├── msi.tsv │ └── repodb.tsv └── script │ ├── hetionet │ └── preprocess_hetionet.py │ ├── msi │ ├── authentication.py │ ├── get_descriptions_msi.py │ ├── preprocess_msi.py │ └── umls.py │ └── repodb │ ├── authentication.py │ ├── get_descriptions.py │ └── umls.py ├── environment.yml ├── script ├── compute_entity_encodings.py ├── compute_kge_scores.py ├── create_hetionet_dataset.py ├── create_msi_dataset.py ├── create_repodb_dataset.py ├── dataset_utils.py ├── evaluate_adaptive_weighting.py ├── evaluate_router.py ├── features.py ├── kge_util.py ├── preprocess.py ├── pretokenize.py ├── summarize_adaptive_weighting_results.py ├── summarize_ensemble_results.py ├── summarize_kge_results.py └── training │ ├── hetionet │ ├── adaptive_weighting_ensemble_grid.py │ ├── adaptive_weighting_ensemble_grid.sbatch │ ├── dkrl_grid.py │ ├── dkrl_grid.sbatch │ ├── kge_grid.py │ ├── kge_grid.sbatch │ ├── multitask_kgbert_grid.py │ ├── multitask_kgbert_grid.sbatch │ ├── multitask_kgbert_ind_grid.py │ ├── multitask_kgbert_ind_grid.sbatch │ ├── router_ensemble_grid.py │ ├── router_ensemble_grid.sbatch │ ├── router_ensemble_multi_grid.py │ └── router_ensemble_multi_grid.sbatch │ ├── msi │ ├── adaptive_weighting_ensemble_grid.py │ ├── adaptive_weighting_ensemble_grid.sbatch │ ├── dkrl_grid.py │ ├── dkrl_grid.sbatch │ ├── kge_grid.py │ ├── kge_grid.sbatch │ ├── kge_ind_grid.py │ ├── kge_ind_grid.sbatch │ ├── multitask_kgbert_grid.py │ ├── multitask_kgbert_grid.sbatch │ ├── router_ensemble_grid.py │ ├── router_ensemble_grid.sbatch │ ├── router_ensemble_multi_grid.py │ └── router_ensemble_multi_grid.sbatch │ └── repodb │ ├── adaptive_weighting_ensemble_grid.py │ ├── adaptive_weighting_ensemble_grid.sbatch │ ├── blpcrossencoder_grid.py │ ├── blpcrossencoder_grid.sbatch │ ├── dkrl_grid.py │ ├── dkrl_grid.sbatch │ ├── joint_blpx_complex_grid.py │ ├── joint_blpx_complex_grid.sbatch │ ├── kge_grid.py │ ├── kge_grid.sbatch │ ├── multitask_kgbert_grid.py │ ├── multitask_kgbert_grid.sbatch │ ├── multitask_kgbert_with_kge_inputs_grid.py │ ├── multitask_kgbert_with_kge_inputs_grid.sbatch │ ├── router_ensemble_grid.py │ ├── router_ensemble_grid.sbatch │ ├── router_ensemble_multi_grid.py │ └── router_ensemble_multi_grid.sbatch ├── src ├── kge │ ├── dataloader.py │ ├── model.py │ ├── preprocess.py │ └── run.py └── lm │ ├── dataloader.py │ ├── evaluate.py │ ├── model.py │ ├── preprocess.py │ ├── run.py │ └── util.py └── subgraph └── README.md /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/.gitignore -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/README.md -------------------------------------------------------------------------------- /data/processed/hetionet-relations.tsv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/data/processed/hetionet-relations.tsv -------------------------------------------------------------------------------- /data/processed/hetionet.tsv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/data/processed/hetionet.tsv -------------------------------------------------------------------------------- /data/processed/msi-relations.tsv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/data/processed/msi-relations.tsv -------------------------------------------------------------------------------- /data/processed/msi.tsv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/data/processed/msi.tsv -------------------------------------------------------------------------------- /data/processed/repodb.tsv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/data/processed/repodb.tsv -------------------------------------------------------------------------------- /data/script/hetionet/preprocess_hetionet.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/data/script/hetionet/preprocess_hetionet.py -------------------------------------------------------------------------------- /data/script/msi/authentication.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/data/script/msi/authentication.py -------------------------------------------------------------------------------- /data/script/msi/get_descriptions_msi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/data/script/msi/get_descriptions_msi.py -------------------------------------------------------------------------------- /data/script/msi/preprocess_msi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/data/script/msi/preprocess_msi.py -------------------------------------------------------------------------------- /data/script/msi/umls.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/data/script/msi/umls.py -------------------------------------------------------------------------------- /data/script/repodb/authentication.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/data/script/repodb/authentication.py -------------------------------------------------------------------------------- /data/script/repodb/get_descriptions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/data/script/repodb/get_descriptions.py -------------------------------------------------------------------------------- /data/script/repodb/umls.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/data/script/repodb/umls.py -------------------------------------------------------------------------------- /environment.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/environment.yml -------------------------------------------------------------------------------- /script/compute_entity_encodings.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/compute_entity_encodings.py -------------------------------------------------------------------------------- /script/compute_kge_scores.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/compute_kge_scores.py -------------------------------------------------------------------------------- /script/create_hetionet_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/create_hetionet_dataset.py -------------------------------------------------------------------------------- /script/create_msi_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/create_msi_dataset.py -------------------------------------------------------------------------------- /script/create_repodb_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/create_repodb_dataset.py -------------------------------------------------------------------------------- /script/dataset_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/dataset_utils.py -------------------------------------------------------------------------------- /script/evaluate_adaptive_weighting.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/evaluate_adaptive_weighting.py -------------------------------------------------------------------------------- /script/evaluate_router.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/evaluate_router.py -------------------------------------------------------------------------------- /script/features.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/features.py -------------------------------------------------------------------------------- /script/kge_util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/kge_util.py -------------------------------------------------------------------------------- /script/preprocess.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/preprocess.py -------------------------------------------------------------------------------- /script/pretokenize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/pretokenize.py -------------------------------------------------------------------------------- /script/summarize_adaptive_weighting_results.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/summarize_adaptive_weighting_results.py -------------------------------------------------------------------------------- /script/summarize_ensemble_results.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/summarize_ensemble_results.py -------------------------------------------------------------------------------- /script/summarize_kge_results.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/summarize_kge_results.py -------------------------------------------------------------------------------- /script/training/hetionet/adaptive_weighting_ensemble_grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/hetionet/adaptive_weighting_ensemble_grid.py -------------------------------------------------------------------------------- /script/training/hetionet/adaptive_weighting_ensemble_grid.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/hetionet/adaptive_weighting_ensemble_grid.sbatch -------------------------------------------------------------------------------- /script/training/hetionet/dkrl_grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/hetionet/dkrl_grid.py -------------------------------------------------------------------------------- /script/training/hetionet/dkrl_grid.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/hetionet/dkrl_grid.sbatch -------------------------------------------------------------------------------- /script/training/hetionet/kge_grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/hetionet/kge_grid.py -------------------------------------------------------------------------------- /script/training/hetionet/kge_grid.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/hetionet/kge_grid.sbatch -------------------------------------------------------------------------------- /script/training/hetionet/multitask_kgbert_grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/hetionet/multitask_kgbert_grid.py -------------------------------------------------------------------------------- /script/training/hetionet/multitask_kgbert_grid.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/hetionet/multitask_kgbert_grid.sbatch -------------------------------------------------------------------------------- /script/training/hetionet/multitask_kgbert_ind_grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/hetionet/multitask_kgbert_ind_grid.py -------------------------------------------------------------------------------- /script/training/hetionet/multitask_kgbert_ind_grid.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/hetionet/multitask_kgbert_ind_grid.sbatch -------------------------------------------------------------------------------- /script/training/hetionet/router_ensemble_grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/hetionet/router_ensemble_grid.py -------------------------------------------------------------------------------- /script/training/hetionet/router_ensemble_grid.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/hetionet/router_ensemble_grid.sbatch -------------------------------------------------------------------------------- /script/training/hetionet/router_ensemble_multi_grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/hetionet/router_ensemble_multi_grid.py -------------------------------------------------------------------------------- /script/training/hetionet/router_ensemble_multi_grid.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/hetionet/router_ensemble_multi_grid.sbatch -------------------------------------------------------------------------------- /script/training/msi/adaptive_weighting_ensemble_grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/msi/adaptive_weighting_ensemble_grid.py -------------------------------------------------------------------------------- /script/training/msi/adaptive_weighting_ensemble_grid.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/msi/adaptive_weighting_ensemble_grid.sbatch -------------------------------------------------------------------------------- /script/training/msi/dkrl_grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/msi/dkrl_grid.py -------------------------------------------------------------------------------- /script/training/msi/dkrl_grid.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/msi/dkrl_grid.sbatch -------------------------------------------------------------------------------- /script/training/msi/kge_grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/msi/kge_grid.py -------------------------------------------------------------------------------- /script/training/msi/kge_grid.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/msi/kge_grid.sbatch -------------------------------------------------------------------------------- /script/training/msi/kge_ind_grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/msi/kge_ind_grid.py -------------------------------------------------------------------------------- /script/training/msi/kge_ind_grid.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/msi/kge_ind_grid.sbatch -------------------------------------------------------------------------------- /script/training/msi/multitask_kgbert_grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/msi/multitask_kgbert_grid.py -------------------------------------------------------------------------------- /script/training/msi/multitask_kgbert_grid.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/msi/multitask_kgbert_grid.sbatch -------------------------------------------------------------------------------- /script/training/msi/router_ensemble_grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/msi/router_ensemble_grid.py -------------------------------------------------------------------------------- /script/training/msi/router_ensemble_grid.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/msi/router_ensemble_grid.sbatch -------------------------------------------------------------------------------- /script/training/msi/router_ensemble_multi_grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/msi/router_ensemble_multi_grid.py -------------------------------------------------------------------------------- /script/training/msi/router_ensemble_multi_grid.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/msi/router_ensemble_multi_grid.sbatch -------------------------------------------------------------------------------- /script/training/repodb/adaptive_weighting_ensemble_grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/repodb/adaptive_weighting_ensemble_grid.py -------------------------------------------------------------------------------- /script/training/repodb/adaptive_weighting_ensemble_grid.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/repodb/adaptive_weighting_ensemble_grid.sbatch -------------------------------------------------------------------------------- /script/training/repodb/blpcrossencoder_grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/repodb/blpcrossencoder_grid.py -------------------------------------------------------------------------------- /script/training/repodb/blpcrossencoder_grid.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/repodb/blpcrossencoder_grid.sbatch -------------------------------------------------------------------------------- /script/training/repodb/dkrl_grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/repodb/dkrl_grid.py -------------------------------------------------------------------------------- /script/training/repodb/dkrl_grid.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/repodb/dkrl_grid.sbatch -------------------------------------------------------------------------------- /script/training/repodb/joint_blpx_complex_grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/repodb/joint_blpx_complex_grid.py -------------------------------------------------------------------------------- /script/training/repodb/joint_blpx_complex_grid.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/repodb/joint_blpx_complex_grid.sbatch -------------------------------------------------------------------------------- /script/training/repodb/kge_grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/repodb/kge_grid.py -------------------------------------------------------------------------------- /script/training/repodb/kge_grid.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/repodb/kge_grid.sbatch -------------------------------------------------------------------------------- /script/training/repodb/multitask_kgbert_grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/repodb/multitask_kgbert_grid.py -------------------------------------------------------------------------------- /script/training/repodb/multitask_kgbert_grid.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/repodb/multitask_kgbert_grid.sbatch -------------------------------------------------------------------------------- /script/training/repodb/multitask_kgbert_with_kge_inputs_grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/repodb/multitask_kgbert_with_kge_inputs_grid.py -------------------------------------------------------------------------------- /script/training/repodb/multitask_kgbert_with_kge_inputs_grid.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/repodb/multitask_kgbert_with_kge_inputs_grid.sbatch -------------------------------------------------------------------------------- /script/training/repodb/router_ensemble_grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/repodb/router_ensemble_grid.py -------------------------------------------------------------------------------- /script/training/repodb/router_ensemble_grid.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/repodb/router_ensemble_grid.sbatch -------------------------------------------------------------------------------- /script/training/repodb/router_ensemble_multi_grid.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/repodb/router_ensemble_multi_grid.py -------------------------------------------------------------------------------- /script/training/repodb/router_ensemble_multi_grid.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/script/training/repodb/router_ensemble_multi_grid.sbatch -------------------------------------------------------------------------------- /src/kge/dataloader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/src/kge/dataloader.py -------------------------------------------------------------------------------- /src/kge/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/src/kge/model.py -------------------------------------------------------------------------------- /src/kge/preprocess.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/src/kge/preprocess.py -------------------------------------------------------------------------------- /src/kge/run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/src/kge/run.py -------------------------------------------------------------------------------- /src/lm/dataloader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/src/lm/dataloader.py -------------------------------------------------------------------------------- /src/lm/evaluate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/src/lm/evaluate.py -------------------------------------------------------------------------------- /src/lm/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/src/lm/model.py -------------------------------------------------------------------------------- /src/lm/preprocess.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/src/lm/preprocess.py -------------------------------------------------------------------------------- /src/lm/run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/src/lm/run.py -------------------------------------------------------------------------------- /src/lm/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/src/lm/util.py -------------------------------------------------------------------------------- /subgraph/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rahuln/lm-bio-kgc/HEAD/subgraph/README.md --------------------------------------------------------------------------------