├── .gitignore ├── LICENSE ├── README.md ├── docker ├── Dockerfile-megatron ├── Dockerfile-nemo ├── nemo.def └── readme.md ├── finetuning ├── mnli │ ├── run_mednli_345m.sh │ ├── run_mednli_4b.sh │ └── run_mednli_8b.sh ├── nemo_ner │ ├── conlleval │ │ ├── LICENSE │ │ ├── README.md │ │ └── conlleval.py │ ├── generate_conll_compatible_eval.py │ ├── nemo2bio.py │ ├── ner_expr.py │ ├── ner_expr_ddp.py │ ├── new_bio_eval.py │ └── shell │ │ ├── i2b22010_uf_full_9b.sh │ │ ├── i2b22010_uf_full_9b.yaml │ │ ├── i2b22012_9B.sh │ │ ├── i2b22012_9B.yaml │ │ ├── n2c2_9B.sh │ │ └── n2c2_9B.yaml ├── qa │ ├── evaluate-squad-v2.0.py │ ├── evaluate-v1.1.py │ ├── qa.py │ ├── qa_ddp.py │ ├── qa_test.py │ └── slurm │ │ ├── emrqa_9b_med.sh │ │ ├── emrqa_9b_med.yaml │ │ ├── emrqa_9b_rel.sh │ │ └── emrqa_9b_rel.yaml ├── re │ ├── brat_eval_res.py │ ├── measure_perf.py │ ├── re_ddp.py │ ├── relation_extraction.py │ └── slurm │ │ ├── n2c2_9b.sh │ │ └── n2c2_9b.yaml └── sts │ ├── slurm │ ├── sts_9b.sh │ └── sts_9b.yaml │ └── sts.py ├── pretraining ├── preprocessing │ ├── csv2json_batch.sh │ ├── gatortron_process_data.py │ ├── json2data.sh │ ├── merge_bin.sh │ └── merge_megatron_preprocessing_bin_files.py ├── pretraining │ ├── helper.sh │ └── launch.sh └── train_vocab │ ├── bert_vocab_head.txt │ ├── train_vocab.py │ ├── train_vocab_docker.sh │ └── train_vocab_singularity.sh └── resources └── gatorTron_workflow.png /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/README.md -------------------------------------------------------------------------------- /docker/Dockerfile-megatron: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/docker/Dockerfile-megatron -------------------------------------------------------------------------------- /docker/Dockerfile-nemo: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/docker/Dockerfile-nemo -------------------------------------------------------------------------------- /docker/nemo.def: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/docker/nemo.def -------------------------------------------------------------------------------- /docker/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/docker/readme.md -------------------------------------------------------------------------------- /finetuning/mnli/run_mednli_345m.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/mnli/run_mednli_345m.sh -------------------------------------------------------------------------------- /finetuning/mnli/run_mednli_4b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/mnli/run_mednli_4b.sh -------------------------------------------------------------------------------- /finetuning/mnli/run_mednli_8b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/mnli/run_mednli_8b.sh -------------------------------------------------------------------------------- /finetuning/nemo_ner/conlleval/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/nemo_ner/conlleval/LICENSE -------------------------------------------------------------------------------- /finetuning/nemo_ner/conlleval/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/nemo_ner/conlleval/README.md -------------------------------------------------------------------------------- /finetuning/nemo_ner/conlleval/conlleval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/nemo_ner/conlleval/conlleval.py -------------------------------------------------------------------------------- /finetuning/nemo_ner/generate_conll_compatible_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/nemo_ner/generate_conll_compatible_eval.py -------------------------------------------------------------------------------- /finetuning/nemo_ner/nemo2bio.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/nemo_ner/nemo2bio.py -------------------------------------------------------------------------------- /finetuning/nemo_ner/ner_expr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/nemo_ner/ner_expr.py -------------------------------------------------------------------------------- /finetuning/nemo_ner/ner_expr_ddp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/nemo_ner/ner_expr_ddp.py -------------------------------------------------------------------------------- /finetuning/nemo_ner/new_bio_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/nemo_ner/new_bio_eval.py -------------------------------------------------------------------------------- /finetuning/nemo_ner/shell/i2b22010_uf_full_9b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/nemo_ner/shell/i2b22010_uf_full_9b.sh -------------------------------------------------------------------------------- /finetuning/nemo_ner/shell/i2b22010_uf_full_9b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/nemo_ner/shell/i2b22010_uf_full_9b.yaml -------------------------------------------------------------------------------- /finetuning/nemo_ner/shell/i2b22012_9B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/nemo_ner/shell/i2b22012_9B.sh -------------------------------------------------------------------------------- /finetuning/nemo_ner/shell/i2b22012_9B.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/nemo_ner/shell/i2b22012_9B.yaml -------------------------------------------------------------------------------- /finetuning/nemo_ner/shell/n2c2_9B.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/nemo_ner/shell/n2c2_9B.sh -------------------------------------------------------------------------------- /finetuning/nemo_ner/shell/n2c2_9B.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/nemo_ner/shell/n2c2_9B.yaml -------------------------------------------------------------------------------- /finetuning/qa/evaluate-squad-v2.0.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/qa/evaluate-squad-v2.0.py -------------------------------------------------------------------------------- /finetuning/qa/evaluate-v1.1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/qa/evaluate-v1.1.py -------------------------------------------------------------------------------- /finetuning/qa/qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/qa/qa.py -------------------------------------------------------------------------------- /finetuning/qa/qa_ddp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/qa/qa_ddp.py -------------------------------------------------------------------------------- /finetuning/qa/qa_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/qa/qa_test.py -------------------------------------------------------------------------------- /finetuning/qa/slurm/emrqa_9b_med.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/qa/slurm/emrqa_9b_med.sh -------------------------------------------------------------------------------- /finetuning/qa/slurm/emrqa_9b_med.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/qa/slurm/emrqa_9b_med.yaml -------------------------------------------------------------------------------- /finetuning/qa/slurm/emrqa_9b_rel.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/qa/slurm/emrqa_9b_rel.sh -------------------------------------------------------------------------------- /finetuning/qa/slurm/emrqa_9b_rel.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/qa/slurm/emrqa_9b_rel.yaml -------------------------------------------------------------------------------- /finetuning/re/brat_eval_res.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/re/brat_eval_res.py -------------------------------------------------------------------------------- /finetuning/re/measure_perf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/re/measure_perf.py -------------------------------------------------------------------------------- /finetuning/re/re_ddp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/re/re_ddp.py -------------------------------------------------------------------------------- /finetuning/re/relation_extraction.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/re/relation_extraction.py -------------------------------------------------------------------------------- /finetuning/re/slurm/n2c2_9b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/re/slurm/n2c2_9b.sh -------------------------------------------------------------------------------- /finetuning/re/slurm/n2c2_9b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/re/slurm/n2c2_9b.yaml -------------------------------------------------------------------------------- /finetuning/sts/slurm/sts_9b.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/sts/slurm/sts_9b.sh -------------------------------------------------------------------------------- /finetuning/sts/slurm/sts_9b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/sts/slurm/sts_9b.yaml -------------------------------------------------------------------------------- /finetuning/sts/sts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/finetuning/sts/sts.py -------------------------------------------------------------------------------- /pretraining/preprocessing/csv2json_batch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/pretraining/preprocessing/csv2json_batch.sh -------------------------------------------------------------------------------- /pretraining/preprocessing/gatortron_process_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/pretraining/preprocessing/gatortron_process_data.py -------------------------------------------------------------------------------- /pretraining/preprocessing/json2data.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/pretraining/preprocessing/json2data.sh -------------------------------------------------------------------------------- /pretraining/preprocessing/merge_bin.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/pretraining/preprocessing/merge_bin.sh -------------------------------------------------------------------------------- /pretraining/preprocessing/merge_megatron_preprocessing_bin_files.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/pretraining/preprocessing/merge_megatron_preprocessing_bin_files.py -------------------------------------------------------------------------------- /pretraining/pretraining/helper.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/pretraining/pretraining/helper.sh -------------------------------------------------------------------------------- /pretraining/pretraining/launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/pretraining/pretraining/launch.sh -------------------------------------------------------------------------------- /pretraining/train_vocab/bert_vocab_head.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/pretraining/train_vocab/bert_vocab_head.txt -------------------------------------------------------------------------------- /pretraining/train_vocab/train_vocab.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/pretraining/train_vocab/train_vocab.py -------------------------------------------------------------------------------- /pretraining/train_vocab/train_vocab_docker.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/pretraining/train_vocab/train_vocab_docker.sh -------------------------------------------------------------------------------- /pretraining/train_vocab/train_vocab_singularity.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/pretraining/train_vocab/train_vocab_singularity.sh -------------------------------------------------------------------------------- /resources/gatorTron_workflow.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/uf-hobi-informatics-lab/GatorTron/HEAD/resources/gatorTron_workflow.png --------------------------------------------------------------------------------