├── README.md ├── imgs ├── image-20201213122841703.png ├── image-20201213122906064.png └── image-20201213122915570.png ├── segabert ├── README.md ├── arguments.py ├── bookcorpus │ ├── README.md │ ├── download_files.py │ ├── download_list.py │ ├── epub2txt.py │ ├── make_docs.py │ ├── make_sentlines.py │ ├── preprocess.ipynb │ ├── requirements.txt │ └── tokenize_sentlines.py ├── configure_data.py ├── data_utils │ ├── __init__.py │ ├── corpora.py │ ├── datasets.py │ ├── file_utils.py │ ├── lazy_loader.py │ ├── samplers.py │ ├── tf_dl.py │ ├── tokenization.py │ └── wordpiece.py ├── fp16 │ ├── __init__.py │ ├── fp16.py │ ├── fp16util.py │ └── loss_scaler.py ├── learning_rates.py ├── model │ ├── __init__.py │ ├── distributed.py │ ├── model.py │ ├── modeling.py │ └── utils.py ├── mpu │ ├── __init__.py │ ├── cross_entropy.py │ ├── data.py │ ├── grads.py │ ├── initialize.py │ ├── layers.py │ ├── mappings.py │ ├── random.py │ ├── tests │ │ ├── __init__.py │ │ ├── commons.py │ │ ├── test_cross_entropy.py │ │ ├── test_data.py │ │ ├── test_initialize.py │ │ ├── test_layers.py │ │ └── test_random.py │ ├── transformer.py │ └── utils.py ├── pretrain_segabert.py ├── scripts │ ├── presplit_sentences_json.py │ ├── pretrain_segabert_distributed.sh │ └── split_json.py └── utils.py ├── segatron-xl ├── README.md ├── data_utils.py ├── eval.py ├── fp16 │ ├── __init__.py │ ├── fp16.py │ ├── fp16util.py │ └── loss_scaler.py ├── getdata.sh ├── mem_transformer.py ├── mpu │ ├── __init__.py │ ├── cross_entropy.py │ ├── data.py │ ├── grads.py │ ├── initialize.py │ ├── layers.py │ ├── mappings.py │ ├── random.py │ ├── tests │ │ ├── __init__.py │ │ ├── commons.py │ │ ├── test_cross_entropy.py │ │ ├── test_data.py │ │ ├── test_initialize.py │ │ ├── test_layers.py │ │ └── test_random.py │ ├── transformer.py │ └── utils.py ├── run_wt103_base_sega.sh ├── run_wt103_large_sega.sh ├── train.py └── utils │ ├── adaptive_softmax.py │ ├── data_parallel.py │ ├── exp_utils.py │ ├── log_uniform_sampler.py │ ├── proj_adaptive_softmax.py │ └── vocabulary.py ├── sentence-transformers ├── README.md ├── examples │ └── training_transformers │ │ ├── evaluation_stsall.py │ │ └── training_nli.py ├── sentence_transformers │ ├── LoggingHandler.py │ ├── SentenceTransformer.py │ ├── __init__.py │ ├── datasets │ │ ├── ParallelSentencesDataset.py │ │ ├── SentenceLabelDataset.py │ │ ├── SentencesDataset.py │ │ ├── __init__.py │ │ └── sampler │ │ │ ├── LabelSampler.py │ │ │ └── __init__.py │ ├── evaluation │ │ ├── BinaryEmbeddingSimilarityEvaluator.py │ │ ├── EmbeddingSimilarityEvaluator.py │ │ ├── InformationRetrievalEvaluator.py │ │ ├── LabelAccuracyEvaluator.py │ │ ├── MSEEvaluator.py │ │ ├── MSEEvaluatorFromDataFrame.py │ │ ├── ParaphraseMiningEvaluator.py │ │ ├── SentenceEvaluator.py │ │ ├── SequentialEvaluator.py │ │ ├── SimilarityFunction.py │ │ ├── TranslationEvaluator.py │ │ ├── TripletEvaluator.py │ │ └── __init__.py │ ├── losses │ │ ├── BatchHardSoftMarginTripletLoss.py │ │ ├── BatchHardTripletLoss.py │ │ ├── BatchSemiHardTripletLoss.py │ │ ├── ContrastiveLoss.py │ │ ├── CosineSimilarityLoss.py │ │ ├── MSELoss.py │ │ ├── MultipleNegativesRankingLoss.py │ │ ├── OnlineContrastiveLoss.py │ │ ├── SoftmaxLoss.py │ │ ├── TripletLoss.py │ │ ├── __init__.py │ │ └── test_batch_hard_triplet_loss.py │ ├── models │ │ ├── Transformer.py │ │ ├── __init__.py │ │ └── tokenizer │ │ │ ├── PhraseTokenizer.py │ │ │ ├── WhitespaceTokenizer.py │ │ │ ├── WordTokenizer.py │ │ │ └── __init__.py │ ├── readers │ │ ├── InputExample.py │ │ ├── LabelSentenceReader.py │ │ ├── NLIDataReader.py │ │ ├── PairedFilesReader.py │ │ ├── STSDataReader.py │ │ ├── TripletReader.py │ │ └── __init__.py │ └── util.py ├── setup.cfg └── setup.py └── transformers ├── README.md ├── examples ├── README.md ├── __init__.py ├── eval_finetune │ ├── config │ │ ├── base │ │ │ ├── config.json │ │ │ └── vocab.txt │ │ └── large │ │ │ ├── config.json │ │ │ └── vocab.txt │ ├── download_glue_data.py │ ├── get_aviable_cuda.py │ ├── grid_search_glue.sh │ ├── run_race.sh │ ├── train_glue.sh │ ├── train_squad.sh │ └── train_squad2.sh ├── requirements.txt ├── run_glue.py ├── run_multiple_choice.py ├── run_squad.py └── utils_multiple_choice.py ├── fp16 ├── __init__.py ├── fp16.py ├── fp16util.py └── loss_scaler.py ├── mpu ├── __init__.py ├── cross_entropy.py ├── data.py ├── grads.py ├── initialize.py ├── layers.py ├── mappings.py ├── random.py ├── tests │ ├── __init__.py │ ├── commons.py │ ├── test_cross_entropy.py │ ├── test_data.py │ ├── test_initialize.py │ ├── test_layers.py │ └── test_random.py ├── transformer.py └── utils.py └── transformers ├── __init__.py ├── __main__.py ├── commands ├── __init__.py ├── convert.py ├── download.py ├── run.py ├── serving.py ├── train.py └── user.py ├── configuration_bert.py ├── configuration_utils.py ├── convert_segatron_to_huggingface.py ├── data ├── __init__.py ├── metrics │ ├── __init__.py │ └── squad_metrics.py └── processors │ ├── __init__.py │ ├── glue.py │ ├── split_sentences.py │ ├── squad.py │ ├── utils.py │ └── xnli.py ├── file_utils.py ├── modeling_segabert.py ├── modeling_utils.py ├── optimization.py ├── optimization_tf.py ├── pipelines.py ├── tokenization_bert.py └── tokenization_utils.py /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/README.md -------------------------------------------------------------------------------- /imgs/image-20201213122841703.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/imgs/image-20201213122841703.png -------------------------------------------------------------------------------- /imgs/image-20201213122906064.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/imgs/image-20201213122906064.png -------------------------------------------------------------------------------- /imgs/image-20201213122915570.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/imgs/image-20201213122915570.png -------------------------------------------------------------------------------- /segabert/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/README.md -------------------------------------------------------------------------------- /segabert/arguments.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/arguments.py -------------------------------------------------------------------------------- /segabert/bookcorpus/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/bookcorpus/README.md -------------------------------------------------------------------------------- /segabert/bookcorpus/download_files.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/bookcorpus/download_files.py -------------------------------------------------------------------------------- /segabert/bookcorpus/download_list.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/bookcorpus/download_list.py -------------------------------------------------------------------------------- /segabert/bookcorpus/epub2txt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/bookcorpus/epub2txt.py -------------------------------------------------------------------------------- /segabert/bookcorpus/make_docs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/bookcorpus/make_docs.py -------------------------------------------------------------------------------- /segabert/bookcorpus/make_sentlines.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/bookcorpus/make_sentlines.py -------------------------------------------------------------------------------- /segabert/bookcorpus/preprocess.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/bookcorpus/preprocess.ipynb -------------------------------------------------------------------------------- /segabert/bookcorpus/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/bookcorpus/requirements.txt -------------------------------------------------------------------------------- /segabert/bookcorpus/tokenize_sentlines.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/bookcorpus/tokenize_sentlines.py -------------------------------------------------------------------------------- /segabert/configure_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/configure_data.py -------------------------------------------------------------------------------- /segabert/data_utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/data_utils/__init__.py -------------------------------------------------------------------------------- /segabert/data_utils/corpora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/data_utils/corpora.py -------------------------------------------------------------------------------- /segabert/data_utils/datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/data_utils/datasets.py -------------------------------------------------------------------------------- /segabert/data_utils/file_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/data_utils/file_utils.py -------------------------------------------------------------------------------- /segabert/data_utils/lazy_loader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/data_utils/lazy_loader.py -------------------------------------------------------------------------------- /segabert/data_utils/samplers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/data_utils/samplers.py -------------------------------------------------------------------------------- /segabert/data_utils/tf_dl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/data_utils/tf_dl.py -------------------------------------------------------------------------------- /segabert/data_utils/tokenization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/data_utils/tokenization.py -------------------------------------------------------------------------------- /segabert/data_utils/wordpiece.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/data_utils/wordpiece.py -------------------------------------------------------------------------------- /segabert/fp16/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/fp16/__init__.py -------------------------------------------------------------------------------- /segabert/fp16/fp16.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/fp16/fp16.py -------------------------------------------------------------------------------- /segabert/fp16/fp16util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/fp16/fp16util.py -------------------------------------------------------------------------------- /segabert/fp16/loss_scaler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/fp16/loss_scaler.py -------------------------------------------------------------------------------- /segabert/learning_rates.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/learning_rates.py -------------------------------------------------------------------------------- /segabert/model/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/model/__init__.py -------------------------------------------------------------------------------- /segabert/model/distributed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/model/distributed.py -------------------------------------------------------------------------------- /segabert/model/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/model/model.py -------------------------------------------------------------------------------- /segabert/model/modeling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/model/modeling.py -------------------------------------------------------------------------------- /segabert/model/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/model/utils.py -------------------------------------------------------------------------------- /segabert/mpu/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/mpu/__init__.py -------------------------------------------------------------------------------- /segabert/mpu/cross_entropy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/mpu/cross_entropy.py -------------------------------------------------------------------------------- /segabert/mpu/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/mpu/data.py -------------------------------------------------------------------------------- /segabert/mpu/grads.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/mpu/grads.py -------------------------------------------------------------------------------- /segabert/mpu/initialize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/mpu/initialize.py -------------------------------------------------------------------------------- /segabert/mpu/layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/mpu/layers.py -------------------------------------------------------------------------------- /segabert/mpu/mappings.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/mpu/mappings.py -------------------------------------------------------------------------------- /segabert/mpu/random.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/mpu/random.py -------------------------------------------------------------------------------- /segabert/mpu/tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /segabert/mpu/tests/commons.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/mpu/tests/commons.py -------------------------------------------------------------------------------- /segabert/mpu/tests/test_cross_entropy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/mpu/tests/test_cross_entropy.py -------------------------------------------------------------------------------- /segabert/mpu/tests/test_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/mpu/tests/test_data.py -------------------------------------------------------------------------------- /segabert/mpu/tests/test_initialize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/mpu/tests/test_initialize.py -------------------------------------------------------------------------------- /segabert/mpu/tests/test_layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/mpu/tests/test_layers.py -------------------------------------------------------------------------------- /segabert/mpu/tests/test_random.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/mpu/tests/test_random.py -------------------------------------------------------------------------------- /segabert/mpu/transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/mpu/transformer.py -------------------------------------------------------------------------------- /segabert/mpu/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/mpu/utils.py -------------------------------------------------------------------------------- /segabert/pretrain_segabert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/pretrain_segabert.py -------------------------------------------------------------------------------- /segabert/scripts/presplit_sentences_json.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/scripts/presplit_sentences_json.py -------------------------------------------------------------------------------- /segabert/scripts/pretrain_segabert_distributed.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/scripts/pretrain_segabert_distributed.sh -------------------------------------------------------------------------------- /segabert/scripts/split_json.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/scripts/split_json.py -------------------------------------------------------------------------------- /segabert/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segabert/utils.py -------------------------------------------------------------------------------- /segatron-xl/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/README.md -------------------------------------------------------------------------------- /segatron-xl/data_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/data_utils.py -------------------------------------------------------------------------------- /segatron-xl/eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/eval.py -------------------------------------------------------------------------------- /segatron-xl/fp16/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/fp16/__init__.py -------------------------------------------------------------------------------- /segatron-xl/fp16/fp16.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/fp16/fp16.py -------------------------------------------------------------------------------- /segatron-xl/fp16/fp16util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/fp16/fp16util.py -------------------------------------------------------------------------------- /segatron-xl/fp16/loss_scaler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/fp16/loss_scaler.py -------------------------------------------------------------------------------- /segatron-xl/getdata.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/getdata.sh -------------------------------------------------------------------------------- /segatron-xl/mem_transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/mem_transformer.py -------------------------------------------------------------------------------- /segatron-xl/mpu/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/mpu/__init__.py -------------------------------------------------------------------------------- /segatron-xl/mpu/cross_entropy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/mpu/cross_entropy.py -------------------------------------------------------------------------------- /segatron-xl/mpu/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/mpu/data.py -------------------------------------------------------------------------------- /segatron-xl/mpu/grads.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/mpu/grads.py -------------------------------------------------------------------------------- /segatron-xl/mpu/initialize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/mpu/initialize.py -------------------------------------------------------------------------------- /segatron-xl/mpu/layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/mpu/layers.py -------------------------------------------------------------------------------- /segatron-xl/mpu/mappings.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/mpu/mappings.py -------------------------------------------------------------------------------- /segatron-xl/mpu/random.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/mpu/random.py -------------------------------------------------------------------------------- /segatron-xl/mpu/tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /segatron-xl/mpu/tests/commons.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/mpu/tests/commons.py -------------------------------------------------------------------------------- /segatron-xl/mpu/tests/test_cross_entropy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/mpu/tests/test_cross_entropy.py -------------------------------------------------------------------------------- /segatron-xl/mpu/tests/test_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/mpu/tests/test_data.py -------------------------------------------------------------------------------- /segatron-xl/mpu/tests/test_initialize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/mpu/tests/test_initialize.py -------------------------------------------------------------------------------- /segatron-xl/mpu/tests/test_layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/mpu/tests/test_layers.py -------------------------------------------------------------------------------- /segatron-xl/mpu/tests/test_random.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/mpu/tests/test_random.py -------------------------------------------------------------------------------- /segatron-xl/mpu/transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/mpu/transformer.py -------------------------------------------------------------------------------- /segatron-xl/mpu/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/mpu/utils.py -------------------------------------------------------------------------------- /segatron-xl/run_wt103_base_sega.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/run_wt103_base_sega.sh -------------------------------------------------------------------------------- /segatron-xl/run_wt103_large_sega.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/run_wt103_large_sega.sh -------------------------------------------------------------------------------- /segatron-xl/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/train.py -------------------------------------------------------------------------------- /segatron-xl/utils/adaptive_softmax.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/utils/adaptive_softmax.py -------------------------------------------------------------------------------- /segatron-xl/utils/data_parallel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/utils/data_parallel.py -------------------------------------------------------------------------------- /segatron-xl/utils/exp_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/utils/exp_utils.py -------------------------------------------------------------------------------- /segatron-xl/utils/log_uniform_sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/utils/log_uniform_sampler.py -------------------------------------------------------------------------------- /segatron-xl/utils/proj_adaptive_softmax.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/utils/proj_adaptive_softmax.py -------------------------------------------------------------------------------- /segatron-xl/utils/vocabulary.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/segatron-xl/utils/vocabulary.py -------------------------------------------------------------------------------- /sentence-transformers/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/README.md -------------------------------------------------------------------------------- /sentence-transformers/examples/training_transformers/evaluation_stsall.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/examples/training_transformers/evaluation_stsall.py -------------------------------------------------------------------------------- /sentence-transformers/examples/training_transformers/training_nli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/examples/training_transformers/training_nli.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/LoggingHandler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/LoggingHandler.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/SentenceTransformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/SentenceTransformer.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/__init__.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/datasets/ParallelSentencesDataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/datasets/ParallelSentencesDataset.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/datasets/SentenceLabelDataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/datasets/SentenceLabelDataset.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/datasets/SentencesDataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/datasets/SentencesDataset.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/datasets/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/datasets/__init__.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/datasets/sampler/LabelSampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/datasets/sampler/LabelSampler.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/datasets/sampler/__init__.py: -------------------------------------------------------------------------------- 1 | from .LabelSampler import * -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/evaluation/BinaryEmbeddingSimilarityEvaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/evaluation/BinaryEmbeddingSimilarityEvaluator.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/evaluation/EmbeddingSimilarityEvaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/evaluation/EmbeddingSimilarityEvaluator.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/evaluation/InformationRetrievalEvaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/evaluation/InformationRetrievalEvaluator.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/evaluation/LabelAccuracyEvaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/evaluation/LabelAccuracyEvaluator.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/evaluation/MSEEvaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/evaluation/MSEEvaluator.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/evaluation/MSEEvaluatorFromDataFrame.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/evaluation/MSEEvaluatorFromDataFrame.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/evaluation/ParaphraseMiningEvaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/evaluation/ParaphraseMiningEvaluator.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/evaluation/SentenceEvaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/evaluation/SentenceEvaluator.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/evaluation/SequentialEvaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/evaluation/SequentialEvaluator.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/evaluation/SimilarityFunction.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/evaluation/SimilarityFunction.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/evaluation/TranslationEvaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/evaluation/TranslationEvaluator.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/evaluation/TripletEvaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/evaluation/TripletEvaluator.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/evaluation/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/evaluation/__init__.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/losses/BatchHardSoftMarginTripletLoss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/losses/BatchHardSoftMarginTripletLoss.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/losses/BatchHardTripletLoss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/losses/BatchHardTripletLoss.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/losses/BatchSemiHardTripletLoss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/losses/BatchSemiHardTripletLoss.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/losses/ContrastiveLoss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/losses/ContrastiveLoss.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/losses/CosineSimilarityLoss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/losses/CosineSimilarityLoss.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/losses/MSELoss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/losses/MSELoss.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/losses/MultipleNegativesRankingLoss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/losses/MultipleNegativesRankingLoss.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/losses/OnlineContrastiveLoss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/losses/OnlineContrastiveLoss.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/losses/SoftmaxLoss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/losses/SoftmaxLoss.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/losses/TripletLoss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/losses/TripletLoss.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/losses/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/losses/__init__.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/losses/test_batch_hard_triplet_loss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/losses/test_batch_hard_triplet_loss.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/models/Transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/models/Transformer.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/models/__init__.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/models/tokenizer/PhraseTokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/models/tokenizer/PhraseTokenizer.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/models/tokenizer/WhitespaceTokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/models/tokenizer/WhitespaceTokenizer.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/models/tokenizer/WordTokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/models/tokenizer/WordTokenizer.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/models/tokenizer/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/models/tokenizer/__init__.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/readers/InputExample.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/readers/InputExample.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/readers/LabelSentenceReader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/readers/LabelSentenceReader.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/readers/NLIDataReader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/readers/NLIDataReader.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/readers/PairedFilesReader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/readers/PairedFilesReader.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/readers/STSDataReader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/readers/STSDataReader.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/readers/TripletReader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/readers/TripletReader.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/readers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/readers/__init__.py -------------------------------------------------------------------------------- /sentence-transformers/sentence_transformers/util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/sentence_transformers/util.py -------------------------------------------------------------------------------- /sentence-transformers/setup.cfg: -------------------------------------------------------------------------------- 1 | [metadata] 2 | description-file = README.md -------------------------------------------------------------------------------- /sentence-transformers/setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/sentence-transformers/setup.py -------------------------------------------------------------------------------- /transformers/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/README.md -------------------------------------------------------------------------------- /transformers/examples/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/examples/README.md -------------------------------------------------------------------------------- /transformers/examples/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers/examples/eval_finetune/config/base/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/examples/eval_finetune/config/base/config.json -------------------------------------------------------------------------------- /transformers/examples/eval_finetune/config/base/vocab.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/examples/eval_finetune/config/base/vocab.txt -------------------------------------------------------------------------------- /transformers/examples/eval_finetune/config/large/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/examples/eval_finetune/config/large/config.json -------------------------------------------------------------------------------- /transformers/examples/eval_finetune/config/large/vocab.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/examples/eval_finetune/config/large/vocab.txt -------------------------------------------------------------------------------- /transformers/examples/eval_finetune/download_glue_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/examples/eval_finetune/download_glue_data.py -------------------------------------------------------------------------------- /transformers/examples/eval_finetune/get_aviable_cuda.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/examples/eval_finetune/get_aviable_cuda.py -------------------------------------------------------------------------------- /transformers/examples/eval_finetune/grid_search_glue.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/examples/eval_finetune/grid_search_glue.sh -------------------------------------------------------------------------------- /transformers/examples/eval_finetune/run_race.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/examples/eval_finetune/run_race.sh -------------------------------------------------------------------------------- /transformers/examples/eval_finetune/train_glue.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/examples/eval_finetune/train_glue.sh -------------------------------------------------------------------------------- /transformers/examples/eval_finetune/train_squad.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/examples/eval_finetune/train_squad.sh -------------------------------------------------------------------------------- /transformers/examples/eval_finetune/train_squad2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/examples/eval_finetune/train_squad2.sh -------------------------------------------------------------------------------- /transformers/examples/requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/examples/requirements.txt -------------------------------------------------------------------------------- /transformers/examples/run_glue.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/examples/run_glue.py -------------------------------------------------------------------------------- /transformers/examples/run_multiple_choice.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/examples/run_multiple_choice.py -------------------------------------------------------------------------------- /transformers/examples/run_squad.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/examples/run_squad.py -------------------------------------------------------------------------------- /transformers/examples/utils_multiple_choice.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/examples/utils_multiple_choice.py -------------------------------------------------------------------------------- /transformers/fp16/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/fp16/__init__.py -------------------------------------------------------------------------------- /transformers/fp16/fp16.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/fp16/fp16.py -------------------------------------------------------------------------------- /transformers/fp16/fp16util.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/fp16/fp16util.py -------------------------------------------------------------------------------- /transformers/fp16/loss_scaler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/fp16/loss_scaler.py -------------------------------------------------------------------------------- /transformers/mpu/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/mpu/__init__.py -------------------------------------------------------------------------------- /transformers/mpu/cross_entropy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/mpu/cross_entropy.py -------------------------------------------------------------------------------- /transformers/mpu/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/mpu/data.py -------------------------------------------------------------------------------- /transformers/mpu/grads.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/mpu/grads.py -------------------------------------------------------------------------------- /transformers/mpu/initialize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/mpu/initialize.py -------------------------------------------------------------------------------- /transformers/mpu/layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/mpu/layers.py -------------------------------------------------------------------------------- /transformers/mpu/mappings.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/mpu/mappings.py -------------------------------------------------------------------------------- /transformers/mpu/random.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/mpu/random.py -------------------------------------------------------------------------------- /transformers/mpu/tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers/mpu/tests/commons.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/mpu/tests/commons.py -------------------------------------------------------------------------------- /transformers/mpu/tests/test_cross_entropy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/mpu/tests/test_cross_entropy.py -------------------------------------------------------------------------------- /transformers/mpu/tests/test_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/mpu/tests/test_data.py -------------------------------------------------------------------------------- /transformers/mpu/tests/test_initialize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/mpu/tests/test_initialize.py -------------------------------------------------------------------------------- /transformers/mpu/tests/test_layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/mpu/tests/test_layers.py -------------------------------------------------------------------------------- /transformers/mpu/tests/test_random.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/mpu/tests/test_random.py -------------------------------------------------------------------------------- /transformers/mpu/transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/mpu/transformer.py -------------------------------------------------------------------------------- /transformers/mpu/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/mpu/utils.py -------------------------------------------------------------------------------- /transformers/transformers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/__init__.py -------------------------------------------------------------------------------- /transformers/transformers/__main__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/__main__.py -------------------------------------------------------------------------------- /transformers/transformers/commands/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/commands/__init__.py -------------------------------------------------------------------------------- /transformers/transformers/commands/convert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/commands/convert.py -------------------------------------------------------------------------------- /transformers/transformers/commands/download.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/commands/download.py -------------------------------------------------------------------------------- /transformers/transformers/commands/run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/commands/run.py -------------------------------------------------------------------------------- /transformers/transformers/commands/serving.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/commands/serving.py -------------------------------------------------------------------------------- /transformers/transformers/commands/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/commands/train.py -------------------------------------------------------------------------------- /transformers/transformers/commands/user.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/commands/user.py -------------------------------------------------------------------------------- /transformers/transformers/configuration_bert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/configuration_bert.py -------------------------------------------------------------------------------- /transformers/transformers/configuration_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/configuration_utils.py -------------------------------------------------------------------------------- /transformers/transformers/convert_segatron_to_huggingface.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/convert_segatron_to_huggingface.py -------------------------------------------------------------------------------- /transformers/transformers/data/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/data/__init__.py -------------------------------------------------------------------------------- /transformers/transformers/data/metrics/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/data/metrics/__init__.py -------------------------------------------------------------------------------- /transformers/transformers/data/metrics/squad_metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/data/metrics/squad_metrics.py -------------------------------------------------------------------------------- /transformers/transformers/data/processors/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/data/processors/__init__.py -------------------------------------------------------------------------------- /transformers/transformers/data/processors/glue.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/data/processors/glue.py -------------------------------------------------------------------------------- /transformers/transformers/data/processors/split_sentences.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/data/processors/split_sentences.py -------------------------------------------------------------------------------- /transformers/transformers/data/processors/squad.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/data/processors/squad.py -------------------------------------------------------------------------------- /transformers/transformers/data/processors/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/data/processors/utils.py -------------------------------------------------------------------------------- /transformers/transformers/data/processors/xnli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/data/processors/xnli.py -------------------------------------------------------------------------------- /transformers/transformers/file_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/file_utils.py -------------------------------------------------------------------------------- /transformers/transformers/modeling_segabert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/modeling_segabert.py -------------------------------------------------------------------------------- /transformers/transformers/modeling_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/modeling_utils.py -------------------------------------------------------------------------------- /transformers/transformers/optimization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/optimization.py -------------------------------------------------------------------------------- /transformers/transformers/optimization_tf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/optimization_tf.py -------------------------------------------------------------------------------- /transformers/transformers/pipelines.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/pipelines.py -------------------------------------------------------------------------------- /transformers/transformers/tokenization_bert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/tokenization_bert.py -------------------------------------------------------------------------------- /transformers/transformers/tokenization_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/rsvp-ai/segatron_aaai/HEAD/transformers/transformers/tokenization_utils.py --------------------------------------------------------------------------------