├── README.md ├── img ├── Background.png ├── equation.png ├── hyperparameter.png └── overview.png ├── reasoning_evaluation ├── gsm8k │ ├── adaptive │ │ ├── ada_13B_gsm8k.json │ │ ├── ada_70B_gsm8k.json │ │ └── ada_7B_gsm8k.json │ ├── greedy │ │ ├── greedy_13B_gsm8k.json │ │ ├── greedy_70B_gsm8k.json │ │ └── greedy_7B_gsm8k.json │ └── topp │ │ ├── top95_13B_gsm8k.json │ │ ├── top95_70B_gsm8k.json │ │ └── top95_7B_gsm8k.json └── multiarith │ ├── adaptive │ ├── ada_13B_multiarith.json │ ├── ada_70B_multiarith.json │ └── ada_7B_multiarith.json │ ├── greedy │ ├── greedy_13B_multiarith.json │ ├── greedy_70B_multiarith.json │ └── greedy_7B_multiarith.json │ └── topp │ ├── top95_13B_multiarith.json │ ├── top95_70B_multiarith.json │ └── top95_70Btrue_multiarith.json ├── test.ipynb └── transformers-main ├── .coveragerc ├── .gitattributes ├── .gitignore ├── CITATION.cff ├── CODE_OF_CONDUCT.md ├── CONTRIBUTING.md ├── ISSUES.md ├── LICENSE ├── Makefile ├── README.md ├── README_de.md ├── README_es.md ├── README_fr.md ├── README_hd.md ├── README_ja.md ├── README_ko.md ├── README_pt-br.md ├── README_ru.md ├── README_te.md ├── README_vi.md ├── README_zh-hans.md ├── README_zh-hant.md ├── SECURITY.md ├── awesome-transformers.md ├── conftest.py ├── docker ├── transformers-all-latest-gpu │ └── Dockerfile ├── transformers-doc-builder │ └── Dockerfile ├── transformers-gpu │ └── Dockerfile ├── transformers-past-gpu │ └── Dockerfile ├── transformers-pytorch-amd-gpu │ └── Dockerfile ├── transformers-pytorch-deepspeed-amd-gpu │ └── Dockerfile ├── transformers-pytorch-deepspeed-latest-gpu │ └── Dockerfile ├── transformers-pytorch-deepspeed-nightly-gpu │ └── Dockerfile ├── transformers-pytorch-gpu │ └── Dockerfile ├── transformers-pytorch-tpu │ ├── Dockerfile │ ├── bert-base-cased.jsonnet │ ├── dataset.yaml │ └── docker-entrypoint.sh ├── transformers-quantization-latest-gpu │ └── Dockerfile └── transformers-tensorflow-gpu │ └── Dockerfile ├── docs ├── README.md ├── TRANSLATING.md └── source │ ├── _config.py │ ├── de │ ├── _config.py │ ├── _toctree.yml │ ├── accelerate.md │ ├── add_new_model.md │ ├── add_new_pipeline.md │ ├── add_tensorflow_model.md │ ├── autoclass_tutorial.md │ ├── contributing.md │ ├── index.md │ ├── installation.md │ ├── llm_tutorial.md │ ├── model_sharing.md │ ├── peft.md │ ├── pipeline_tutorial.md │ ├── pr_checks.md │ ├── preprocessing.md │ ├── quicktour.md │ ├── run_scripts.md │ ├── testing.md │ ├── training.md │ └── transformers_agents.md │ ├── en │ ├── _config.py │ ├── _redirects.yml │ ├── _toctree.yml │ ├── accelerate.md │ ├── add_new_model.md │ ├── add_new_pipeline.md │ ├── add_tensorflow_model.md │ ├── attention.md │ ├── autoclass_tutorial.md │ ├── benchmarks.md │ ├── bertology.md │ ├── big_models.md │ ├── chat_templating.md │ ├── community.md │ ├── contributing.md │ ├── create_a_model.md │ ├── custom_models.md │ ├── custom_tools.md │ ├── debugging.md │ ├── deepspeed.md │ ├── fast_tokenizers.md │ ├── fsdp.md │ ├── generation_strategies.md │ ├── glossary.md │ ├── hf_quantizer.md │ ├── hpo_train.md │ ├── index.md │ ├── installation.md │ ├── internal │ │ ├── audio_utils.md │ │ ├── file_utils.md │ │ ├── generation_utils.md │ │ ├── image_processing_utils.md │ │ ├── modeling_utils.md │ │ ├── pipelines_utils.md │ │ ├── time_series_utils.md │ │ ├── tokenization_utils.md │ │ └── trainer_utils.md │ ├── llm_tutorial.md │ ├── llm_tutorial_optimization.md │ ├── main_classes │ │ ├── agent.md │ │ ├── backbones.md │ │ ├── callback.md │ │ ├── configuration.md │ │ ├── data_collator.md │ │ ├── deepspeed.md │ │ ├── feature_extractor.md │ │ ├── image_processor.md │ │ ├── keras_callbacks.md │ │ ├── logging.md │ │ ├── model.md │ │ ├── onnx.md │ │ ├── optimizer_schedules.md │ │ ├── output.md │ │ ├── pipelines.md │ │ ├── processors.md │ │ ├── quantization.md │ │ ├── text_generation.md │ │ ├── tokenizer.md │ │ └── trainer.md │ ├── model_doc │ │ ├── albert.md │ │ ├── align.md │ │ ├── altclip.md │ │ ├── audio-spectrogram-transformer.md │ │ ├── auto.md │ │ ├── autoformer.md │ │ ├── bark.md │ │ ├── bart.md │ │ ├── barthez.md │ │ ├── bartpho.md │ │ ├── beit.md │ │ ├── bert-generation.md │ │ ├── bert-japanese.md │ │ ├── bert.md │ │ ├── bertweet.md │ │ ├── big_bird.md │ │ ├── bigbird_pegasus.md │ │ ├── biogpt.md │ │ ├── bit.md │ │ ├── blenderbot-small.md │ │ ├── blenderbot.md │ │ ├── blip-2.md │ │ ├── blip.md │ │ ├── bloom.md │ │ ├── bort.md │ │ ├── bridgetower.md │ │ ├── bros.md │ │ ├── byt5.md │ │ ├── camembert.md │ │ ├── canine.md │ │ ├── chinese_clip.md │ │ ├── clap.md │ │ ├── clip.md │ │ ├── clipseg.md │ │ ├── clvp.md │ │ ├── code_llama.md │ │ ├── codegen.md │ │ ├── cohere.md │ │ ├── conditional_detr.md │ │ ├── convbert.md │ │ ├── convnext.md │ │ ├── convnextv2.md │ │ ├── cpm.md │ │ ├── cpmant.md │ │ ├── ctrl.md │ │ ├── cvt.md │ │ ├── data2vec.md │ │ ├── dbrx.md │ │ ├── deberta-v2.md │ │ ├── deberta.md │ │ ├── decision_transformer.md │ │ ├── deformable_detr.md │ │ ├── deit.md │ │ ├── deplot.md │ │ ├── depth_anything.md │ │ ├── deta.md │ │ ├── detr.md │ │ ├── dialogpt.md │ │ ├── dinat.md │ │ ├── dinov2.md │ │ ├── distilbert.md │ │ ├── dit.md │ │ ├── donut.md │ │ ├── dpr.md │ │ ├── dpt.md │ │ ├── efficientformer.md │ │ ├── efficientnet.md │ │ ├── electra.md │ │ ├── encodec.md │ │ ├── encoder-decoder.md │ │ ├── ernie.md │ │ ├── ernie_m.md │ │ ├── esm.md │ │ ├── falcon.md │ │ ├── fastspeech2_conformer.md │ │ ├── flan-t5.md │ │ ├── flan-ul2.md │ │ ├── flaubert.md │ │ ├── flava.md │ │ ├── fnet.md │ │ ├── focalnet.md │ │ ├── fsmt.md │ │ ├── funnel.md │ │ ├── fuyu.md │ │ ├── gemma.md │ │ ├── git.md │ │ ├── glpn.md │ │ ├── gpt-sw3.md │ │ ├── gpt2.md │ │ ├── gpt_bigcode.md │ │ ├── gpt_neo.md │ │ ├── gpt_neox.md │ │ ├── gpt_neox_japanese.md │ │ ├── gptj.md │ │ ├── gptsan-japanese.md │ │ ├── graphormer.md │ │ ├── grounding-dino.md │ │ ├── groupvit.md │ │ ├── herbert.md │ │ ├── hubert.md │ │ ├── ibert.md │ │ ├── idefics.md │ │ ├── idefics2.md │ │ ├── imagegpt.md │ │ ├── informer.md │ │ ├── instructblip.md │ │ ├── jamba.md │ │ ├── jukebox.md │ │ ├── kosmos-2.md │ │ ├── layoutlm.md │ │ ├── layoutlmv2.md │ │ ├── layoutlmv3.md │ │ ├── layoutxlm.md │ │ ├── led.md │ │ ├── levit.md │ │ ├── lilt.md │ │ ├── llama.md │ │ ├── llama2.md │ │ ├── llava.md │ │ ├── llava_next.md │ │ ├── longformer.md │ │ ├── longt5.md │ │ ├── luke.md │ │ ├── lxmert.md │ │ ├── m2m_100.md │ │ ├── madlad-400.md │ │ ├── mamba.md │ │ ├── marian.md │ │ ├── markuplm.md │ │ ├── mask2former.md │ │ ├── maskformer.md │ │ ├── matcha.md │ │ ├── mbart.md │ │ ├── mctct.md │ │ ├── mega.md │ │ ├── megatron-bert.md │ │ ├── megatron_gpt2.md │ │ ├── mgp-str.md │ │ ├── mistral.md │ │ ├── mixtral.md │ │ ├── mluke.md │ │ ├── mms.md │ │ ├── mobilebert.md │ │ ├── mobilenet_v1.md │ │ ├── mobilenet_v2.md │ │ ├── mobilevit.md │ │ ├── mobilevitv2.md │ │ ├── mpnet.md │ │ ├── mpt.md │ │ ├── mra.md │ │ ├── mt5.md │ │ ├── musicgen.md │ │ ├── musicgen_melody.md │ │ ├── mvp.md │ │ ├── nat.md │ │ ├── nezha.md │ │ ├── nllb-moe.md │ │ ├── nllb.md │ │ ├── nougat.md │ │ ├── nystromformer.md │ │ ├── olmo.md │ │ ├── oneformer.md │ │ ├── open-llama.md │ │ ├── openai-gpt.md │ │ ├── opt.md │ │ ├── owlv2.md │ │ ├── owlvit.md │ │ ├── patchtsmixer.md │ │ ├── patchtst.md │ │ ├── pegasus.md │ │ ├── pegasus_x.md │ │ ├── perceiver.md │ │ ├── persimmon.md │ │ ├── phi.md │ │ ├── phobert.md │ │ ├── pix2struct.md │ │ ├── plbart.md │ │ ├── poolformer.md │ │ ├── pop2piano.md │ │ ├── prophetnet.md │ │ ├── pvt.md │ │ ├── pvt_v2.md │ │ ├── qdqbert.md │ │ ├── qwen2.md │ │ ├── qwen2_moe.md │ │ ├── rag.md │ │ ├── realm.md │ │ ├── recurrent_gemma.md │ │ ├── reformer.md │ │ ├── regnet.md │ │ ├── rembert.md │ │ ├── resnet.md │ │ ├── retribert.md │ │ ├── roberta-prelayernorm.md │ │ ├── roberta.md │ │ ├── roc_bert.md │ │ ├── roformer.md │ │ ├── rwkv.md │ │ ├── sam.md │ │ ├── seamless_m4t.md │ │ ├── seamless_m4t_v2.md │ │ ├── segformer.md │ │ ├── seggpt.md │ │ ├── sew-d.md │ │ ├── sew.md │ │ ├── siglip.md │ │ ├── speech-encoder-decoder.md │ │ ├── speech_to_text.md │ │ ├── speech_to_text_2.md │ │ ├── speecht5.md │ │ ├── splinter.md │ │ ├── squeezebert.md │ │ ├── stablelm.md │ │ ├── starcoder2.md │ │ ├── superpoint.md │ │ ├── swiftformer.md │ │ ├── swin.md │ │ ├── swin2sr.md │ │ ├── swinv2.md │ │ ├── switch_transformers.md │ │ ├── t5.md │ │ ├── t5v1.1.md │ │ ├── table-transformer.md │ │ ├── tapas.md │ │ ├── tapex.md │ │ ├── time_series_transformer.md │ │ ├── timesformer.md │ │ ├── trajectory_transformer.md │ │ ├── transfo-xl.md │ │ ├── trocr.md │ │ ├── tvlt.md │ │ ├── tvp.md │ │ ├── udop.md │ │ ├── ul2.md │ │ ├── umt5.md │ │ ├── unispeech-sat.md │ │ ├── unispeech.md │ │ ├── univnet.md │ │ ├── upernet.md │ │ ├── van.md │ │ ├── videomae.md │ │ ├── vilt.md │ │ ├── vipllava.md │ │ ├── vision-encoder-decoder.md │ │ ├── vision-text-dual-encoder.md │ │ ├── visual_bert.md │ │ ├── vit.md │ │ ├── vit_hybrid.md │ │ ├── vit_mae.md │ │ ├── vit_msn.md │ │ ├── vitdet.md │ │ ├── vitmatte.md │ │ ├── vits.md │ │ ├── vivit.md │ │ ├── wav2vec2-bert.md │ │ ├── wav2vec2-conformer.md │ │ ├── wav2vec2.md │ │ ├── wav2vec2_phoneme.md │ │ ├── wavlm.md │ │ ├── whisper.md │ │ ├── xclip.md │ │ ├── xglm.md │ │ ├── xlm-prophetnet.md │ │ ├── xlm-roberta-xl.md │ │ ├── xlm-roberta.md │ │ ├── xlm-v.md │ │ ├── xlm.md │ │ ├── xlnet.md │ │ ├── xls_r.md │ │ ├── xlsr_wav2vec2.md │ │ ├── xmod.md │ │ ├── yolos.md │ │ └── yoso.md │ ├── model_memory_anatomy.md │ ├── model_sharing.md │ ├── model_summary.md │ ├── multilingual.md │ ├── notebooks.md │ ├── pad_truncation.md │ ├── peft.md │ ├── perf_hardware.md │ ├── perf_infer_cpu.md │ ├── perf_infer_gpu_one.md │ ├── perf_torch_compile.md │ ├── perf_train_cpu.md │ ├── perf_train_cpu_many.md │ ├── perf_train_gpu_many.md │ ├── perf_train_gpu_one.md │ ├── perf_train_special.md │ ├── perf_train_tpu_tf.md │ ├── performance.md │ ├── perplexity.md │ ├── philosophy.md │ ├── pipeline_tutorial.md │ ├── pipeline_webserver.md │ ├── pr_checks.md │ ├── preprocessing.md │ ├── quantization.md │ ├── quicktour.md │ ├── run_scripts.md │ ├── sagemaker.md │ ├── serialization.md │ ├── task_summary.md │ ├── tasks │ │ ├── asr.md │ │ ├── audio_classification.md │ │ ├── document_question_answering.md │ │ ├── idefics.md │ │ ├── image_captioning.md │ │ ├── image_classification.md │ │ ├── image_feature_extraction.md │ │ ├── image_to_image.md │ │ ├── knowledge_distillation_for_image_classification.md │ │ ├── language_modeling.md │ │ ├── mask_generation.md │ │ ├── masked_language_modeling.md │ │ ├── monocular_depth_estimation.md │ │ ├── multiple_choice.md │ │ ├── object_detection.md │ │ ├── prompting.md │ │ ├── question_answering.md │ │ ├── semantic_segmentation.md │ │ ├── sequence_classification.md │ │ ├── summarization.md │ │ ├── text-to-speech.md │ │ ├── token_classification.md │ │ ├── translation.md │ │ ├── video_classification.md │ │ ├── visual_question_answering.md │ │ ├── zero_shot_image_classification.md │ │ └── zero_shot_object_detection.md │ ├── tasks_explained.md │ ├── testing.md │ ├── tf_xla.md │ ├── tflite.md │ ├── tokenizer_summary.md │ ├── torchscript.md │ ├── trainer.md │ ├── training.md │ ├── transformers_agents.md │ └── troubleshooting.md │ ├── es │ ├── _config.py │ ├── _toctree.yml │ ├── accelerate.md │ ├── add_new_pipeline.md │ ├── attention.md │ ├── autoclass_tutorial.md │ ├── bertology.md │ ├── chat_templating.md │ ├── community.md │ ├── converting_tensorflow_models.md │ ├── create_a_model.md │ ├── custom_models.md │ ├── debugging.md │ ├── fast_tokenizers.md │ ├── glossary.md │ ├── index.md │ ├── installation.md │ ├── model_sharing.md │ ├── multilingual.md │ ├── pad_truncation.md │ ├── performance.md │ ├── perplexity.md │ ├── philosophy.md │ ├── pipeline_tutorial.md │ ├── pr_checks.md │ ├── preprocessing.md │ ├── quicktour.md │ ├── run_scripts.md │ ├── sagemaker.md │ ├── serialization.md │ ├── task_summary.md │ ├── tasks │ │ ├── asr.md │ │ ├── image_captioning.md │ │ ├── image_classification.md │ │ ├── language_modeling.md │ │ ├── multiple_choice.md │ │ ├── question_answering.md │ │ └── summarization.md │ ├── tasks_explained.md │ ├── torchscript.md │ ├── trainer.md │ └── training.md │ ├── fr │ ├── _config.py │ ├── _toctree.yml │ ├── autoclass_tutorial.md │ ├── in_translation.md │ ├── index.md │ ├── installation.md │ └── quicktour.md │ ├── hi │ ├── _toctree.yml │ └── pipeline_tutorial.md │ ├── it │ ├── _config.py │ ├── _toctree.yml │ ├── accelerate.md │ ├── add_new_model.md │ ├── add_new_pipeline.md │ ├── autoclass_tutorial.md │ ├── big_models.md │ ├── community.md │ ├── converting_tensorflow_models.md │ ├── create_a_model.md │ ├── custom_models.md │ ├── debugging.md │ ├── index.md │ ├── installation.md │ ├── migration.md │ ├── model_sharing.md │ ├── multilingual.md │ ├── perf_hardware.md │ ├── perf_infer_cpu.md │ ├── perf_infer_gpu_many.md │ ├── perf_infer_gpu_one.md │ ├── perf_infer_special.md │ ├── perf_train_cpu.md │ ├── perf_train_cpu_many.md │ ├── perf_train_special.md │ ├── perf_train_tpu.md │ ├── pipeline_tutorial.md │ ├── pr_checks.md │ ├── preprocessing.md │ ├── quicktour.md │ ├── run_scripts.md │ ├── serialization.md │ └── training.md │ ├── ja │ ├── _toctree.yml │ ├── accelerate.md │ ├── add_new_model.md │ ├── add_tensorflow_model.md │ ├── attention.md │ ├── autoclass_tutorial.md │ ├── benchmarks.md │ ├── bertology.md │ ├── big_models.md │ ├── chat_templating.md │ ├── community.md │ ├── create_a_model.md │ ├── custom_models.md │ ├── custom_tools.md │ ├── fast_tokenizers.md │ ├── generation_strategies.md │ ├── glossary.md │ ├── hpo_train.md │ ├── index.md │ ├── installation.md │ ├── internal │ │ ├── audio_utils.md │ │ ├── file_utils.md │ │ ├── generation_utils.md │ │ ├── image_processing_utils.md │ │ ├── modeling_utils.md │ │ ├── pipelines_utils.md │ │ ├── time_series_utils.md │ │ ├── tokenization_utils.md │ │ └── trainer_utils.md │ ├── llm_tutorial.md │ ├── main_classes │ │ ├── agent.md │ │ ├── callback.md │ │ ├── configuration.md │ │ ├── data_collator.md │ │ ├── deepspeed.md │ │ ├── feature_extractor.md │ │ ├── image_processor.md │ │ ├── keras_callbacks.md │ │ ├── logging.md │ │ ├── model.md │ │ ├── onnx.md │ │ ├── optimizer_schedules.md │ │ ├── output.md │ │ ├── pipelines.md │ │ ├── processors.md │ │ ├── quantization.md │ │ ├── text_generation.md │ │ ├── tokenizer.md │ │ └── trainer.md │ ├── model_doc │ │ ├── albert.md │ │ ├── align.md │ │ ├── altclip.md │ │ ├── audio-spectrogram-transformer.md │ │ ├── auto.md │ │ ├── autoformer.md │ │ ├── bark.md │ │ ├── bart.md │ │ ├── barthez.md │ │ ├── bartpho.md │ │ ├── beit.md │ │ ├── bert-generation.md │ │ ├── bert-japanese.md │ │ ├── bert.md │ │ ├── bertweet.md │ │ ├── big_bird.md │ │ ├── bigbird_pegasus.md │ │ ├── biogpt.md │ │ ├── bit.md │ │ ├── blenderbot-small.md │ │ ├── blenderbot.md │ │ ├── blip-2.md │ │ ├── blip.md │ │ ├── bloom.md │ │ ├── bort.md │ │ ├── bridgetower.md │ │ ├── bros.md │ │ ├── byt5.md │ │ ├── camembert.md │ │ ├── canine.md │ │ ├── chinese_clip.md │ │ ├── clap.md │ │ ├── clip.md │ │ ├── clipseg.md │ │ ├── clvp.md │ │ ├── code_llama.md │ │ ├── codegen.md │ │ ├── conditional_detr.md │ │ ├── convbert.md │ │ ├── convnext.md │ │ ├── convnextv2.md │ │ ├── cpm.md │ │ ├── cpmant.md │ │ ├── ctrl.md │ │ ├── cvt.md │ │ ├── data2vec.md │ │ ├── deberta-v2.md │ │ ├── deberta.md │ │ ├── decision_transformer.md │ │ ├── deformable_detr.md │ │ ├── deit.md │ │ ├── deplot.md │ │ ├── deta.md │ │ ├── detr.md │ │ ├── dialogpt.md │ │ └── dinat.md │ ├── model_memory_anatomy.md │ ├── model_sharing.md │ ├── model_summary.md │ ├── multilingual.md │ ├── pad_truncation.md │ ├── peft.md │ ├── perf_hardware.md │ ├── perf_infer_cpu.md │ ├── perf_infer_gpu_many.md │ ├── perf_infer_gpu_one.md │ ├── perf_infer_special.md │ ├── perf_torch_compile.md │ ├── perf_train_cpu.md │ ├── perf_train_cpu_many.md │ ├── perf_train_gpu_many.md │ ├── perf_train_gpu_one.md │ ├── perf_train_special.md │ ├── perf_train_tpu.md │ ├── perf_train_tpu_tf.md │ ├── performance.md │ ├── perplexity.md │ ├── philosophy.md │ ├── pipeline_tutorial.md │ ├── pipeline_webserver.md │ ├── pr_checks.md │ ├── preprocessing.md │ ├── quicktour.md │ ├── run_scripts.md │ ├── serialization.md │ ├── task_summary.md │ ├── tasks │ │ ├── asr.md │ │ ├── audio_classification.md │ │ ├── document_question_answering.md │ │ ├── idefics.md │ │ ├── image_captioning.md │ │ ├── image_classification.md │ │ ├── image_to_image.md │ │ ├── knowledge_distillation_for_image_classification.md │ │ ├── language_modeling.md │ │ ├── masked_language_modeling.md │ │ ├── monocular_depth_estimation.md │ │ ├── multiple_choice.md │ │ ├── object_detection.md │ │ ├── prompting.md │ │ ├── question_answering.md │ │ ├── semantic_segmentation.md │ │ ├── sequence_classification.md │ │ ├── summarization.md │ │ ├── text-to-speech.md │ │ ├── token_classification.md │ │ ├── translation.md │ │ ├── video_classification.md │ │ ├── visual_question_answering.md │ │ ├── zero_shot_image_classification.md │ │ └── zero_shot_object_detection.md │ ├── tasks_explained.md │ ├── testing.md │ ├── tf_xla.md │ ├── tflite.md │ ├── tokenizer_summary.md │ ├── torchscript.md │ ├── training.md │ ├── transformers_agents.md │ └── troubleshooting.md │ ├── ko │ ├── _config.py │ ├── _toctree.yml │ ├── accelerate.md │ ├── add_new_model.md │ ├── add_new_pipeline.md │ ├── add_tensorflow_model.md │ ├── attention.md │ ├── autoclass_tutorial.md │ ├── bertology.md │ ├── big_models.md │ ├── community.md │ ├── contributing.md │ ├── create_a_model.md │ ├── custom_models.md │ ├── custom_tools.md │ ├── debugging.md │ ├── fast_tokenizers.md │ ├── generation_strategies.md │ ├── hpo_train.md │ ├── in_translation.md │ ├── index.md │ ├── installation.md │ ├── llm_tutorial.md │ ├── model_doc │ │ ├── llama.md │ │ ├── llama2.md │ │ └── whisper.md │ ├── model_memory_anatomy.md │ ├── model_sharing.md │ ├── model_summary.md │ ├── multilingual.md │ ├── pad_truncation.md │ ├── peft.md │ ├── perf_hardware.md │ ├── perf_infer_cpu.md │ ├── perf_infer_gpu_one.md │ ├── perf_train_cpu.md │ ├── perf_train_cpu_many.md │ ├── perf_train_gpu_many.md │ ├── perf_train_tpu_tf.md │ ├── performance.md │ ├── perplexity.md │ ├── philosophy.md │ ├── pipeline_tutorial.md │ ├── pipeline_webserver.md │ ├── pr_checks.md │ ├── preprocessing.md │ ├── quicktour.md │ ├── run_scripts.md │ ├── sagemaker.md │ ├── serialization.md │ ├── task_summary.md │ ├── tasks │ │ ├── asr.md │ │ ├── audio_classification.md │ │ ├── document_question_answering.md │ │ ├── image_captioning.md │ │ ├── image_classification.md │ │ ├── language_modeling.md │ │ ├── masked_language_modeling.md │ │ ├── monocular_depth_estimation.md │ │ ├── multiple_choice.md │ │ ├── object_detection.md │ │ ├── question_answering.md │ │ ├── semantic_segmentation.md │ │ ├── sequence_classification.md │ │ ├── summarization.md │ │ ├── token_classification.md │ │ ├── translation.md │ │ ├── video_classification.md │ │ ├── visual_question_answering.md │ │ ├── zero_shot_image_classification.md │ │ └── zero_shot_object_detection.md │ ├── tasks_explained.md │ ├── testing.md │ ├── tf_xla.md │ ├── tflite.md │ ├── tokenizer_summary.md │ ├── torchscript.md │ ├── training.md │ ├── transformers_agents.md │ └── troubleshooting.md │ ├── ms │ ├── _toctree.yml │ └── index.md │ ├── pt │ ├── _config.py │ ├── _toctree.yml │ ├── accelerate.md │ ├── converting_tensorflow_models.md │ ├── create_a_model.md │ ├── custom_models.md │ ├── fast_tokenizers.md │ ├── index.md │ ├── installation.md │ ├── multilingual.md │ ├── pipeline_tutorial.md │ ├── quicktour.md │ ├── run_scripts.md │ ├── serialization.md │ ├── tasks │ │ ├── sequence_classification.md │ │ └── token_classification.md │ └── training.md │ ├── te │ ├── _toctree.yml │ ├── index.md │ └── quicktour.md │ ├── tr │ ├── _toctree.yml │ └── index.md │ └── zh │ ├── _toctree.yml │ ├── accelerate.md │ ├── add_new_pipeline.md │ ├── autoclass_tutorial.md │ ├── big_models.md │ ├── chat_templating.md │ ├── contributing.md │ ├── create_a_model.md │ ├── custom_models.md │ ├── debugging.md │ ├── fast_tokenizers.md │ ├── fsdp.md │ ├── hpo_train.md │ ├── index.md │ ├── installation.md │ ├── internal │ ├── audio_utils.md │ ├── file_utils.md │ ├── generation_utils.md │ ├── image_processing_utils.md │ ├── modeling_utils.md │ ├── pipelines_utils.md │ ├── time_series_utils.md │ ├── tokenization_utils.md │ └── trainer_utils.md │ ├── llm_tutorial.md │ ├── main_classes │ ├── agent.md │ ├── callback.md │ ├── configuration.md │ ├── data_collator.md │ ├── deepspeed.md │ ├── feature_extractor.md │ ├── image_processor.md │ ├── keras_callbacks.md │ ├── logging.md │ ├── model.md │ ├── onnx.md │ ├── optimizer_schedules.md │ ├── output.md │ ├── pipelines.md │ ├── processors.md │ ├── quantization.md │ ├── text_generation.md │ ├── tokenizer.md │ └── trainer.md │ ├── model_sharing.md │ ├── multilingual.md │ ├── peft.md │ ├── perf_hardware.md │ ├── perf_torch_compile.md │ ├── performance.md │ ├── pipeline_tutorial.md │ ├── preprocessing.md │ ├── quicktour.md │ ├── run_scripts.md │ ├── serialization.md │ ├── task_summary.md │ ├── tasks │ └── asr.md │ ├── tf_xla.md │ ├── tflite.md │ ├── tokenizer_summary.md │ ├── torchscript.md │ ├── training.md │ └── transformers_agents.md ├── examples ├── README.md ├── flax │ ├── README.md │ ├── _tests_requirements.txt │ ├── conftest.py │ ├── image-captioning │ │ ├── README.md │ │ ├── create_model_from_encoder_decoder_models.py │ │ └── run_image_captioning_flax.py │ ├── language-modeling │ │ ├── README.md │ │ ├── requirements.txt │ │ ├── run_bart_dlm_flax.py │ │ ├── run_clm_flax.py │ │ ├── run_mlm_flax.py │ │ ├── run_t5_mlm_flax.py │ │ └── t5_tokenizer_model.py │ ├── question-answering │ │ ├── README.md │ │ ├── requirements.txt │ │ ├── run_qa.py │ │ └── utils_qa.py │ ├── speech-recognition │ │ ├── README.md │ │ ├── requirements.txt │ │ └── run_flax_speech_recognition_seq2seq.py │ ├── summarization │ │ ├── README.md │ │ ├── requirements.txt │ │ └── run_summarization_flax.py │ ├── test_flax_examples.py │ ├── text-classification │ │ ├── README.md │ │ ├── requirements.txt │ │ └── run_flax_glue.py │ ├── token-classification │ │ ├── README.md │ │ ├── requirements.txt │ │ └── run_flax_ner.py │ └── vision │ │ ├── README.md │ │ ├── requirements.txt │ │ └── run_image_classification.py ├── legacy │ ├── README.md │ ├── benchmarking │ │ ├── README.md │ │ ├── plot_csv_file.py │ │ ├── requirements.txt │ │ └── run_benchmark.py │ ├── multiple_choice │ │ ├── run_multiple_choice.py │ │ └── utils_multiple_choice.py │ ├── pytorch-lightning │ │ ├── lightning_base.py │ │ ├── requirements.txt │ │ ├── run_glue.py │ │ ├── run_glue.sh │ │ ├── run_ner.py │ │ ├── run_ner.sh │ │ └── run_pos.sh │ ├── question-answering │ │ ├── README.md │ │ ├── run_squad.py │ │ └── run_squad_trainer.py │ ├── run_camembert.py │ ├── run_chinese_ref.py │ ├── run_language_modeling.py │ ├── run_openai_gpt.py │ ├── run_swag.py │ ├── run_transfo_xl.py │ ├── seq2seq │ │ ├── README.md │ │ ├── __init__.py │ │ ├── convert_model_to_fp16.py │ │ ├── download_wmt.py │ │ ├── finetune.sh │ │ ├── finetune_tpu.sh │ │ ├── finetune_trainer.py │ │ ├── minify_dataset.py │ │ ├── old_test_calculate_rouge.py │ │ ├── old_test_datasets.py │ │ ├── old_test_fsmt_bleu_score.py │ │ ├── old_test_seq2seq_examples.py │ │ ├── old_test_seq2seq_examples_multi_gpu.py │ │ ├── old_test_tatoeba_conversion.py │ │ ├── pack_dataset.py │ │ ├── requirements.txt │ │ ├── romanian_postprocessing.md │ │ ├── rouge_cli.py │ │ ├── run_distributed_eval.py │ │ ├── run_eval.py │ │ ├── run_eval_search.py │ │ ├── save_len_file.py │ │ ├── save_randomly_initialized_model.py │ │ ├── sentence_splitter.py │ │ ├── seq2seq_trainer.py │ │ ├── seq2seq_training_args.py │ │ ├── test_data │ │ │ ├── fsmt │ │ │ │ ├── build-eval-data.py │ │ │ │ └── fsmt_val_data.json │ │ │ └── wmt_en_ro │ │ │ │ ├── test.source │ │ │ │ ├── test.target │ │ │ │ ├── train.len │ │ │ │ ├── train.source │ │ │ │ ├── train.target │ │ │ │ ├── val.len │ │ │ │ ├── val.source │ │ │ │ └── val.target │ │ ├── train_distil_marian_enro.sh │ │ ├── train_distil_marian_enro_tpu.sh │ │ ├── train_distilbart_cnn.sh │ │ ├── train_mbart_cc25_enro.sh │ │ ├── utils.py │ │ └── xla_spawn.py │ └── token-classification │ │ ├── README.md │ │ ├── run.sh │ │ ├── run_chunk.sh │ │ ├── run_ner.py │ │ ├── run_pos.sh │ │ ├── scripts │ │ └── preprocess.py │ │ ├── tasks.py │ │ └── utils_ner.py ├── pytorch │ ├── README.md │ ├── _tests_requirements.txt │ ├── audio-classification │ │ ├── README.md │ │ ├── requirements.txt │ │ └── run_audio_classification.py │ ├── conftest.py │ ├── contrastive-image-text │ │ ├── README.md │ │ ├── requirements.txt │ │ └── run_clip.py │ ├── image-classification │ │ ├── README.md │ │ ├── requirements.txt │ │ ├── run_image_classification.py │ │ └── run_image_classification_no_trainer.py │ ├── image-pretraining │ │ ├── README.md │ │ ├── requirements.txt │ │ ├── run_mae.py │ │ ├── run_mim.py │ │ └── run_mim_no_trainer.py │ ├── language-modeling │ │ ├── README.md │ │ ├── requirements.txt │ │ ├── run_clm.py │ │ ├── run_clm_no_trainer.py │ │ ├── run_fim.py │ │ ├── run_fim_no_trainer.py │ │ ├── run_mlm.py │ │ ├── run_mlm_no_trainer.py │ │ └── run_plm.py │ ├── multiple-choice │ │ ├── README.md │ │ ├── requirements.txt │ │ ├── run_no_trainer.sh │ │ ├── run_swag.py │ │ └── run_swag_no_trainer.py │ ├── old_test_xla_examples.py │ ├── question-answering │ │ ├── README.md │ │ ├── requirements.txt │ │ ├── run_qa.py │ │ ├── run_qa_beam_search.py │ │ ├── run_qa_beam_search_no_trainer.py │ │ ├── run_qa_no_trainer.py │ │ ├── run_seq2seq_qa.py │ │ ├── trainer_qa.py │ │ ├── trainer_seq2seq_qa.py │ │ └── utils_qa.py │ ├── semantic-segmentation │ │ ├── README.md │ │ ├── requirements.txt │ │ ├── run_semantic_segmentation.py │ │ └── run_semantic_segmentation_no_trainer.py │ ├── speech-pretraining │ │ ├── README.md │ │ ├── requirements.txt │ │ └── run_wav2vec2_pretraining_no_trainer.py │ ├── speech-recognition │ │ ├── README.md │ │ ├── requirements.txt │ │ ├── run_speech_recognition_ctc.py │ │ ├── run_speech_recognition_ctc_adapter.py │ │ └── run_speech_recognition_seq2seq.py │ ├── summarization │ │ ├── README.md │ │ ├── requirements.txt │ │ ├── run_summarization.py │ │ └── run_summarization_no_trainer.py │ ├── test_accelerate_examples.py │ ├── test_pytorch_examples.py │ ├── text-classification │ │ ├── README.md │ │ ├── requirements.txt │ │ ├── run_classification.py │ │ ├── run_glue.py │ │ ├── run_glue_no_trainer.py │ │ └── run_xnli.py │ ├── text-generation │ │ ├── README.md │ │ ├── requirements.txt │ │ ├── run_generation.py │ │ └── run_generation_contrastive_search.py │ ├── token-classification │ │ ├── README.md │ │ ├── requirements.txt │ │ ├── run.sh │ │ ├── run_ner.py │ │ ├── run_ner_no_trainer.py │ │ └── run_no_trainer.sh │ ├── translation │ │ ├── README.md │ │ ├── requirements.txt │ │ ├── run_translation.py │ │ └── run_translation_no_trainer.py │ └── xla_spawn.py ├── research_projects │ ├── README.md │ ├── adversarial │ │ ├── README.md │ │ ├── requirements.txt │ │ ├── run_hans.py │ │ └── utils_hans.py │ ├── bert-loses-patience │ │ ├── README.md │ │ ├── pabee │ │ │ ├── __init__.py │ │ │ ├── modeling_pabee_albert.py │ │ │ └── modeling_pabee_bert.py │ │ ├── requirements.txt │ │ ├── run_glue_with_pabee.py │ │ └── test_run_glue_with_pabee.py │ ├── bertabs │ │ ├── README.md │ │ ├── __init__.py │ │ ├── configuration_bertabs.py │ │ ├── convert_bertabs_original_pytorch_checkpoint.py │ │ ├── modeling_bertabs.py │ │ ├── requirements.txt │ │ ├── run_summarization.py │ │ ├── test_utils_summarization.py │ │ └── utils_summarization.py │ ├── bertology │ │ ├── requirements.txt │ │ ├── run_bertology.py │ │ └── run_prune_gpt.py │ ├── codeparrot │ │ ├── README.md │ │ ├── examples │ │ │ ├── README.md │ │ │ ├── requirements.txt │ │ │ └── train_complexity_predictor.py │ │ ├── requirements.txt │ │ └── scripts │ │ │ ├── arguments.py │ │ │ ├── bpe_training.py │ │ │ ├── codeparrot_training.py │ │ │ ├── human_eval.py │ │ │ ├── initialize_model.py │ │ │ ├── minhash_deduplication.py │ │ │ ├── preprocessing.py │ │ │ ├── pretokenizing.py │ │ │ ├── tests │ │ │ ├── __init__.py │ │ │ └── test_deduplicate.py │ │ │ └── validation_loss.py │ ├── decision_transformer │ │ ├── requirements.txt │ │ └── run_decision_transformer.py │ ├── deebert │ │ ├── README.md │ │ ├── entropy_eval.sh │ │ ├── eval_deebert.sh │ │ ├── requirements.txt │ │ ├── run_glue_deebert.py │ │ ├── src │ │ │ ├── __init__.py │ │ │ ├── modeling_highway_bert.py │ │ │ └── modeling_highway_roberta.py │ │ ├── test_glue_deebert.py │ │ └── train_deebert.sh │ ├── distillation │ │ ├── README.md │ │ ├── distiller.py │ │ ├── grouped_batch_sampler.py │ │ ├── lm_seqs_dataset.py │ │ ├── requirements.txt │ │ ├── run_squad_w_distillation.py │ │ ├── scripts │ │ │ ├── binarized_data.py │ │ │ ├── extract.py │ │ │ ├── extract_distilbert.py │ │ │ └── token_counts.py │ │ ├── train.py │ │ ├── training_configs │ │ │ ├── distilbert-base-cased.json │ │ │ ├── distilbert-base-multilingual-cased.json │ │ │ ├── distilbert-base-uncased.json │ │ │ ├── distilgpt2.json │ │ │ └── distilroberta-base.json │ │ └── utils.py │ ├── fsner │ │ ├── README.md │ │ ├── pyproject.toml │ │ ├── requirements.txt │ │ ├── setup.py │ │ └── src │ │ │ └── fsner │ │ │ ├── __init__.py │ │ │ ├── model.py │ │ │ └── tokenizer_utils.py │ ├── information-gain-filtration │ │ ├── README.md │ │ ├── igf │ │ │ ├── __init__.py │ │ │ └── igf.py │ │ ├── requirements.txt │ │ ├── result_igf.png │ │ └── run_clm_igf.py │ ├── jax-projects │ │ ├── HOW_TO_PROPOSE_PROJECT.md │ │ ├── README.md │ │ ├── big_bird │ │ │ ├── README.md │ │ │ ├── bigbird_flax.py │ │ │ ├── evaluate.py │ │ │ ├── prepare_natural_questions.py │ │ │ ├── requirements.txt │ │ │ ├── sweep_flax.yaml │ │ │ └── train.py │ │ ├── dataset-streaming │ │ │ ├── README.md │ │ │ └── run_mlm_flax_stream.py │ │ ├── hybrid_clip │ │ │ ├── README.md │ │ │ ├── configuration_hybrid_clip.py │ │ │ ├── modeling_hybrid_clip.py │ │ │ ├── requirements.txt │ │ │ └── run_hybrid_clip.py │ │ ├── model_parallel │ │ │ ├── README.md │ │ │ ├── partitions.py │ │ │ └── run_clm_mp.py │ │ └── wav2vec2 │ │ │ ├── README.md │ │ │ └── run_wav2vec2_pretrain_flax.py │ ├── layoutlmv3 │ │ ├── README.md │ │ ├── requirements.txt │ │ └── run_funsd_cord.py │ ├── longform-qa │ │ ├── README.md │ │ ├── eli5_app.py │ │ ├── eli5_utils.py │ │ └── requirements.txt │ ├── luke │ │ ├── README.md │ │ ├── luke_utils.py │ │ └── run_luke_ner_no_trainer.py │ ├── lxmert │ │ ├── README.md │ │ ├── demo.ipynb │ │ ├── extracting_data.py │ │ ├── modeling_frcnn.py │ │ ├── processing_image.py │ │ ├── requirements.txt │ │ ├── utils.py │ │ └── visualizing_image.py │ ├── mlm_wwm │ │ ├── README.md │ │ ├── requirements.txt │ │ ├── run_chinese_ref.py │ │ └── run_mlm_wwm.py │ ├── mm-imdb │ │ ├── README.md │ │ ├── run_mmimdb.py │ │ └── utils_mmimdb.py │ ├── movement-pruning │ │ ├── README.md │ │ ├── Saving_PruneBERT.ipynb │ │ ├── bertarize.py │ │ ├── counts_parameters.py │ │ ├── emmental │ │ │ ├── __init__.py │ │ │ ├── configuration_bert_masked.py │ │ │ ├── modeling_bert_masked.py │ │ │ └── modules │ │ │ │ ├── __init__.py │ │ │ │ ├── binarizer.py │ │ │ │ └── masked_nn.py │ │ ├── masked_run_glue.py │ │ ├── masked_run_squad.py │ │ └── requirements.txt │ ├── onnx │ │ └── summarization │ │ │ ├── README.md │ │ │ ├── bart_onnx │ │ │ ├── generation_onnx.py │ │ │ └── reduce_onnx_size.py │ │ │ ├── requirements.txt │ │ │ └── run_onnx_exporter.py │ ├── performer │ │ ├── README.md │ │ ├── full_script.sh │ │ ├── modeling_flax_performer.py │ │ ├── modeling_flax_performer_utils.py │ │ ├── run_mlm_performer.py │ │ └── sanity_script.sh │ ├── pplm │ │ ├── README.md │ │ ├── imgs │ │ │ ├── headfigure.png │ │ │ └── wooly.png │ │ ├── pplm_classification_head.py │ │ ├── requirements.txt │ │ ├── run_pplm.py │ │ └── run_pplm_discrim_train.py │ ├── quantization-qdqbert │ │ ├── Dockerfile │ │ ├── README.md │ │ ├── evaluate-hf-trt-qa.py │ │ ├── ort-infer-benchmark.py │ │ ├── quant_trainer.py │ │ ├── run_quant_qa.py │ │ ├── trainer_quant_qa.py │ │ └── utils_qa.py │ ├── rag-end2end-retriever │ │ ├── README.md │ │ ├── callbacks_rag.py │ │ ├── distributed_ray_retriever.py │ │ ├── eval_rag.py │ │ ├── finetune_rag.py │ │ ├── finetune_rag_ray_end2end.sh │ │ ├── kb_encode_utils.py │ │ ├── lightning_base.py │ │ ├── requirements.txt │ │ ├── test_run │ │ │ ├── dummy-kb │ │ │ │ └── my_knowledge_dataset.csv │ │ │ ├── dummy-train-data │ │ │ │ ├── test.source │ │ │ │ ├── test.target │ │ │ │ ├── train.source │ │ │ │ ├── train.target │ │ │ │ ├── val.source │ │ │ │ └── val.target │ │ │ ├── test_finetune.sh │ │ │ └── test_rag_new_features.sh │ │ ├── use_own_knowledge_dataset.py │ │ └── utils_rag.py │ ├── rag │ │ ├── README.md │ │ ├── __init__.py │ │ ├── _test_finetune_rag.py │ │ ├── callbacks_rag.py │ │ ├── consolidate_rag_checkpoint.py │ │ ├── distributed_pytorch_retriever.py │ │ ├── distributed_ray_retriever.py │ │ ├── eval_rag.py │ │ ├── finetune_rag.py │ │ ├── finetune_rag.sh │ │ ├── finetune_rag_ray.sh │ │ ├── lightning_base.py │ │ ├── parse_dpr_relevance_data.py │ │ ├── requirements.txt │ │ ├── test_data │ │ │ └── my_knowledge_dataset.csv │ │ ├── test_distributed_retriever.py │ │ ├── use_own_knowledge_dataset.py │ │ └── utils_rag.py │ ├── robust-speech-event │ │ ├── README.md │ │ ├── eval.py │ │ ├── run_speech_recognition_ctc_bnb.py │ │ └── run_speech_recognition_ctc_streaming.py │ ├── self-training-text-classification │ │ ├── README.md │ │ ├── finetuning.py │ │ ├── requirements.txt │ │ ├── run.sh │ │ └── selftraining.py │ ├── seq2seq-distillation │ │ ├── README.md │ │ ├── _test_bash_script.py │ │ ├── _test_make_student.py │ │ ├── _test_seq2seq_examples.py │ │ ├── _test_seq2seq_examples_multi_gpu.py │ │ ├── callbacks.py │ │ ├── convert_pl_checkpoint_to_hf.py │ │ ├── distil_marian_enro_teacher.sh │ │ ├── distil_marian_no_teacher.sh │ │ ├── distillation.py │ │ ├── dynamic_bs_example.sh │ │ ├── finetune.py │ │ ├── finetune.sh │ │ ├── finetune_bart_tiny.sh │ │ ├── finetune_pegasus_xsum.sh │ │ ├── finetune_t5.sh │ │ ├── lightning_base.py │ │ ├── make_student.py │ │ ├── precomputed_pseudo_labels.md │ │ ├── requirements.txt │ │ ├── run_eval.py │ │ ├── sentence_splitter.py │ │ ├── train_distilbart_cnn.sh │ │ ├── train_distilbart_xsum.sh │ │ ├── train_mbart_cc25_enro.sh │ │ └── utils.py │ ├── tapex │ │ ├── README.md │ │ ├── requirements.txt │ │ ├── run_tabfact_with_tapex.py │ │ ├── run_wikisql_with_tapex.py │ │ ├── run_wikitablequestions_with_tapex.py │ │ └── wikisql_utils.py │ ├── visual_bert │ │ ├── README.md │ │ ├── demo.ipynb │ │ ├── extracting_data.py │ │ ├── modeling_frcnn.py │ │ ├── processing_image.py │ │ ├── requirements.txt │ │ ├── utils.py │ │ └── visualizing_image.py │ ├── vqgan-clip │ │ ├── README.md │ │ ├── VQGAN_CLIP.py │ │ ├── img_processing.py │ │ ├── loaders.py │ │ ├── requirements.txt │ │ └── utils.py │ ├── wav2vec2 │ │ ├── FINE_TUNE_XLSR_WAV2VEC2.md │ │ ├── README.md │ │ ├── alignment.py │ │ ├── ds_config_wav2vec2_zero2.json │ │ ├── ds_config_wav2vec2_zero3.json │ │ ├── finetune_base_100.sh │ │ ├── finetune_base_timit_asr.sh │ │ ├── finetune_large_lv60_100.sh │ │ ├── finetune_large_lv60_timit_asr.sh │ │ ├── finetune_large_xlsr_53_arabic_speech_corpus.sh │ │ ├── finetune_wav2vec2_xlsr_turkish.sh │ │ ├── requirements.txt │ │ ├── run_alignment.sh │ │ ├── run_asr.py │ │ ├── run_common_voice.py │ │ ├── run_pretrain.py │ │ ├── test_wav2vec2_deepspeed.py │ │ └── vocab │ │ │ └── buckwalter.json │ ├── xtreme-s │ │ ├── README.md │ │ ├── requirements.txt │ │ └── run_xtreme_s.py │ └── zero-shot-distillation │ │ ├── README.md │ │ └── distill_classifier.py ├── run_on_remote.py └── tensorflow │ ├── README.md │ ├── _tests_requirements.txt │ ├── benchmarking │ ├── README.md │ ├── plot_csv_file.py │ ├── requirements.txt │ └── run_benchmark_tf.py │ ├── contrastive-image-text │ ├── README.md │ ├── requirements.txt │ └── run_clip.py │ ├── image-classification │ ├── README.md │ ├── requirements.txt │ └── run_image_classification.py │ ├── language-modeling-tpu │ ├── README.md │ ├── prepare_tfrecord_shards.py │ ├── requirements.txt │ ├── run_mlm.py │ └── train_unigram.py │ ├── language-modeling │ ├── README.md │ ├── requirements.txt │ ├── run_clm.py │ └── run_mlm.py │ ├── multiple-choice │ ├── README.md │ ├── requirements.txt │ └── run_swag.py │ ├── question-answering │ ├── README.md │ ├── requirements.txt │ ├── run_qa.py │ └── utils_qa.py │ ├── summarization │ ├── README.md │ ├── requirements.txt │ └── run_summarization.py │ ├── test_tensorflow_examples.py │ ├── text-classification │ ├── README.md │ ├── requirements.txt │ ├── run_glue.py │ └── run_text_classification.py │ ├── token-classification │ ├── README.md │ ├── requirements.txt │ └── run_ner.py │ └── translation │ ├── README.md │ ├── requirements.txt │ └── run_translation.py ├── hubconf.py ├── model_cards └── README.md ├── notebooks └── README.md ├── pyproject.toml ├── scripts ├── benchmark │ └── trainer-benchmark.py ├── check_tokenizers.py ├── distributed │ └── torch-distributed-gpu-test.py ├── fsmt │ ├── convert-allenai-wmt16.sh │ ├── convert-allenai-wmt19.sh │ ├── convert-facebook-wmt19.sh │ ├── eval-allenai-wmt16.sh │ ├── eval-allenai-wmt19.sh │ ├── eval-facebook-wmt19.sh │ ├── fsmt-make-super-tiny-model.py │ ├── fsmt-make-tiny-model.py │ ├── gen-card-allenai-wmt16.py │ ├── gen-card-allenai-wmt19.py │ ├── gen-card-facebook-wmt19.py │ ├── s3-move.sh │ └── tests-to-run.sh ├── pegasus │ └── build_test_sample_spm_no_bos.py ├── stale.py └── tatoeba │ ├── README.md │ └── upload_models.sh ├── setup.py ├── src └── transformers │ ├── __init__.py │ ├── activations.py │ ├── activations_tf.py │ ├── audio_utils.py │ ├── benchmark │ ├── __init__.py │ ├── benchmark.py │ ├── benchmark_args.py │ ├── benchmark_args_tf.py │ ├── benchmark_args_utils.py │ ├── benchmark_tf.py │ └── benchmark_utils.py │ ├── cache_utils.py │ ├── commands │ ├── __init__.py │ ├── add_new_model.py │ ├── add_new_model_like.py │ ├── convert.py │ ├── download.py │ ├── env.py │ ├── lfs.py │ ├── pt_to_tf.py │ ├── run.py │ ├── serving.py │ ├── train.py │ ├── transformers_cli.py │ └── user.py │ ├── configuration_utils.py │ ├── convert_graph_to_onnx.py │ ├── convert_pytorch_checkpoint_to_tf2.py │ ├── convert_slow_tokenizer.py │ ├── convert_slow_tokenizers_checkpoints_to_fast.py │ ├── convert_tf_hub_seq_to_seq_bert_to_pytorch.py │ ├── data │ ├── __init__.py │ ├── data_collator.py │ ├── datasets │ │ ├── __init__.py │ │ ├── glue.py │ │ ├── language_modeling.py │ │ └── squad.py │ ├── metrics │ │ ├── __init__.py │ │ └── squad_metrics.py │ └── processors │ │ ├── __init__.py │ │ ├── glue.py │ │ ├── squad.py │ │ ├── utils.py │ │ └── xnli.py │ ├── debug_utils.py │ ├── deepspeed.py │ ├── dependency_versions_check.py │ ├── dependency_versions_table.py │ ├── dynamic_module_utils.py │ ├── feature_extraction_sequence_utils.py │ ├── feature_extraction_utils.py │ ├── file_utils.py │ ├── generation │ ├── __init__.py │ ├── beam_constraints.py │ ├── beam_search.py │ ├── candidate_generator.py │ ├── configuration_utils.py │ ├── flax_logits_process.py │ ├── flax_utils.py │ ├── logits_process.py │ ├── stopping_criteria.py │ ├── streamers.py │ ├── tf_logits_process.py │ ├── tf_utils.py │ └── utils.py │ ├── hf_argparser.py │ ├── hyperparameter_search.py │ ├── image_processing_utils.py │ ├── image_transforms.py │ ├── image_utils.py │ ├── integrations │ ├── __init__.py │ ├── aqlm.py │ ├── awq.py │ ├── bitsandbytes.py │ ├── deepspeed.py │ ├── integration_utils.py │ ├── peft.py │ ├── quanto.py │ └── tpu.py │ ├── keras_callbacks.py │ ├── kernels │ ├── deformable_detr │ │ ├── cpu │ │ │ ├── ms_deform_attn_cpu.cpp │ │ │ └── ms_deform_attn_cpu.h │ │ ├── cuda │ │ │ ├── ms_deform_attn_cuda.cu │ │ │ ├── ms_deform_attn_cuda.cuh │ │ │ ├── ms_deform_attn_cuda.h │ │ │ └── ms_deform_im2col_cuda.cuh │ │ ├── ms_deform_attn.h │ │ └── vision.cpp │ ├── deta │ │ ├── cpu │ │ │ ├── ms_deform_attn_cpu.cpp │ │ │ └── ms_deform_attn_cpu.h │ │ ├── cuda │ │ │ ├── ms_deform_attn_cuda.cu │ │ │ ├── ms_deform_attn_cuda.cuh │ │ │ ├── ms_deform_attn_cuda.h │ │ │ └── ms_deform_im2col_cuda.cuh │ │ ├── ms_deform_attn.h │ │ └── vision.cpp │ ├── mra │ │ ├── cuda_kernel.cu │ │ ├── cuda_kernel.h │ │ ├── cuda_launch.cu │ │ ├── cuda_launch.h │ │ └── torch_extension.cpp │ ├── rwkv │ │ ├── wkv_cuda.cu │ │ ├── wkv_cuda_bf16.cu │ │ └── wkv_op.cpp │ └── yoso │ │ ├── common.h │ │ ├── common_cuda.h │ │ ├── common_cuda_device.h │ │ ├── fast_lsh_cumulation.cu │ │ ├── fast_lsh_cumulation.h │ │ ├── fast_lsh_cumulation_cuda.cu │ │ ├── fast_lsh_cumulation_cuda.h │ │ └── fast_lsh_cumulation_torch.cpp │ ├── modelcard.py │ ├── modeling_attn_mask_utils.py │ ├── modeling_flax_outputs.py │ ├── modeling_flax_pytorch_utils.py │ ├── modeling_flax_utils.py │ ├── modeling_outputs.py │ ├── modeling_tf_outputs.py │ ├── modeling_tf_pytorch_utils.py │ ├── modeling_tf_utils.py │ ├── modeling_utils.py │ ├── models │ ├── __init__.py │ ├── albert │ │ ├── __init__.py │ │ ├── configuration_albert.py │ │ ├── convert_albert_original_tf_checkpoint_to_pytorch.py │ │ ├── modeling_albert.py │ │ ├── modeling_flax_albert.py │ │ ├── modeling_tf_albert.py │ │ ├── tokenization_albert.py │ │ └── tokenization_albert_fast.py │ ├── align │ │ ├── __init__.py │ │ ├── configuration_align.py │ │ ├── convert_align_tf_to_hf.py │ │ ├── modeling_align.py │ │ └── processing_align.py │ ├── altclip │ │ ├── __init__.py │ │ ├── configuration_altclip.py │ │ ├── modeling_altclip.py │ │ └── processing_altclip.py │ ├── audio_spectrogram_transformer │ │ ├── __init__.py │ │ ├── configuration_audio_spectrogram_transformer.py │ │ ├── convert_audio_spectrogram_transformer_original_to_pytorch.py │ │ ├── feature_extraction_audio_spectrogram_transformer.py │ │ └── modeling_audio_spectrogram_transformer.py │ ├── auto │ │ ├── __init__.py │ │ ├── auto_factory.py │ │ ├── configuration_auto.py │ │ ├── feature_extraction_auto.py │ │ ├── image_processing_auto.py │ │ ├── modeling_auto.py │ │ ├── modeling_flax_auto.py │ │ ├── modeling_tf_auto.py │ │ ├── processing_auto.py │ │ └── tokenization_auto.py │ ├── autoformer │ │ ├── __init__.py │ │ ├── configuration_autoformer.py │ │ └── modeling_autoformer.py │ ├── bark │ │ ├── __init__.py │ │ ├── configuration_bark.py │ │ ├── convert_suno_to_hf.py │ │ ├── generation_configuration_bark.py │ │ ├── modeling_bark.py │ │ └── processing_bark.py │ ├── bart │ │ ├── __init__.py │ │ ├── configuration_bart.py │ │ ├── convert_bart_original_pytorch_checkpoint_to_pytorch.py │ │ ├── modeling_bart.py │ │ ├── modeling_flax_bart.py │ │ ├── modeling_tf_bart.py │ │ ├── tokenization_bart.py │ │ └── tokenization_bart_fast.py │ ├── barthez │ │ ├── __init__.py │ │ ├── tokenization_barthez.py │ │ └── tokenization_barthez_fast.py │ ├── bartpho │ │ ├── __init__.py │ │ └── tokenization_bartpho.py │ ├── beit │ │ ├── __init__.py │ │ ├── configuration_beit.py │ │ ├── convert_beit_unilm_to_pytorch.py │ │ ├── feature_extraction_beit.py │ │ ├── image_processing_beit.py │ │ ├── modeling_beit.py │ │ └── modeling_flax_beit.py │ ├── bert │ │ ├── __init__.py │ │ ├── configuration_bert.py │ │ ├── convert_bert_original_tf2_checkpoint_to_pytorch.py │ │ ├── convert_bert_original_tf_checkpoint_to_pytorch.py │ │ ├── convert_bert_pytorch_checkpoint_to_original_tf.py │ │ ├── convert_bert_token_dropping_original_tf2_checkpoint_to_pytorch.py │ │ ├── modeling_bert.py │ │ ├── modeling_flax_bert.py │ │ ├── modeling_tf_bert.py │ │ ├── tokenization_bert.py │ │ ├── tokenization_bert_fast.py │ │ └── tokenization_bert_tf.py │ ├── bert_generation │ │ ├── __init__.py │ │ ├── configuration_bert_generation.py │ │ ├── modeling_bert_generation.py │ │ └── tokenization_bert_generation.py │ ├── bert_japanese │ │ ├── __init__.py │ │ └── tokenization_bert_japanese.py │ ├── bertweet │ │ ├── __init__.py │ │ └── tokenization_bertweet.py │ ├── big_bird │ │ ├── __init__.py │ │ ├── configuration_big_bird.py │ │ ├── convert_bigbird_original_tf_checkpoint_to_pytorch.py │ │ ├── modeling_big_bird.py │ │ ├── modeling_flax_big_bird.py │ │ ├── tokenization_big_bird.py │ │ └── tokenization_big_bird_fast.py │ ├── bigbird_pegasus │ │ ├── __init__.py │ │ ├── configuration_bigbird_pegasus.py │ │ ├── convert_bigbird_pegasus_tf_to_pytorch.py │ │ └── modeling_bigbird_pegasus.py │ ├── biogpt │ │ ├── __init__.py │ │ ├── configuration_biogpt.py │ │ ├── convert_biogpt_original_pytorch_checkpoint_to_pytorch.py │ │ ├── modeling_biogpt.py │ │ └── tokenization_biogpt.py │ ├── bit │ │ ├── __init__.py │ │ ├── configuration_bit.py │ │ ├── convert_bit_to_pytorch.py │ │ ├── image_processing_bit.py │ │ └── modeling_bit.py │ ├── blenderbot │ │ ├── __init__.py │ │ ├── configuration_blenderbot.py │ │ ├── convert_blenderbot_original_pytorch_checkpoint_to_pytorch.py │ │ ├── modeling_blenderbot.py │ │ ├── modeling_flax_blenderbot.py │ │ ├── modeling_tf_blenderbot.py │ │ ├── tokenization_blenderbot.py │ │ └── tokenization_blenderbot_fast.py │ ├── blenderbot_small │ │ ├── __init__.py │ │ ├── configuration_blenderbot_small.py │ │ ├── modeling_blenderbot_small.py │ │ ├── modeling_flax_blenderbot_small.py │ │ ├── modeling_tf_blenderbot_small.py │ │ ├── tokenization_blenderbot_small.py │ │ └── tokenization_blenderbot_small_fast.py │ ├── blip │ │ ├── __init__.py │ │ ├── configuration_blip.py │ │ ├── convert_blip_original_pytorch_to_hf.py │ │ ├── image_processing_blip.py │ │ ├── modeling_blip.py │ │ ├── modeling_blip_text.py │ │ ├── modeling_tf_blip.py │ │ ├── modeling_tf_blip_text.py │ │ └── processing_blip.py │ ├── blip_2 │ │ ├── __init__.py │ │ ├── configuration_blip_2.py │ │ ├── convert_blip_2_original_to_pytorch.py │ │ ├── modeling_blip_2.py │ │ └── processing_blip_2.py │ ├── bloom │ │ ├── __init__.py │ │ ├── configuration_bloom.py │ │ ├── convert_bloom_original_checkpoint_to_pytorch.py │ │ ├── modeling_bloom.py │ │ ├── modeling_flax_bloom.py │ │ └── tokenization_bloom_fast.py │ ├── bridgetower │ │ ├── __init__.py │ │ ├── configuration_bridgetower.py │ │ ├── image_processing_bridgetower.py │ │ ├── modeling_bridgetower.py │ │ └── processing_bridgetower.py │ ├── bros │ │ ├── __init__.py │ │ ├── configuration_bros.py │ │ ├── convert_bros_to_pytorch.py │ │ ├── modeling_bros.py │ │ └── processing_bros.py │ ├── byt5 │ │ ├── __init__.py │ │ ├── convert_byt5_original_tf_checkpoint_to_pytorch.py │ │ └── tokenization_byt5.py │ ├── camembert │ │ ├── __init__.py │ │ ├── configuration_camembert.py │ │ ├── modeling_camembert.py │ │ ├── modeling_tf_camembert.py │ │ ├── tokenization_camembert.py │ │ └── tokenization_camembert_fast.py │ ├── canine │ │ ├── __init__.py │ │ ├── configuration_canine.py │ │ ├── convert_canine_original_tf_checkpoint_to_pytorch.py │ │ ├── modeling_canine.py │ │ └── tokenization_canine.py │ ├── chinese_clip │ │ ├── __init__.py │ │ ├── configuration_chinese_clip.py │ │ ├── convert_chinese_clip_original_pytorch_to_hf.py │ │ ├── feature_extraction_chinese_clip.py │ │ ├── image_processing_chinese_clip.py │ │ ├── modeling_chinese_clip.py │ │ └── processing_chinese_clip.py │ ├── clap │ │ ├── __init__.py │ │ ├── configuration_clap.py │ │ ├── convert_clap_original_pytorch_to_hf.py │ │ ├── feature_extraction_clap.py │ │ ├── modeling_clap.py │ │ └── processing_clap.py │ ├── clip │ │ ├── __init__.py │ │ ├── configuration_clip.py │ │ ├── convert_clip_original_pytorch_to_hf.py │ │ ├── feature_extraction_clip.py │ │ ├── image_processing_clip.py │ │ ├── modeling_clip.py │ │ ├── modeling_flax_clip.py │ │ ├── modeling_tf_clip.py │ │ ├── processing_clip.py │ │ ├── tokenization_clip.py │ │ └── tokenization_clip_fast.py │ ├── clipseg │ │ ├── __init__.py │ │ ├── configuration_clipseg.py │ │ ├── convert_clipseg_original_pytorch_to_hf.py │ │ ├── modeling_clipseg.py │ │ └── processing_clipseg.py │ ├── clvp │ │ ├── __init__.py │ │ ├── configuration_clvp.py │ │ ├── convert_clvp_to_hf.py │ │ ├── feature_extraction_clvp.py │ │ ├── modeling_clvp.py │ │ ├── number_normalizer.py │ │ ├── processing_clvp.py │ │ └── tokenization_clvp.py │ ├── code_llama │ │ ├── __init__.py │ │ ├── tokenization_code_llama.py │ │ └── tokenization_code_llama_fast.py │ ├── codegen │ │ ├── __init__.py │ │ ├── configuration_codegen.py │ │ ├── modeling_codegen.py │ │ ├── tokenization_codegen.py │ │ └── tokenization_codegen_fast.py │ ├── cohere │ │ ├── __init__.py │ │ ├── configuration_cohere.py │ │ ├── modeling_cohere.py │ │ └── tokenization_cohere_fast.py │ ├── conditional_detr │ │ ├── __init__.py │ │ ├── configuration_conditional_detr.py │ │ ├── convert_conditional_detr_original_pytorch_checkpoint_to_pytorch.py │ │ ├── feature_extraction_conditional_detr.py │ │ ├── image_processing_conditional_detr.py │ │ └── modeling_conditional_detr.py │ ├── convbert │ │ ├── __init__.py │ │ ├── configuration_convbert.py │ │ ├── convert_convbert_original_tf1_checkpoint_to_pytorch_and_tf2.py │ │ ├── modeling_convbert.py │ │ ├── modeling_tf_convbert.py │ │ ├── tokenization_convbert.py │ │ └── tokenization_convbert_fast.py │ ├── convnext │ │ ├── __init__.py │ │ ├── configuration_convnext.py │ │ ├── convert_convnext_to_pytorch.py │ │ ├── feature_extraction_convnext.py │ │ ├── image_processing_convnext.py │ │ ├── modeling_convnext.py │ │ └── modeling_tf_convnext.py │ ├── convnextv2 │ │ ├── __init__.py │ │ ├── configuration_convnextv2.py │ │ ├── convert_convnextv2_to_pytorch.py │ │ ├── modeling_convnextv2.py │ │ └── modeling_tf_convnextv2.py │ ├── cpm │ │ ├── __init__.py │ │ ├── tokenization_cpm.py │ │ └── tokenization_cpm_fast.py │ ├── cpmant │ │ ├── __init__.py │ │ ├── configuration_cpmant.py │ │ ├── modeling_cpmant.py │ │ └── tokenization_cpmant.py │ ├── ctrl │ │ ├── __init__.py │ │ ├── configuration_ctrl.py │ │ ├── modeling_ctrl.py │ │ ├── modeling_tf_ctrl.py │ │ └── tokenization_ctrl.py │ ├── cvt │ │ ├── __init__.py │ │ ├── configuration_cvt.py │ │ ├── convert_cvt_original_pytorch_checkpoint_to_pytorch.py │ │ ├── modeling_cvt.py │ │ └── modeling_tf_cvt.py │ ├── data2vec │ │ ├── __init__.py │ │ ├── configuration_data2vec_audio.py │ │ ├── configuration_data2vec_text.py │ │ ├── configuration_data2vec_vision.py │ │ ├── convert_data2vec_audio_original_pytorch_checkpoint_to_pytorch.py │ │ ├── convert_data2vec_text_original_pytorch_checkpoint_to_pytorch.py │ │ ├── convert_data2vec_vision_original_pytorch_checkpoint_to_pytorch.py │ │ ├── modeling_data2vec_audio.py │ │ ├── modeling_data2vec_text.py │ │ ├── modeling_data2vec_vision.py │ │ └── modeling_tf_data2vec_vision.py │ ├── dbrx │ │ ├── __init__.py │ │ ├── configuration_dbrx.py │ │ └── modeling_dbrx.py │ ├── deberta │ │ ├── __init__.py │ │ ├── configuration_deberta.py │ │ ├── modeling_deberta.py │ │ ├── modeling_tf_deberta.py │ │ ├── tokenization_deberta.py │ │ └── tokenization_deberta_fast.py │ ├── deberta_v2 │ │ ├── __init__.py │ │ ├── configuration_deberta_v2.py │ │ ├── modeling_deberta_v2.py │ │ ├── modeling_tf_deberta_v2.py │ │ ├── tokenization_deberta_v2.py │ │ └── tokenization_deberta_v2_fast.py │ ├── decision_transformer │ │ ├── __init__.py │ │ ├── configuration_decision_transformer.py │ │ └── modeling_decision_transformer.py │ ├── deformable_detr │ │ ├── __init__.py │ │ ├── configuration_deformable_detr.py │ │ ├── convert_deformable_detr_to_pytorch.py │ │ ├── feature_extraction_deformable_detr.py │ │ ├── image_processing_deformable_detr.py │ │ ├── load_custom.py │ │ └── modeling_deformable_detr.py │ ├── deit │ │ ├── __init__.py │ │ ├── configuration_deit.py │ │ ├── convert_deit_timm_to_pytorch.py │ │ ├── feature_extraction_deit.py │ │ ├── image_processing_deit.py │ │ ├── modeling_deit.py │ │ └── modeling_tf_deit.py │ ├── deprecated │ │ ├── __init__.py │ │ ├── _archive_maps.py │ │ ├── bort │ │ │ ├── __init__.py │ │ │ └── convert_bort_original_gluonnlp_checkpoint_to_pytorch.py │ │ ├── mctct │ │ │ ├── __init__.py │ │ │ ├── configuration_mctct.py │ │ │ ├── feature_extraction_mctct.py │ │ │ ├── modeling_mctct.py │ │ │ └── processing_mctct.py │ │ ├── mmbt │ │ │ ├── __init__.py │ │ │ ├── configuration_mmbt.py │ │ │ └── modeling_mmbt.py │ │ ├── open_llama │ │ │ ├── __init__.py │ │ │ ├── configuration_open_llama.py │ │ │ └── modeling_open_llama.py │ │ ├── retribert │ │ │ ├── __init__.py │ │ │ ├── configuration_retribert.py │ │ │ ├── modeling_retribert.py │ │ │ ├── tokenization_retribert.py │ │ │ └── tokenization_retribert_fast.py │ │ ├── tapex │ │ │ ├── __init__.py │ │ │ └── tokenization_tapex.py │ │ ├── trajectory_transformer │ │ │ ├── __init__.py │ │ │ ├── configuration_trajectory_transformer.py │ │ │ ├── convert_trajectory_transformer_original_pytorch_checkpoint_to_pytorch.py │ │ │ └── modeling_trajectory_transformer.py │ │ ├── transfo_xl │ │ │ ├── __init__.py │ │ │ ├── configuration_transfo_xl.py │ │ │ ├── convert_transfo_xl_original_tf_checkpoint_to_pytorch.py │ │ │ ├── modeling_tf_transfo_xl.py │ │ │ ├── modeling_tf_transfo_xl_utilities.py │ │ │ ├── modeling_transfo_xl.py │ │ │ ├── modeling_transfo_xl_utilities.py │ │ │ └── tokenization_transfo_xl.py │ │ └── van │ │ │ ├── __init__.py │ │ │ ├── configuration_van.py │ │ │ ├── convert_van_to_pytorch.py │ │ │ └── modeling_van.py │ ├── depth_anything │ │ ├── __init__.py │ │ ├── configuration_depth_anything.py │ │ ├── convert_depth_anything_to_hf.py │ │ └── modeling_depth_anything.py │ ├── deta │ │ ├── __init__.py │ │ ├── configuration_deta.py │ │ ├── convert_deta_resnet_to_pytorch.py │ │ ├── convert_deta_swin_to_pytorch.py │ │ ├── image_processing_deta.py │ │ └── modeling_deta.py │ ├── detr │ │ ├── __init__.py │ │ ├── configuration_detr.py │ │ ├── convert_detr_original_pytorch_checkpoint_to_pytorch.py │ │ ├── convert_detr_to_pytorch.py │ │ ├── feature_extraction_detr.py │ │ ├── image_processing_detr.py │ │ └── modeling_detr.py │ ├── dialogpt │ │ ├── __init__.py │ │ └── convert_dialogpt_original_pytorch_checkpoint_to_pytorch.py │ ├── dinat │ │ ├── __init__.py │ │ ├── configuration_dinat.py │ │ └── modeling_dinat.py │ ├── dinov2 │ │ ├── __init__.py │ │ ├── configuration_dinov2.py │ │ ├── convert_dinov2_to_hf.py │ │ └── modeling_dinov2.py │ ├── distilbert │ │ ├── __init__.py │ │ ├── configuration_distilbert.py │ │ ├── modeling_distilbert.py │ │ ├── modeling_flax_distilbert.py │ │ ├── modeling_tf_distilbert.py │ │ ├── tokenization_distilbert.py │ │ └── tokenization_distilbert_fast.py │ ├── dit │ │ ├── __init__.py │ │ └── convert_dit_unilm_to_pytorch.py │ ├── donut │ │ ├── __init__.py │ │ ├── configuration_donut_swin.py │ │ ├── convert_donut_to_pytorch.py │ │ ├── feature_extraction_donut.py │ │ ├── image_processing_donut.py │ │ ├── modeling_donut_swin.py │ │ └── processing_donut.py │ ├── dpr │ │ ├── __init__.py │ │ ├── configuration_dpr.py │ │ ├── convert_dpr_original_checkpoint_to_pytorch.py │ │ ├── modeling_dpr.py │ │ ├── modeling_tf_dpr.py │ │ ├── tokenization_dpr.py │ │ └── tokenization_dpr_fast.py │ ├── dpt │ │ ├── __init__.py │ │ ├── configuration_dpt.py │ │ ├── convert_dinov2_depth_to_hf.py │ │ ├── convert_dpt_beit_to_hf.py │ │ ├── convert_dpt_hybrid_to_pytorch.py │ │ ├── convert_dpt_swinv2_to_hf.py │ │ ├── convert_dpt_to_pytorch.py │ │ ├── feature_extraction_dpt.py │ │ ├── image_processing_dpt.py │ │ └── modeling_dpt.py │ ├── efficientformer │ │ ├── __init__.py │ │ ├── configuration_efficientformer.py │ │ ├── convert_efficientformer_original_pytorch_checkpoint_to_pytorch.py │ │ ├── image_processing_efficientformer.py │ │ ├── modeling_efficientformer.py │ │ └── modeling_tf_efficientformer.py │ ├── efficientnet │ │ ├── __init__.py │ │ ├── configuration_efficientnet.py │ │ ├── convert_efficientnet_to_pytorch.py │ │ ├── image_processing_efficientnet.py │ │ └── modeling_efficientnet.py │ ├── electra │ │ ├── __init__.py │ │ ├── configuration_electra.py │ │ ├── convert_electra_original_tf_checkpoint_to_pytorch.py │ │ ├── modeling_electra.py │ │ ├── modeling_flax_electra.py │ │ ├── modeling_tf_electra.py │ │ ├── tokenization_electra.py │ │ └── tokenization_electra_fast.py │ ├── encodec │ │ ├── __init__.py │ │ ├── configuration_encodec.py │ │ ├── convert_encodec_checkpoint_to_pytorch.py │ │ ├── feature_extraction_encodec.py │ │ └── modeling_encodec.py │ ├── encoder_decoder │ │ ├── __init__.py │ │ ├── configuration_encoder_decoder.py │ │ ├── modeling_encoder_decoder.py │ │ ├── modeling_flax_encoder_decoder.py │ │ └── modeling_tf_encoder_decoder.py │ ├── ernie │ │ ├── __init__.py │ │ ├── configuration_ernie.py │ │ └── modeling_ernie.py │ ├── ernie_m │ │ ├── __init__.py │ │ ├── configuration_ernie_m.py │ │ ├── modeling_ernie_m.py │ │ └── tokenization_ernie_m.py │ ├── esm │ │ ├── __init__.py │ │ ├── configuration_esm.py │ │ ├── convert_esm.py │ │ ├── modeling_esm.py │ │ ├── modeling_esmfold.py │ │ ├── modeling_tf_esm.py │ │ ├── openfold_utils │ │ │ ├── __init__.py │ │ │ ├── chunk_utils.py │ │ │ ├── data_transforms.py │ │ │ ├── feats.py │ │ │ ├── loss.py │ │ │ ├── protein.py │ │ │ ├── residue_constants.py │ │ │ ├── rigid_utils.py │ │ │ └── tensor_utils.py │ │ └── tokenization_esm.py │ ├── falcon │ │ ├── __init__.py │ │ ├── configuration_falcon.py │ │ ├── convert_custom_code_checkpoint.py │ │ └── modeling_falcon.py │ ├── fastspeech2_conformer │ │ ├── __init__.py │ │ ├── configuration_fastspeech2_conformer.py │ │ ├── convert_fastspeech2_conformer_original_pytorch_checkpoint_to_pytorch.py │ │ ├── convert_hifigan.py │ │ ├── convert_model_with_hifigan.py │ │ ├── modeling_fastspeech2_conformer.py │ │ └── tokenization_fastspeech2_conformer.py │ ├── flaubert │ │ ├── __init__.py │ │ ├── configuration_flaubert.py │ │ ├── modeling_flaubert.py │ │ ├── modeling_tf_flaubert.py │ │ └── tokenization_flaubert.py │ ├── flava │ │ ├── __init__.py │ │ ├── configuration_flava.py │ │ ├── convert_dalle_to_flava_codebook.py │ │ ├── convert_flava_original_pytorch_to_hf.py │ │ ├── feature_extraction_flava.py │ │ ├── image_processing_flava.py │ │ ├── modeling_flava.py │ │ └── processing_flava.py │ ├── fnet │ │ ├── __init__.py │ │ ├── configuration_fnet.py │ │ ├── convert_fnet_original_flax_checkpoint_to_pytorch.py │ │ ├── modeling_fnet.py │ │ ├── tokenization_fnet.py │ │ └── tokenization_fnet_fast.py │ ├── focalnet │ │ ├── __init__.py │ │ ├── configuration_focalnet.py │ │ ├── convert_focalnet_to_hf_format.py │ │ └── modeling_focalnet.py │ ├── fsmt │ │ ├── __init__.py │ │ ├── configuration_fsmt.py │ │ ├── convert_fsmt_original_pytorch_checkpoint_to_pytorch.py │ │ ├── modeling_fsmt.py │ │ └── tokenization_fsmt.py │ ├── funnel │ │ ├── __init__.py │ │ ├── configuration_funnel.py │ │ ├── convert_funnel_original_tf_checkpoint_to_pytorch.py │ │ ├── modeling_funnel.py │ │ ├── modeling_tf_funnel.py │ │ ├── tokenization_funnel.py │ │ └── tokenization_funnel_fast.py │ ├── fuyu │ │ ├── __init__.py │ │ ├── configuration_fuyu.py │ │ ├── convert_fuyu_model_weights_to_hf.py │ │ ├── image_processing_fuyu.py │ │ ├── modeling_fuyu.py │ │ └── processing_fuyu.py │ ├── gemma │ │ ├── __init__.py │ │ ├── configuration_gemma.py │ │ ├── convert_gemma_weights_to_hf.py │ │ ├── modeling_flax_gemma.py │ │ ├── modeling_gemma.py │ │ ├── tokenization_gemma.py │ │ └── tokenization_gemma_fast.py │ ├── git │ │ ├── __init__.py │ │ ├── configuration_git.py │ │ ├── convert_git_to_pytorch.py │ │ ├── modeling_git.py │ │ └── processing_git.py │ ├── glpn │ │ ├── __init__.py │ │ ├── configuration_glpn.py │ │ ├── convert_glpn_to_pytorch.py │ │ ├── feature_extraction_glpn.py │ │ ├── image_processing_glpn.py │ │ └── modeling_glpn.py │ ├── gpt2 │ │ ├── CONVERSION.md │ │ ├── __init__.py │ │ ├── configuration_gpt2.py │ │ ├── convert_gpt2_original_tf_checkpoint_to_pytorch.py │ │ ├── modeling_flax_gpt2.py │ │ ├── modeling_gpt2.py │ │ ├── modeling_tf_gpt2.py │ │ ├── tokenization_gpt2.py │ │ ├── tokenization_gpt2_fast.py │ │ └── tokenization_gpt2_tf.py │ ├── gpt_bigcode │ │ ├── __init__.py │ │ ├── configuration_gpt_bigcode.py │ │ └── modeling_gpt_bigcode.py │ ├── gpt_neo │ │ ├── __init__.py │ │ ├── configuration_gpt_neo.py │ │ ├── convert_gpt_neo_mesh_tf_to_pytorch.py │ │ ├── modeling_flax_gpt_neo.py │ │ └── modeling_gpt_neo.py │ ├── gpt_neox │ │ ├── __init__.py │ │ ├── configuration_gpt_neox.py │ │ ├── modeling_gpt_neox.py │ │ └── tokenization_gpt_neox_fast.py │ ├── gpt_neox_japanese │ │ ├── __init__.py │ │ ├── configuration_gpt_neox_japanese.py │ │ ├── modeling_gpt_neox_japanese.py │ │ └── tokenization_gpt_neox_japanese.py │ ├── gpt_sw3 │ │ ├── __init__.py │ │ ├── convert_megatron_to_pytorch.py │ │ └── tokenization_gpt_sw3.py │ ├── gptj │ │ ├── __init__.py │ │ ├── configuration_gptj.py │ │ ├── modeling_flax_gptj.py │ │ ├── modeling_gptj.py │ │ └── modeling_tf_gptj.py │ ├── gptsan_japanese │ │ ├── __init__.py │ │ ├── configuration_gptsan_japanese.py │ │ ├── convert_gptsan_tf_checkpoint_to_pytorch.py │ │ ├── modeling_gptsan_japanese.py │ │ └── tokenization_gptsan_japanese.py │ ├── graphormer │ │ ├── __init__.py │ │ ├── algos_graphormer.pyx │ │ ├── collating_graphormer.py │ │ ├── configuration_graphormer.py │ │ └── modeling_graphormer.py │ ├── grounding_dino │ │ ├── __init__.py │ │ ├── configuration_grounding_dino.py │ │ ├── convert_grounding_dino_to_hf.py │ │ ├── image_processing_grounding_dino.py │ │ ├── modeling_grounding_dino.py │ │ └── processing_grounding_dino.py │ ├── groupvit │ │ ├── __init__.py │ │ ├── configuration_groupvit.py │ │ ├── convert_groupvit_nvlab_to_hf.py │ │ ├── modeling_groupvit.py │ │ └── modeling_tf_groupvit.py │ ├── herbert │ │ ├── __init__.py │ │ ├── tokenization_herbert.py │ │ └── tokenization_herbert_fast.py │ ├── hubert │ │ ├── __init__.py │ │ ├── configuration_hubert.py │ │ ├── convert_distilhubert_original_s3prl_checkpoint_to_pytorch.py │ │ ├── convert_hubert_original_pytorch_checkpoint_to_pytorch.py │ │ ├── convert_hubert_original_s3prl_checkpoint_to_pytorch.py │ │ ├── modeling_hubert.py │ │ └── modeling_tf_hubert.py │ ├── ibert │ │ ├── __init__.py │ │ ├── configuration_ibert.py │ │ ├── modeling_ibert.py │ │ └── quant_modules.py │ ├── idefics │ │ ├── __init__.py │ │ ├── configuration_idefics.py │ │ ├── image_processing_idefics.py │ │ ├── modeling_idefics.py │ │ ├── perceiver.py │ │ ├── processing_idefics.py │ │ └── vision.py │ ├── idefics2 │ │ ├── __init__.py │ │ ├── configuration_idefics2.py │ │ ├── convert_idefics2_weights_to_hf.py │ │ ├── image_processing_idefics2.py │ │ ├── modeling_idefics2.py │ │ └── processing_idefics2.py │ ├── imagegpt │ │ ├── __init__.py │ │ ├── configuration_imagegpt.py │ │ ├── convert_imagegpt_original_tf2_to_pytorch.py │ │ ├── feature_extraction_imagegpt.py │ │ ├── image_processing_imagegpt.py │ │ └── modeling_imagegpt.py │ ├── informer │ │ ├── __init__.py │ │ ├── configuration_informer.py │ │ └── modeling_informer.py │ ├── instructblip │ │ ├── __init__.py │ │ ├── configuration_instructblip.py │ │ ├── convert_instructblip_original_to_pytorch.py │ │ ├── modeling_instructblip.py │ │ └── processing_instructblip.py │ ├── jamba │ │ ├── __init__.py │ │ ├── configuration_jamba.py │ │ └── modeling_jamba.py │ ├── jukebox │ │ ├── __init__.py │ │ ├── configuration_jukebox.py │ │ ├── convert_jukebox.py │ │ ├── modeling_jukebox.py │ │ └── tokenization_jukebox.py │ ├── kosmos2 │ │ ├── __init__.py │ │ ├── configuration_kosmos2.py │ │ ├── convert_kosmos2_original_pytorch_checkpoint_to_pytorch.py │ │ ├── modeling_kosmos2.py │ │ └── processing_kosmos2.py │ ├── layoutlm │ │ ├── __init__.py │ │ ├── configuration_layoutlm.py │ │ ├── modeling_layoutlm.py │ │ ├── modeling_tf_layoutlm.py │ │ ├── tokenization_layoutlm.py │ │ └── tokenization_layoutlm_fast.py │ ├── layoutlmv2 │ │ ├── __init__.py │ │ ├── configuration_layoutlmv2.py │ │ ├── feature_extraction_layoutlmv2.py │ │ ├── image_processing_layoutlmv2.py │ │ ├── modeling_layoutlmv2.py │ │ ├── processing_layoutlmv2.py │ │ ├── tokenization_layoutlmv2.py │ │ └── tokenization_layoutlmv2_fast.py │ ├── layoutlmv3 │ │ ├── __init__.py │ │ ├── configuration_layoutlmv3.py │ │ ├── feature_extraction_layoutlmv3.py │ │ ├── image_processing_layoutlmv3.py │ │ ├── modeling_layoutlmv3.py │ │ ├── modeling_tf_layoutlmv3.py │ │ ├── processing_layoutlmv3.py │ │ ├── tokenization_layoutlmv3.py │ │ └── tokenization_layoutlmv3_fast.py │ ├── layoutxlm │ │ ├── __init__.py │ │ ├── processing_layoutxlm.py │ │ ├── tokenization_layoutxlm.py │ │ └── tokenization_layoutxlm_fast.py │ ├── led │ │ ├── __init__.py │ │ ├── configuration_led.py │ │ ├── modeling_led.py │ │ ├── modeling_tf_led.py │ │ ├── tokenization_led.py │ │ └── tokenization_led_fast.py │ ├── levit │ │ ├── __init__.py │ │ ├── configuration_levit.py │ │ ├── convert_levit_timm_to_pytorch.py │ │ ├── feature_extraction_levit.py │ │ ├── image_processing_levit.py │ │ └── modeling_levit.py │ ├── lilt │ │ ├── __init__.py │ │ ├── configuration_lilt.py │ │ └── modeling_lilt.py │ ├── llama │ │ ├── __init__.py │ │ ├── configuration_llama.py │ │ ├── convert_llama_weights_to_hf.py │ │ ├── modeling_flax_llama.py │ │ ├── modeling_llama.py │ │ ├── tokenization_llama.py │ │ └── tokenization_llama_fast.py │ ├── llava │ │ ├── __init__.py │ │ ├── configuration_llava.py │ │ ├── convert_llava_weights_to_hf.py │ │ ├── modeling_llava.py │ │ └── processing_llava.py │ ├── llava_next │ │ ├── __init__.py │ │ ├── configuration_llava_next.py │ │ ├── convert_llava_next_weights_to_hf.py │ │ ├── image_processing_llava_next.py │ │ ├── modeling_llava_next.py │ │ └── processing_llava_next.py │ ├── longformer │ │ ├── __init__.py │ │ ├── configuration_longformer.py │ │ ├── convert_longformer_original_pytorch_lightning_to_pytorch.py │ │ ├── modeling_longformer.py │ │ ├── modeling_tf_longformer.py │ │ ├── tokenization_longformer.py │ │ └── tokenization_longformer_fast.py │ ├── longt5 │ │ ├── __init__.py │ │ ├── configuration_longt5.py │ │ ├── convert_longt5x_checkpoint_to_flax.py │ │ ├── modeling_flax_longt5.py │ │ └── modeling_longt5.py │ ├── luke │ │ ├── __init__.py │ │ ├── configuration_luke.py │ │ ├── convert_luke_original_pytorch_checkpoint_to_pytorch.py │ │ ├── modeling_luke.py │ │ └── tokenization_luke.py │ ├── lxmert │ │ ├── __init__.py │ │ ├── configuration_lxmert.py │ │ ├── convert_lxmert_original_tf_checkpoint_to_pytorch.py │ │ ├── modeling_lxmert.py │ │ ├── modeling_tf_lxmert.py │ │ ├── tokenization_lxmert.py │ │ └── tokenization_lxmert_fast.py │ ├── m2m_100 │ │ ├── __init__.py │ │ ├── configuration_m2m_100.py │ │ ├── convert_m2m100_original_checkpoint_to_pytorch.py │ │ ├── modeling_m2m_100.py │ │ └── tokenization_m2m_100.py │ ├── mamba │ │ ├── __init__.py │ │ ├── configuration_mamba.py │ │ ├── convert_mamba_ssm_checkpoint_to_pytorch.py │ │ └── modeling_mamba.py │ ├── marian │ │ ├── __init__.py │ │ ├── configuration_marian.py │ │ ├── convert_marian_tatoeba_to_pytorch.py │ │ ├── convert_marian_to_pytorch.py │ │ ├── modeling_flax_marian.py │ │ ├── modeling_marian.py │ │ ├── modeling_tf_marian.py │ │ └── tokenization_marian.py │ ├── markuplm │ │ ├── __init__.py │ │ ├── configuration_markuplm.py │ │ ├── feature_extraction_markuplm.py │ │ ├── modeling_markuplm.py │ │ ├── processing_markuplm.py │ │ ├── tokenization_markuplm.py │ │ └── tokenization_markuplm_fast.py │ ├── mask2former │ │ ├── __init__.py │ │ ├── configuration_mask2former.py │ │ ├── convert_mask2former_original_pytorch_checkpoint_to_pytorch.py │ │ ├── image_processing_mask2former.py │ │ └── modeling_mask2former.py │ ├── maskformer │ │ ├── __init__.py │ │ ├── configuration_maskformer.py │ │ ├── configuration_maskformer_swin.py │ │ ├── convert_maskformer_original_pytorch_checkpoint_to_pytorch.py │ │ ├── convert_maskformer_resnet_to_pytorch.py │ │ ├── convert_maskformer_swin_to_pytorch.py │ │ ├── feature_extraction_maskformer.py │ │ ├── image_processing_maskformer.py │ │ ├── modeling_maskformer.py │ │ └── modeling_maskformer_swin.py │ ├── mbart │ │ ├── __init__.py │ │ ├── configuration_mbart.py │ │ ├── convert_mbart_original_checkpoint_to_pytorch.py │ │ ├── modeling_flax_mbart.py │ │ ├── modeling_mbart.py │ │ ├── modeling_tf_mbart.py │ │ ├── tokenization_mbart.py │ │ └── tokenization_mbart_fast.py │ ├── mbart50 │ │ ├── __init__.py │ │ ├── tokenization_mbart50.py │ │ └── tokenization_mbart50_fast.py │ ├── mega │ │ ├── __init__.py │ │ ├── configuration_mega.py │ │ ├── convert_mega_original_pytorch_checkpoint_to_pytorch.py │ │ └── modeling_mega.py │ ├── megatron_bert │ │ ├── __init__.py │ │ ├── configuration_megatron_bert.py │ │ ├── convert_megatron_bert_checkpoint.py │ │ └── modeling_megatron_bert.py │ ├── megatron_gpt2 │ │ ├── __init__.py │ │ ├── checkpoint_reshaping_and_interoperability.py │ │ └── convert_megatron_gpt2_checkpoint.py │ ├── mgp_str │ │ ├── __init__.py │ │ ├── configuration_mgp_str.py │ │ ├── modeling_mgp_str.py │ │ ├── processing_mgp_str.py │ │ └── tokenization_mgp_str.py │ ├── mistral │ │ ├── __init__.py │ │ ├── configuration_mistral.py │ │ ├── convert_mistral_weights_to_hf.py │ │ ├── modeling_flax_mistral.py │ │ └── modeling_mistral.py │ ├── mixtral │ │ ├── __init__.py │ │ ├── configuration_mixtral.py │ │ ├── convert_mixtral_weights_to_hf.py │ │ └── modeling_mixtral.py │ ├── mluke │ │ ├── __init__.py │ │ ├── convert_mluke_original_pytorch_checkpoint_to_pytorch.py │ │ └── tokenization_mluke.py │ ├── mobilebert │ │ ├── __init__.py │ │ ├── configuration_mobilebert.py │ │ ├── convert_mobilebert_original_tf_checkpoint_to_pytorch.py │ │ ├── modeling_mobilebert.py │ │ ├── modeling_tf_mobilebert.py │ │ ├── tokenization_mobilebert.py │ │ └── tokenization_mobilebert_fast.py │ ├── mobilenet_v1 │ │ ├── __init__.py │ │ ├── configuration_mobilenet_v1.py │ │ ├── convert_original_tf_checkpoint_to_pytorch.py │ │ ├── feature_extraction_mobilenet_v1.py │ │ ├── image_processing_mobilenet_v1.py │ │ └── modeling_mobilenet_v1.py │ ├── mobilenet_v2 │ │ ├── __init__.py │ │ ├── configuration_mobilenet_v2.py │ │ ├── convert_original_tf_checkpoint_to_pytorch.py │ │ ├── feature_extraction_mobilenet_v2.py │ │ ├── image_processing_mobilenet_v2.py │ │ └── modeling_mobilenet_v2.py │ ├── mobilevit │ │ ├── __init__.py │ │ ├── configuration_mobilevit.py │ │ ├── convert_mlcvnets_to_pytorch.py │ │ ├── feature_extraction_mobilevit.py │ │ ├── image_processing_mobilevit.py │ │ ├── modeling_mobilevit.py │ │ └── modeling_tf_mobilevit.py │ ├── mobilevitv2 │ │ ├── __init__.py │ │ ├── configuration_mobilevitv2.py │ │ ├── convert_mlcvnets_to_pytorch.py │ │ └── modeling_mobilevitv2.py │ ├── mpnet │ │ ├── __init__.py │ │ ├── configuration_mpnet.py │ │ ├── modeling_mpnet.py │ │ ├── modeling_tf_mpnet.py │ │ ├── tokenization_mpnet.py │ │ └── tokenization_mpnet_fast.py │ ├── mpt │ │ ├── __init__.py │ │ ├── configuration_mpt.py │ │ └── modeling_mpt.py │ ├── mra │ │ ├── __init__.py │ │ ├── configuration_mra.py │ │ ├── convert_mra_pytorch_to_pytorch.py │ │ └── modeling_mra.py │ ├── mt5 │ │ ├── __init__.py │ │ ├── configuration_mt5.py │ │ ├── modeling_flax_mt5.py │ │ ├── modeling_mt5.py │ │ └── modeling_tf_mt5.py │ ├── musicgen │ │ ├── __init__.py │ │ ├── configuration_musicgen.py │ │ ├── convert_musicgen_transformers.py │ │ ├── modeling_musicgen.py │ │ └── processing_musicgen.py │ ├── musicgen_melody │ │ ├── __init__.py │ │ ├── configuration_musicgen_melody.py │ │ ├── convert_musicgen_melody_transformers.py │ │ ├── feature_extraction_musicgen_melody.py │ │ ├── modeling_musicgen_melody.py │ │ └── processing_musicgen_melody.py │ ├── mvp │ │ ├── __init__.py │ │ ├── configuration_mvp.py │ │ ├── modeling_mvp.py │ │ ├── tokenization_mvp.py │ │ └── tokenization_mvp_fast.py │ ├── nat │ │ ├── __init__.py │ │ ├── configuration_nat.py │ │ └── modeling_nat.py │ ├── nezha │ │ ├── __init__.py │ │ ├── configuration_nezha.py │ │ └── modeling_nezha.py │ ├── nllb │ │ ├── __init__.py │ │ ├── tokenization_nllb.py │ │ └── tokenization_nllb_fast.py │ ├── nllb_moe │ │ ├── __init__.py │ │ ├── configuration_nllb_moe.py │ │ ├── convert_nllb_moe_sharded_original_checkpoint_to_pytorch.py │ │ └── modeling_nllb_moe.py │ ├── nougat │ │ ├── __init__.py │ │ ├── convert_nougat_to_hf.py │ │ ├── image_processing_nougat.py │ │ ├── processing_nougat.py │ │ └── tokenization_nougat_fast.py │ ├── nystromformer │ │ ├── __init__.py │ │ ├── configuration_nystromformer.py │ │ ├── convert_nystromformer_original_pytorch_checkpoint_to_pytorch.py │ │ └── modeling_nystromformer.py │ ├── olmo │ │ ├── __init__.py │ │ ├── configuration_olmo.py │ │ ├── convert_olmo_weights_to_hf.py │ │ └── modeling_olmo.py │ ├── oneformer │ │ ├── __init__.py │ │ ├── configuration_oneformer.py │ │ ├── convert_to_hf_oneformer.py │ │ ├── image_processing_oneformer.py │ │ ├── modeling_oneformer.py │ │ └── processing_oneformer.py │ ├── openai │ │ ├── __init__.py │ │ ├── configuration_openai.py │ │ ├── convert_openai_original_tf_checkpoint_to_pytorch.py │ │ ├── modeling_openai.py │ │ ├── modeling_tf_openai.py │ │ ├── tokenization_openai.py │ │ └── tokenization_openai_fast.py │ ├── opt │ │ ├── __init__.py │ │ ├── configuration_opt.py │ │ ├── convert_opt_original_pytorch_checkpoint_to_pytorch.py │ │ ├── modeling_flax_opt.py │ │ ├── modeling_opt.py │ │ └── modeling_tf_opt.py │ ├── owlv2 │ │ ├── __init__.py │ │ ├── configuration_owlv2.py │ │ ├── convert_owlv2_to_hf.py │ │ ├── image_processing_owlv2.py │ │ ├── modeling_owlv2.py │ │ └── processing_owlv2.py │ ├── owlvit │ │ ├── __init__.py │ │ ├── configuration_owlvit.py │ │ ├── convert_owlvit_original_flax_to_hf.py │ │ ├── feature_extraction_owlvit.py │ │ ├── image_processing_owlvit.py │ │ ├── modeling_owlvit.py │ │ └── processing_owlvit.py │ ├── patchtsmixer │ │ ├── __init__.py │ │ ├── configuration_patchtsmixer.py │ │ └── modeling_patchtsmixer.py │ ├── patchtst │ │ ├── __init__.py │ │ ├── configuration_patchtst.py │ │ └── modeling_patchtst.py │ ├── pegasus │ │ ├── __init__.py │ │ ├── configuration_pegasus.py │ │ ├── convert_pegasus_tf_to_pytorch.py │ │ ├── modeling_flax_pegasus.py │ │ ├── modeling_pegasus.py │ │ ├── modeling_tf_pegasus.py │ │ ├── tokenization_pegasus.py │ │ └── tokenization_pegasus_fast.py │ ├── pegasus_x │ │ ├── __init__.py │ │ ├── configuration_pegasus_x.py │ │ └── modeling_pegasus_x.py │ ├── perceiver │ │ ├── __init__.py │ │ ├── configuration_perceiver.py │ │ ├── convert_perceiver_haiku_to_pytorch.py │ │ ├── feature_extraction_perceiver.py │ │ ├── image_processing_perceiver.py │ │ ├── modeling_perceiver.py │ │ └── tokenization_perceiver.py │ ├── persimmon │ │ ├── __init__.py │ │ ├── configuration_persimmon.py │ │ ├── convert_persimmon_weights_to_hf.py │ │ └── modeling_persimmon.py │ ├── phi │ │ ├── __init__.py │ │ ├── configuration_phi.py │ │ ├── convert_phi_weights_to_hf.py │ │ └── modeling_phi.py │ ├── phobert │ │ ├── __init__.py │ │ └── tokenization_phobert.py │ ├── pix2struct │ │ ├── __init__.py │ │ ├── configuration_pix2struct.py │ │ ├── convert_pix2struct_original_pytorch_to_hf.py │ │ ├── image_processing_pix2struct.py │ │ ├── modeling_pix2struct.py │ │ └── processing_pix2struct.py │ ├── plbart │ │ ├── __init__.py │ │ ├── configuration_plbart.py │ │ ├── convert_plbart_original_checkpoint_to_torch.py │ │ ├── modeling_plbart.py │ │ └── tokenization_plbart.py │ ├── poolformer │ │ ├── __init__.py │ │ ├── configuration_poolformer.py │ │ ├── convert_poolformer_original_to_pytorch.py │ │ ├── feature_extraction_poolformer.py │ │ ├── image_processing_poolformer.py │ │ └── modeling_poolformer.py │ ├── pop2piano │ │ ├── __init__.py │ │ ├── configuration_pop2piano.py │ │ ├── convert_pop2piano_weights_to_hf.py │ │ ├── feature_extraction_pop2piano.py │ │ ├── modeling_pop2piano.py │ │ ├── processing_pop2piano.py │ │ └── tokenization_pop2piano.py │ ├── prophetnet │ │ ├── __init__.py │ │ ├── configuration_prophetnet.py │ │ ├── convert_prophetnet_original_pytorch_checkpoint_to_pytorch.py │ │ ├── modeling_prophetnet.py │ │ └── tokenization_prophetnet.py │ ├── pvt │ │ ├── __init__.py │ │ ├── configuration_pvt.py │ │ ├── convert_pvt_to_pytorch.py │ │ ├── image_processing_pvt.py │ │ └── modeling_pvt.py │ ├── pvt_v2 │ │ ├── __init__.py │ │ ├── configuration_pvt_v2.py │ │ ├── convert_pvt_v2_to_pytorch.py │ │ └── modeling_pvt_v2.py │ ├── qdqbert │ │ ├── __init__.py │ │ ├── configuration_qdqbert.py │ │ └── modeling_qdqbert.py │ ├── qwen2 │ │ ├── __init__.py │ │ ├── configuration_qwen2.py │ │ ├── modeling_qwen2.py │ │ ├── tokenization_qwen2.py │ │ └── tokenization_qwen2_fast.py │ ├── qwen2_moe │ │ ├── __init__.py │ │ ├── configuration_qwen2_moe.py │ │ └── modeling_qwen2_moe.py │ ├── rag │ │ ├── __init__.py │ │ ├── configuration_rag.py │ │ ├── modeling_rag.py │ │ ├── modeling_tf_rag.py │ │ ├── retrieval_rag.py │ │ └── tokenization_rag.py │ ├── realm │ │ ├── __init__.py │ │ ├── configuration_realm.py │ │ ├── modeling_realm.py │ │ ├── retrieval_realm.py │ │ ├── tokenization_realm.py │ │ └── tokenization_realm_fast.py │ ├── recurrent_gemma │ │ ├── __init__.py │ │ ├── configuration_recurrent_gemma.py │ │ ├── convert_recurrent_gemma_to_hf.py │ │ └── modeling_recurrent_gemma.py │ ├── reformer │ │ ├── __init__.py │ │ ├── configuration_reformer.py │ │ ├── convert_reformer_trax_checkpoint_to_pytorch.py │ │ ├── modeling_reformer.py │ │ ├── tokenization_reformer.py │ │ └── tokenization_reformer_fast.py │ ├── regnet │ │ ├── __init__.py │ │ ├── configuration_regnet.py │ │ ├── convert_regnet_seer_10b_to_pytorch.py │ │ ├── convert_regnet_to_pytorch.py │ │ ├── modeling_flax_regnet.py │ │ ├── modeling_regnet.py │ │ └── modeling_tf_regnet.py │ ├── rembert │ │ ├── __init__.py │ │ ├── configuration_rembert.py │ │ ├── convert_rembert_tf_checkpoint_to_pytorch.py │ │ ├── modeling_rembert.py │ │ ├── modeling_tf_rembert.py │ │ ├── tokenization_rembert.py │ │ └── tokenization_rembert_fast.py │ ├── resnet │ │ ├── __init__.py │ │ ├── configuration_resnet.py │ │ ├── convert_resnet_to_pytorch.py │ │ ├── modeling_flax_resnet.py │ │ ├── modeling_resnet.py │ │ └── modeling_tf_resnet.py │ ├── roberta │ │ ├── __init__.py │ │ ├── configuration_roberta.py │ │ ├── convert_roberta_original_pytorch_checkpoint_to_pytorch.py │ │ ├── modeling_flax_roberta.py │ │ ├── modeling_roberta.py │ │ ├── modeling_tf_roberta.py │ │ ├── tokenization_roberta.py │ │ └── tokenization_roberta_fast.py │ ├── roberta_prelayernorm │ │ ├── __init__.py │ │ ├── configuration_roberta_prelayernorm.py │ │ ├── convert_roberta_prelayernorm_original_pytorch_checkpoint_to_pytorch.py │ │ ├── modeling_flax_roberta_prelayernorm.py │ │ ├── modeling_roberta_prelayernorm.py │ │ └── modeling_tf_roberta_prelayernorm.py │ ├── roc_bert │ │ ├── __init__.py │ │ ├── configuration_roc_bert.py │ │ ├── modeling_roc_bert.py │ │ └── tokenization_roc_bert.py │ ├── roformer │ │ ├── __init__.py │ │ ├── configuration_roformer.py │ │ ├── convert_roformer_original_tf_checkpoint_to_pytorch.py │ │ ├── modeling_flax_roformer.py │ │ ├── modeling_roformer.py │ │ ├── modeling_tf_roformer.py │ │ ├── tokenization_roformer.py │ │ ├── tokenization_roformer_fast.py │ │ └── tokenization_utils.py │ ├── rwkv │ │ ├── __init__.py │ │ ├── configuration_rwkv.py │ │ ├── convert_rwkv_checkpoint_to_hf.py │ │ └── modeling_rwkv.py │ ├── sam │ │ ├── __init__.py │ │ ├── configuration_sam.py │ │ ├── convert_sam_to_hf.py │ │ ├── image_processing_sam.py │ │ ├── modeling_sam.py │ │ ├── modeling_tf_sam.py │ │ └── processing_sam.py │ ├── seamless_m4t │ │ ├── __init__.py │ │ ├── configuration_seamless_m4t.py │ │ ├── convert_fairseq2_to_hf.py │ │ ├── feature_extraction_seamless_m4t.py │ │ ├── modeling_seamless_m4t.py │ │ ├── processing_seamless_m4t.py │ │ ├── tokenization_seamless_m4t.py │ │ └── tokenization_seamless_m4t_fast.py │ ├── seamless_m4t_v2 │ │ ├── __init__.py │ │ ├── configuration_seamless_m4t_v2.py │ │ ├── convert_fairseq2_to_hf.py │ │ └── modeling_seamless_m4t_v2.py │ ├── segformer │ │ ├── __init__.py │ │ ├── configuration_segformer.py │ │ ├── convert_segformer_original_to_pytorch.py │ │ ├── feature_extraction_segformer.py │ │ ├── image_processing_segformer.py │ │ ├── modeling_segformer.py │ │ └── modeling_tf_segformer.py │ ├── seggpt │ │ ├── __init__.py │ │ ├── configuration_seggpt.py │ │ ├── convert_seggpt_to_hf.py │ │ ├── image_processing_seggpt.py │ │ └── modeling_seggpt.py │ ├── sew │ │ ├── __init__.py │ │ ├── configuration_sew.py │ │ ├── convert_sew_original_pytorch_checkpoint_to_pytorch.py │ │ └── modeling_sew.py │ ├── sew_d │ │ ├── __init__.py │ │ ├── configuration_sew_d.py │ │ ├── convert_sew_d_original_pytorch_checkpoint_to_pytorch.py │ │ └── modeling_sew_d.py │ ├── siglip │ │ ├── __init__.py │ │ ├── configuration_siglip.py │ │ ├── convert_siglip_to_hf.py │ │ ├── image_processing_siglip.py │ │ ├── modeling_siglip.py │ │ ├── processing_siglip.py │ │ └── tokenization_siglip.py │ ├── speech_encoder_decoder │ │ ├── __init__.py │ │ ├── configuration_speech_encoder_decoder.py │ │ ├── convert_mbart_wav2vec2_seq2seq_original_to_pytorch.py │ │ ├── convert_speech_to_text_wav2vec2_seq2seq_original_to_pytorch.py │ │ ├── modeling_flax_speech_encoder_decoder.py │ │ └── modeling_speech_encoder_decoder.py │ ├── speech_to_text │ │ ├── __init__.py │ │ ├── configuration_speech_to_text.py │ │ ├── convert_s2t_fairseq_to_tfms.py │ │ ├── feature_extraction_speech_to_text.py │ │ ├── modeling_speech_to_text.py │ │ ├── modeling_tf_speech_to_text.py │ │ ├── processing_speech_to_text.py │ │ └── tokenization_speech_to_text.py │ ├── speech_to_text_2 │ │ ├── __init__.py │ │ ├── configuration_speech_to_text_2.py │ │ ├── modeling_speech_to_text_2.py │ │ ├── processing_speech_to_text_2.py │ │ └── tokenization_speech_to_text_2.py │ ├── speecht5 │ │ ├── __init__.py │ │ ├── configuration_speecht5.py │ │ ├── convert_hifigan.py │ │ ├── convert_speecht5_original_pytorch_checkpoint_to_pytorch.py │ │ ├── feature_extraction_speecht5.py │ │ ├── modeling_speecht5.py │ │ ├── number_normalizer.py │ │ ├── processing_speecht5.py │ │ └── tokenization_speecht5.py │ ├── splinter │ │ ├── __init__.py │ │ ├── configuration_splinter.py │ │ ├── modeling_splinter.py │ │ ├── tokenization_splinter.py │ │ └── tokenization_splinter_fast.py │ ├── squeezebert │ │ ├── __init__.py │ │ ├── configuration_squeezebert.py │ │ ├── modeling_squeezebert.py │ │ ├── tokenization_squeezebert.py │ │ └── tokenization_squeezebert_fast.py │ ├── stablelm │ │ ├── __init__.py │ │ ├── configuration_stablelm.py │ │ └── modeling_stablelm.py │ ├── starcoder2 │ │ ├── __init__.py │ │ ├── configuration_starcoder2.py │ │ └── modeling_starcoder2.py │ ├── superpoint │ │ ├── __init__.py │ │ ├── configuration_superpoint.py │ │ ├── convert_superpoint_to_pytorch.py │ │ ├── image_processing_superpoint.py │ │ └── modeling_superpoint.py │ ├── swiftformer │ │ ├── __init__.py │ │ ├── configuration_swiftformer.py │ │ ├── convert_swiftformer_original_to_hf.py │ │ ├── modeling_swiftformer.py │ │ └── modeling_tf_swiftformer.py │ ├── swin │ │ ├── __init__.py │ │ ├── configuration_swin.py │ │ ├── convert_swin_simmim_to_pytorch.py │ │ ├── convert_swin_timm_to_pytorch.py │ │ ├── modeling_swin.py │ │ └── modeling_tf_swin.py │ ├── swin2sr │ │ ├── __init__.py │ │ ├── configuration_swin2sr.py │ │ ├── convert_swin2sr_original_to_pytorch.py │ │ ├── image_processing_swin2sr.py │ │ └── modeling_swin2sr.py │ ├── swinv2 │ │ ├── __init__.py │ │ ├── configuration_swinv2.py │ │ ├── convert_swinv2_timm_to_pytorch.py │ │ └── modeling_swinv2.py │ ├── switch_transformers │ │ ├── __init__.py │ │ ├── configuration_switch_transformers.py │ │ ├── convert_big_switch.py │ │ ├── convert_switch_transformers_original_flax_checkpoint_to_pytorch.py │ │ └── modeling_switch_transformers.py │ ├── t5 │ │ ├── __init__.py │ │ ├── configuration_t5.py │ │ ├── convert_t5_original_tf_checkpoint_to_pytorch.py │ │ ├── convert_t5x_checkpoint_to_flax.py │ │ ├── convert_t5x_checkpoint_to_pytorch.py │ │ ├── download_from_gcp.sh │ │ ├── modeling_flax_t5.py │ │ ├── modeling_t5.py │ │ ├── modeling_tf_t5.py │ │ ├── tokenization_t5.py │ │ └── tokenization_t5_fast.py │ ├── table_transformer │ │ ├── __init__.py │ │ ├── configuration_table_transformer.py │ │ ├── convert_table_transformer_to_hf.py │ │ ├── convert_table_transformer_to_hf_no_timm.py │ │ └── modeling_table_transformer.py │ ├── tapas │ │ ├── __init__.py │ │ ├── configuration_tapas.py │ │ ├── convert_tapas_original_tf_checkpoint_to_pytorch.py │ │ ├── modeling_tapas.py │ │ ├── modeling_tf_tapas.py │ │ └── tokenization_tapas.py │ ├── time_series_transformer │ │ ├── __init__.py │ │ ├── configuration_time_series_transformer.py │ │ └── modeling_time_series_transformer.py │ ├── timesformer │ │ ├── __init__.py │ │ ├── configuration_timesformer.py │ │ ├── convert_timesformer_to_pytorch.py │ │ └── modeling_timesformer.py │ ├── timm_backbone │ │ ├── __init__.py │ │ ├── configuration_timm_backbone.py │ │ └── modeling_timm_backbone.py │ ├── trocr │ │ ├── __init__.py │ │ ├── configuration_trocr.py │ │ ├── convert_trocr_unilm_to_pytorch.py │ │ ├── modeling_trocr.py │ │ └── processing_trocr.py │ ├── tvlt │ │ ├── __init__.py │ │ ├── configuration_tvlt.py │ │ ├── feature_extraction_tvlt.py │ │ ├── image_processing_tvlt.py │ │ ├── modeling_tvlt.py │ │ └── processing_tvlt.py │ ├── tvp │ │ ├── __init__.py │ │ ├── configuration_tvp.py │ │ ├── image_processing_tvp.py │ │ ├── modeling_tvp.py │ │ └── processing_tvp.py │ ├── udop │ │ ├── __init__.py │ │ ├── configuration_udop.py │ │ ├── convert_udop_to_hf.py │ │ ├── modeling_udop.py │ │ ├── processing_udop.py │ │ ├── tokenization_udop.py │ │ └── tokenization_udop_fast.py │ ├── umt5 │ │ ├── __init__.py │ │ ├── configuration_umt5.py │ │ ├── convert_umt5_checkpoint_to_pytorch.py │ │ └── modeling_umt5.py │ ├── unispeech │ │ ├── __init__.py │ │ ├── configuration_unispeech.py │ │ ├── convert_unispeech_original_pytorch_checkpoint_to_pytorch.py │ │ └── modeling_unispeech.py │ ├── unispeech_sat │ │ ├── __init__.py │ │ ├── configuration_unispeech_sat.py │ │ ├── convert_unispeech_original_s3prl_checkpoint_to_pytorch.py │ │ ├── convert_unispeech_sat_original_pytorch_checkpoint_to_pytorch.py │ │ └── modeling_unispeech_sat.py │ ├── univnet │ │ ├── __init__.py │ │ ├── configuration_univnet.py │ │ ├── convert_univnet.py │ │ ├── feature_extraction_univnet.py │ │ └── modeling_univnet.py │ ├── upernet │ │ ├── __init__.py │ │ ├── configuration_upernet.py │ │ ├── convert_convnext_upernet_to_pytorch.py │ │ ├── convert_swin_upernet_to_pytorch.py │ │ └── modeling_upernet.py │ ├── videomae │ │ ├── __init__.py │ │ ├── configuration_videomae.py │ │ ├── convert_videomae_to_pytorch.py │ │ ├── feature_extraction_videomae.py │ │ ├── image_processing_videomae.py │ │ └── modeling_videomae.py │ ├── vilt │ │ ├── __init__.py │ │ ├── configuration_vilt.py │ │ ├── convert_vilt_original_to_pytorch.py │ │ ├── feature_extraction_vilt.py │ │ ├── image_processing_vilt.py │ │ ├── modeling_vilt.py │ │ └── processing_vilt.py │ ├── vipllava │ │ ├── __init__.py │ │ ├── configuration_vipllava.py │ │ ├── convert_vipllava_weights_to_hf.py │ │ └── modeling_vipllava.py │ ├── vision_encoder_decoder │ │ ├── __init__.py │ │ ├── configuration_vision_encoder_decoder.py │ │ ├── modeling_flax_vision_encoder_decoder.py │ │ ├── modeling_tf_vision_encoder_decoder.py │ │ └── modeling_vision_encoder_decoder.py │ ├── vision_text_dual_encoder │ │ ├── __init__.py │ │ ├── configuration_vision_text_dual_encoder.py │ │ ├── modeling_flax_vision_text_dual_encoder.py │ │ ├── modeling_tf_vision_text_dual_encoder.py │ │ ├── modeling_vision_text_dual_encoder.py │ │ └── processing_vision_text_dual_encoder.py │ ├── visual_bert │ │ ├── __init__.py │ │ ├── configuration_visual_bert.py │ │ ├── convert_visual_bert_original_pytorch_checkpoint_to_pytorch.py │ │ └── modeling_visual_bert.py │ ├── vit │ │ ├── __init__.py │ │ ├── configuration_vit.py │ │ ├── convert_dino_to_pytorch.py │ │ ├── convert_vit_timm_to_pytorch.py │ │ ├── feature_extraction_vit.py │ │ ├── image_processing_vit.py │ │ ├── modeling_flax_vit.py │ │ ├── modeling_tf_vit.py │ │ └── modeling_vit.py │ ├── vit_hybrid │ │ ├── __init__.py │ │ ├── configuration_vit_hybrid.py │ │ ├── convert_vit_hybrid_timm_to_pytorch.py │ │ ├── image_processing_vit_hybrid.py │ │ └── modeling_vit_hybrid.py │ ├── vit_mae │ │ ├── __init__.py │ │ ├── configuration_vit_mae.py │ │ ├── convert_vit_mae_to_pytorch.py │ │ ├── modeling_tf_vit_mae.py │ │ └── modeling_vit_mae.py │ ├── vit_msn │ │ ├── __init__.py │ │ ├── configuration_vit_msn.py │ │ ├── convert_msn_to_pytorch.py │ │ └── modeling_vit_msn.py │ ├── vitdet │ │ ├── __init__.py │ │ ├── configuration_vitdet.py │ │ └── modeling_vitdet.py │ ├── vitmatte │ │ ├── __init__.py │ │ ├── configuration_vitmatte.py │ │ ├── convert_vitmatte_to_hf.py │ │ ├── image_processing_vitmatte.py │ │ └── modeling_vitmatte.py │ ├── vits │ │ ├── __init__.py │ │ ├── configuration_vits.py │ │ ├── convert_original_checkpoint.py │ │ ├── modeling_vits.py │ │ └── tokenization_vits.py │ ├── vivit │ │ ├── __init__.py │ │ ├── configuration_vivit.py │ │ ├── convert_vivit_flax_to_pytorch.py │ │ ├── image_processing_vivit.py │ │ └── modeling_vivit.py │ ├── wav2vec2 │ │ ├── __init__.py │ │ ├── configuration_wav2vec2.py │ │ ├── convert_wav2vec2_original_pytorch_checkpoint_to_pytorch.py │ │ ├── convert_wav2vec2_original_s3prl_checkpoint_to_pytorch.py │ │ ├── feature_extraction_wav2vec2.py │ │ ├── modeling_flax_wav2vec2.py │ │ ├── modeling_tf_wav2vec2.py │ │ ├── modeling_wav2vec2.py │ │ ├── processing_wav2vec2.py │ │ └── tokenization_wav2vec2.py │ ├── wav2vec2_bert │ │ ├── __init__.py │ │ ├── configuration_wav2vec2_bert.py │ │ ├── convert_wav2vec2_seamless_checkpoint.py │ │ ├── modeling_wav2vec2_bert.py │ │ └── processing_wav2vec2_bert.py │ ├── wav2vec2_conformer │ │ ├── __init__.py │ │ ├── configuration_wav2vec2_conformer.py │ │ ├── convert_wav2vec2_conformer_original_pytorch_checkpoint_to_pytorch.py │ │ └── modeling_wav2vec2_conformer.py │ ├── wav2vec2_phoneme │ │ ├── __init__.py │ │ └── tokenization_wav2vec2_phoneme.py │ ├── wav2vec2_with_lm │ │ ├── __init__.py │ │ └── processing_wav2vec2_with_lm.py │ ├── wavlm │ │ ├── __init__.py │ │ ├── configuration_wavlm.py │ │ ├── convert_wavlm_original_pytorch_checkpoint_to_pytorch.py │ │ ├── convert_wavlm_original_s3prl_checkpoint_to_pytorch.py │ │ └── modeling_wavlm.py │ ├── whisper │ │ ├── __init__.py │ │ ├── configuration_whisper.py │ │ ├── convert_openai_to_hf.py │ │ ├── english_normalizer.py │ │ ├── feature_extraction_whisper.py │ │ ├── generation_whisper.py │ │ ├── modeling_flax_whisper.py │ │ ├── modeling_tf_whisper.py │ │ ├── modeling_whisper.py │ │ ├── processing_whisper.py │ │ ├── tokenization_whisper.py │ │ └── tokenization_whisper_fast.py │ ├── x_clip │ │ ├── __init__.py │ │ ├── configuration_x_clip.py │ │ ├── convert_x_clip_original_pytorch_to_hf.py │ │ ├── modeling_x_clip.py │ │ └── processing_x_clip.py │ ├── xglm │ │ ├── __init__.py │ │ ├── configuration_xglm.py │ │ ├── convert_xglm_original_ckpt_to_trfms.py │ │ ├── modeling_flax_xglm.py │ │ ├── modeling_tf_xglm.py │ │ ├── modeling_xglm.py │ │ ├── tokenization_xglm.py │ │ └── tokenization_xglm_fast.py │ ├── xlm │ │ ├── __init__.py │ │ ├── configuration_xlm.py │ │ ├── convert_xlm_original_pytorch_checkpoint_to_pytorch.py │ │ ├── modeling_tf_xlm.py │ │ ├── modeling_xlm.py │ │ └── tokenization_xlm.py │ ├── xlm_prophetnet │ │ ├── __init__.py │ │ ├── configuration_xlm_prophetnet.py │ │ ├── modeling_xlm_prophetnet.py │ │ └── tokenization_xlm_prophetnet.py │ ├── xlm_roberta │ │ ├── __init__.py │ │ ├── configuration_xlm_roberta.py │ │ ├── modeling_flax_xlm_roberta.py │ │ ├── modeling_tf_xlm_roberta.py │ │ ├── modeling_xlm_roberta.py │ │ ├── tokenization_xlm_roberta.py │ │ └── tokenization_xlm_roberta_fast.py │ ├── xlm_roberta_xl │ │ ├── __init__.py │ │ ├── configuration_xlm_roberta_xl.py │ │ ├── convert_xlm_roberta_xl_original_pytorch_checkpoint_to_pytorch.py │ │ └── modeling_xlm_roberta_xl.py │ ├── xlnet │ │ ├── __init__.py │ │ ├── configuration_xlnet.py │ │ ├── convert_xlnet_original_tf_checkpoint_to_pytorch.py │ │ ├── modeling_tf_xlnet.py │ │ ├── modeling_xlnet.py │ │ ├── tokenization_xlnet.py │ │ └── tokenization_xlnet_fast.py │ ├── xmod │ │ ├── __init__.py │ │ ├── configuration_xmod.py │ │ ├── convert_xmod_original_pytorch_checkpoint_to_pytorch.py │ │ └── modeling_xmod.py │ ├── yolos │ │ ├── __init__.py │ │ ├── configuration_yolos.py │ │ ├── convert_yolos_to_pytorch.py │ │ ├── feature_extraction_yolos.py │ │ ├── image_processing_yolos.py │ │ └── modeling_yolos.py │ └── yoso │ │ ├── __init__.py │ │ ├── configuration_yoso.py │ │ ├── convert_yoso_pytorch_to_pytorch.py │ │ └── modeling_yoso.py │ ├── onnx │ ├── __init__.py │ ├── __main__.py │ ├── config.py │ ├── convert.py │ ├── features.py │ └── utils.py │ ├── optimization.py │ ├── optimization_tf.py │ ├── pipelines │ ├── __init__.py │ ├── audio_classification.py │ ├── audio_utils.py │ ├── automatic_speech_recognition.py │ ├── base.py │ ├── conversational.py │ ├── depth_estimation.py │ ├── document_question_answering.py │ ├── feature_extraction.py │ ├── fill_mask.py │ ├── image_classification.py │ ├── image_feature_extraction.py │ ├── image_segmentation.py │ ├── image_to_image.py │ ├── image_to_text.py │ ├── mask_generation.py │ ├── object_detection.py │ ├── pt_utils.py │ ├── question_answering.py │ ├── table_question_answering.py │ ├── text2text_generation.py │ ├── text_classification.py │ ├── text_generation.py │ ├── text_to_audio.py │ ├── token_classification.py │ ├── video_classification.py │ ├── visual_question_answering.py │ ├── zero_shot_audio_classification.py │ ├── zero_shot_classification.py │ ├── zero_shot_image_classification.py │ └── zero_shot_object_detection.py │ ├── processing_utils.py │ ├── pytorch_utils.py │ ├── quantizers │ ├── __init__.py │ ├── auto.py │ ├── base.py │ ├── quantizer_aqlm.py │ ├── quantizer_awq.py │ ├── quantizer_bnb_4bit.py │ ├── quantizer_bnb_8bit.py │ ├── quantizer_gptq.py │ ├── quantizer_quanto.py │ └── quantizers_utils.py │ ├── safetensors_conversion.py │ ├── sagemaker │ ├── __init__.py │ ├── trainer_sm.py │ └── training_args_sm.py │ ├── testing_utils.py │ ├── tf_utils.py │ ├── time_series_utils.py │ ├── tokenization_utils.py │ ├── tokenization_utils_base.py │ ├── tokenization_utils_fast.py │ ├── tools │ ├── __init__.py │ ├── agent_types.py │ ├── agents.py │ ├── base.py │ ├── document_question_answering.py │ ├── evaluate_agent.py │ ├── image_captioning.py │ ├── image_question_answering.py │ ├── image_segmentation.py │ ├── prompts.py │ ├── python_interpreter.py │ ├── speech_to_text.py │ ├── text_classification.py │ ├── text_question_answering.py │ ├── text_summarization.py │ ├── text_to_speech.py │ └── translation.py │ ├── trainer.py │ ├── trainer_callback.py │ ├── trainer_pt_utils.py │ ├── trainer_seq2seq.py │ ├── trainer_utils.py │ ├── training_args.py │ ├── training_args_seq2seq.py │ ├── training_args_tf.py │ └── utils │ ├── __init__.py │ ├── backbone_utils.py │ ├── bitsandbytes.py │ ├── constants.py │ ├── doc.py │ ├── dummy_detectron2_objects.py │ ├── dummy_essentia_and_librosa_and_pretty_midi_and_scipy_and_torch_objects.py │ ├── dummy_flax_objects.py │ ├── dummy_keras_nlp_objects.py │ ├── dummy_music_objects.py │ ├── dummy_pt_objects.py │ ├── dummy_sentencepiece_and_tokenizers_objects.py │ ├── dummy_sentencepiece_objects.py │ ├── dummy_speech_objects.py │ ├── dummy_tensorflow_text_objects.py │ ├── dummy_tf_objects.py │ ├── dummy_tokenizers_objects.py │ ├── dummy_torchaudio_objects.py │ ├── dummy_vision_objects.py │ ├── fx.py │ ├── generic.py │ ├── hp_naming.py │ ├── hub.py │ ├── import_utils.py │ ├── logging.py │ ├── model_parallel_utils.py │ ├── notebook.py │ ├── peft_utils.py │ ├── quantization_config.py │ ├── sentencepiece_model_pb2.py │ ├── sentencepiece_model_pb2_new.py │ └── versions.py ├── templates ├── adding_a_missing_tokenization_test │ ├── README.md │ ├── cookiecutter-template-{{cookiecutter.modelname}} │ │ └── test_tokenization_{{cookiecutter.lowercase_modelname}}.py │ └── cookiecutter.json ├── adding_a_new_example_script │ ├── README.md │ ├── cookiecutter.json │ └── {{cookiecutter.directory_name}} │ │ └── run_{{cookiecutter.example_shortcut}}.py └── adding_a_new_model │ ├── ADD_NEW_MODEL_PROPOSAL_TEMPLATE.md │ ├── README.md │ ├── cookiecutter-template-{{cookiecutter.modelname}} │ ├── __init__.py │ ├── configuration.json │ ├── configuration_{{cookiecutter.lowercase_modelname}}.py │ ├── modeling_flax_{{cookiecutter.lowercase_modelname}}.py │ ├── modeling_tf_{{cookiecutter.lowercase_modelname}}.py │ ├── modeling_{{cookiecutter.lowercase_modelname}}.py │ ├── test_modeling_flax_{{cookiecutter.lowercase_modelname}}.py │ ├── test_modeling_tf_{{cookiecutter.lowercase_modelname}}.py │ ├── test_modeling_{{cookiecutter.lowercase_modelname}}.py │ ├── to_replace_{{cookiecutter.lowercase_modelname}}.py │ ├── tokenization_fast_{{cookiecutter.lowercase_modelname}}.py │ ├── tokenization_{{cookiecutter.lowercase_modelname}}.py │ └── {{cookiecutter.lowercase_modelname}}.md │ ├── cookiecutter.json │ ├── open_model_proposals │ ├── ADD_BIG_BIRD.md │ └── README.md │ └── tests │ ├── encoder-bert-tokenizer.json │ ├── flax-encoder-bert-tokenizer.json │ ├── flax-seq-2-seq-bart-tokenizer.json │ ├── pt-encoder-bert-tokenizer.json │ ├── pt-seq-2-seq-bart-tokenizer.json │ ├── standalone.json │ ├── tf-encoder-bert-tokenizer.json │ └── tf-seq-2-seq-bart-tokenizer.json ├── tests ├── __init__.py ├── benchmark │ ├── __init__.py │ ├── test_benchmark.py │ └── test_benchmark_tf.py ├── bettertransformer │ ├── __init__.py │ └── test_integration.py ├── deepspeed │ ├── ds_config_zero2.json │ ├── ds_config_zero3.json │ ├── test_deepspeed.py │ ├── test_model_zoo.py │ └── vit_feature_extractor.json ├── extended │ └── test_trainer_ext.py ├── fixtures │ ├── add_distilbert_like_config.json │ ├── dummy-config.json │ ├── dummy_feature_extractor_config.json │ ├── empty.txt │ ├── input.txt │ ├── merges.txt │ ├── preprocessor_config.json │ ├── sample_text.txt │ ├── sample_text_no_unicode.txt │ ├── spiece.model │ ├── test_entity_vocab.json │ ├── test_sentencepiece.model │ ├── test_sentencepiece_bpe.model │ ├── test_sentencepiece_bpe_char.model │ ├── test_sentencepiece_no_bos.model │ ├── test_sentencepiece_with_bytefallback.model │ ├── tests_samples │ │ ├── .gitignore │ │ ├── COCO │ │ │ ├── 000000004016.png │ │ │ ├── 000000039769.png │ │ │ ├── coco_annotations.txt │ │ │ ├── coco_panoptic │ │ │ │ └── 000000039769.png │ │ │ └── coco_panoptic_annotations.txt │ │ ├── GermEval │ │ │ ├── dev.txt │ │ │ ├── labels.txt │ │ │ └── train.txt │ │ ├── MRPC │ │ │ ├── dev.csv │ │ │ ├── dev.tsv │ │ │ ├── train.csv │ │ │ └── train.tsv │ │ ├── SQUAD │ │ │ └── sample.json │ │ ├── STS-B │ │ │ ├── dev.tsv │ │ │ └── train.tsv │ │ ├── conll │ │ │ └── sample.json │ │ ├── swag │ │ │ └── sample.json │ │ ├── wiki_text │ │ │ └── wiki_00 │ │ ├── wmt16 │ │ │ └── sample.json │ │ ├── wmt_en_ro │ │ │ ├── test.json │ │ │ ├── train.json │ │ │ └── val.json │ │ └── xsum │ │ │ └── sample.json │ ├── vocab.json │ └── vocab.txt ├── fsdp │ └── test_fsdp.py ├── generation │ ├── __init__.py │ ├── test_beam_constraints.py │ ├── test_beam_search.py │ ├── test_configuration_utils.py │ ├── test_flax_logits_process.py │ ├── test_flax_utils.py │ ├── test_framework_agnostic.py │ ├── test_logits_process.py │ ├── test_stopping_criteria.py │ ├── test_streamers.py │ ├── test_tf_logits_process.py │ ├── test_tf_utils.py │ └── test_utils.py ├── models │ ├── __init__.py │ ├── albert │ │ ├── __init__.py │ │ ├── test_modeling_albert.py │ │ ├── test_modeling_flax_albert.py │ │ ├── test_modeling_tf_albert.py │ │ └── test_tokenization_albert.py │ ├── align │ │ ├── __init__.py │ │ ├── test_modeling_align.py │ │ └── test_processor_align.py │ ├── altclip │ │ ├── __init__.py │ │ └── test_modeling_altclip.py │ ├── audio_spectrogram_transformer │ │ ├── __init__.py │ │ ├── test_feature_extraction_audio_spectrogram_transformer.py │ │ └── test_modeling_audio_spectrogram_transformer.py │ ├── auto │ │ ├── __init__.py │ │ ├── test_configuration_auto.py │ │ ├── test_feature_extraction_auto.py │ │ ├── test_image_processing_auto.py │ │ ├── test_modeling_auto.py │ │ ├── test_modeling_flax_auto.py │ │ ├── test_modeling_tf_auto.py │ │ ├── test_modeling_tf_pytorch.py │ │ ├── test_processor_auto.py │ │ └── test_tokenization_auto.py │ ├── autoformer │ │ ├── __init__.py │ │ └── test_modeling_autoformer.py │ ├── bark │ │ ├── __init__.py │ │ ├── test_modeling_bark.py │ │ └── test_processor_bark.py │ ├── bart │ │ ├── __init__.py │ │ ├── test_modeling_bart.py │ │ ├── test_modeling_flax_bart.py │ │ ├── test_modeling_tf_bart.py │ │ └── test_tokenization_bart.py │ ├── barthez │ │ ├── __init__.py │ │ └── test_tokenization_barthez.py │ ├── bartpho │ │ ├── __init__.py │ │ └── test_tokenization_bartpho.py │ ├── beit │ │ ├── __init__.py │ │ ├── test_image_processing_beit.py │ │ ├── test_modeling_beit.py │ │ └── test_modeling_flax_beit.py │ ├── bert │ │ ├── __init__.py │ │ ├── test_modeling_bert.py │ │ ├── test_modeling_flax_bert.py │ │ ├── test_modeling_tf_bert.py │ │ ├── test_tokenization_bert.py │ │ └── test_tokenization_bert_tf.py │ ├── bert_generation │ │ ├── __init__.py │ │ ├── test_modeling_bert_generation.py │ │ └── test_tokenization_bert_generation.py │ ├── bert_japanese │ │ ├── __init__.py │ │ └── test_tokenization_bert_japanese.py │ ├── bertweet │ │ ├── __init__.py │ │ └── test_tokenization_bertweet.py │ ├── big_bird │ │ ├── __init__.py │ │ ├── test_modeling_big_bird.py │ │ ├── test_modeling_flax_big_bird.py │ │ └── test_tokenization_big_bird.py │ ├── bigbird_pegasus │ │ ├── __init__.py │ │ └── test_modeling_bigbird_pegasus.py │ ├── biogpt │ │ ├── __init__.py │ │ ├── test_modeling_biogpt.py │ │ └── test_tokenization_biogpt.py │ ├── bit │ │ ├── __init__.py │ │ └── test_modeling_bit.py │ ├── blenderbot │ │ ├── __init__.py │ │ ├── test_modeling_blenderbot.py │ │ ├── test_modeling_flax_blenderbot.py │ │ ├── test_modeling_tf_blenderbot.py │ │ └── test_tokenization_blenderbot.py │ ├── blenderbot_small │ │ ├── __init__.py │ │ ├── test_modeling_blenderbot_small.py │ │ ├── test_modeling_flax_blenderbot_small.py │ │ ├── test_modeling_tf_blenderbot_small.py │ │ └── test_tokenization_blenderbot_small.py │ ├── blip │ │ ├── __init__.py │ │ ├── test_image_processing_blip.py │ │ ├── test_modeling_blip.py │ │ ├── test_modeling_blip_text.py │ │ ├── test_modeling_tf_blip.py │ │ ├── test_modeling_tf_blip_text.py │ │ └── test_processor_blip.py │ ├── blip_2 │ │ ├── __init__.py │ │ ├── test_modeling_blip_2.py │ │ └── test_processor_blip_2.py │ ├── bloom │ │ ├── __init__.py │ │ ├── test_modeling_bloom.py │ │ ├── test_modeling_flax_bloom.py │ │ └── test_tokenization_bloom.py │ ├── bridgetower │ │ ├── __init__.py │ │ ├── test_image_processing_bridgetower.py │ │ └── test_modeling_bridgetower.py │ ├── bros │ │ ├── __init__.py │ │ └── test_modeling_bros.py │ ├── byt5 │ │ ├── __init__.py │ │ └── test_tokenization_byt5.py │ ├── camembert │ │ ├── __init__.py │ │ ├── test_modeling_camembert.py │ │ ├── test_modeling_tf_camembert.py │ │ └── test_tokenization_camembert.py │ ├── canine │ │ ├── __init__.py │ │ ├── test_modeling_canine.py │ │ └── test_tokenization_canine.py │ ├── chinese_clip │ │ ├── __init__.py │ │ ├── test_image_processing_chinese_clip.py │ │ ├── test_modeling_chinese_clip.py │ │ └── test_processor_chinese_clip.py │ ├── clap │ │ ├── __init__.py │ │ ├── test_feature_extraction_clap.py │ │ ├── test_modeling_clap.py │ │ └── test_processor_clap.py │ ├── clip │ │ ├── __init__.py │ │ ├── test_image_processing_clip.py │ │ ├── test_modeling_clip.py │ │ ├── test_modeling_flax_clip.py │ │ ├── test_modeling_tf_clip.py │ │ ├── test_processor_clip.py │ │ └── test_tokenization_clip.py │ ├── clipseg │ │ ├── __init__.py │ │ ├── test_modeling_clipseg.py │ │ └── test_processor_clipseg.py │ ├── clvp │ │ ├── __init__.py │ │ ├── test_feature_extraction_clvp.py │ │ ├── test_modeling_clvp.py │ │ ├── test_processor_clvp.py │ │ └── test_tokenization_clvp.py │ ├── code_llama │ │ ├── __init__.py │ │ └── test_tokenization_code_llama.py │ ├── codegen │ │ ├── __init__.py │ │ ├── test_modeling_codegen.py │ │ └── test_tokenization_codegen.py │ ├── cohere │ │ ├── __init__.py │ │ ├── test_modeling_cohere.py │ │ └── test_tokenization_cohere.py │ ├── conditional_detr │ │ ├── __init__.py │ │ ├── test_image_processing_conditional_detr.py │ │ └── test_modeling_conditional_detr.py │ ├── convbert │ │ ├── __init__.py │ │ ├── test_modeling_convbert.py │ │ └── test_modeling_tf_convbert.py │ ├── convnext │ │ ├── __init__.py │ │ ├── test_image_processing_convnext.py │ │ ├── test_modeling_convnext.py │ │ └── test_modeling_tf_convnext.py │ ├── convnextv2 │ │ ├── __init__.py │ │ ├── test_modeling_convnextv2.py │ │ └── test_modeling_tf_convnextv2.py │ ├── cpm │ │ ├── __init__.py │ │ └── test_tokenization_cpm.py │ ├── cpmant │ │ ├── __init__.py │ │ ├── test_modeling_cpmant.py │ │ └── test_tokenization_cpmant.py │ ├── ctrl │ │ ├── __init__.py │ │ ├── test_modeling_ctrl.py │ │ ├── test_modeling_tf_ctrl.py │ │ └── test_tokenization_ctrl.py │ ├── cvt │ │ ├── __init__.py │ │ ├── test_modeling_cvt.py │ │ └── test_modeling_tf_cvt.py │ ├── data2vec │ │ ├── __init__.py │ │ ├── test_modeling_data2vec_audio.py │ │ ├── test_modeling_data2vec_text.py │ │ ├── test_modeling_data2vec_vision.py │ │ └── test_modeling_tf_data2vec_vision.py │ ├── dbrx │ │ ├── __init__.py │ │ └── test_modeling_dbrx.py │ ├── deberta │ │ ├── __init__.py │ │ ├── test_modeling_deberta.py │ │ ├── test_modeling_tf_deberta.py │ │ └── test_tokenization_deberta.py │ ├── deberta_v2 │ │ ├── __init__.py │ │ ├── test_modeling_deberta_v2.py │ │ ├── test_modeling_tf_deberta_v2.py │ │ └── test_tokenization_deberta_v2.py │ ├── decision_transformer │ │ ├── __init__.py │ │ └── test_modeling_decision_transformer.py │ ├── deformable_detr │ │ ├── __init__.py │ │ ├── test_image_processing_deformable_detr.py │ │ └── test_modeling_deformable_detr.py │ ├── deit │ │ ├── __init__.py │ │ ├── test_image_processing_deit.py │ │ ├── test_modeling_deit.py │ │ └── test_modeling_tf_deit.py │ ├── depth_anything │ │ ├── __init__.py │ │ └── test_modeling_depth_anything.py │ ├── deta │ │ ├── __init__.py │ │ ├── test_image_processing_deta.py │ │ └── test_modeling_deta.py │ ├── detr │ │ ├── __init__.py │ │ ├── test_image_processing_detr.py │ │ └── test_modeling_detr.py │ ├── dinat │ │ ├── __init__.py │ │ └── test_modeling_dinat.py │ ├── dinov2 │ │ ├── __init__.py │ │ └── test_modeling_dinov2.py │ ├── distilbert │ │ ├── __init__.py │ │ ├── test_modeling_distilbert.py │ │ ├── test_modeling_flax_distilbert.py │ │ ├── test_modeling_tf_distilbert.py │ │ └── test_tokenization_distilbert.py │ ├── dit │ │ ├── __init__.py │ │ └── test_modeling_dit.py │ ├── donut │ │ ├── __init__.py │ │ ├── test_image_processing_donut.py │ │ ├── test_modeling_donut_swin.py │ │ └── test_processing_donut.py │ ├── dpr │ │ ├── __init__.py │ │ ├── test_modeling_dpr.py │ │ ├── test_modeling_tf_dpr.py │ │ └── test_tokenization_dpr.py │ ├── dpt │ │ ├── __init__.py │ │ ├── test_image_processing_dpt.py │ │ ├── test_modeling_dpt.py │ │ ├── test_modeling_dpt_auto_backbone.py │ │ └── test_modeling_dpt_hybrid.py │ ├── efficientformer │ │ ├── __init__.py │ │ ├── test_image_processing_efficientformer.py │ │ ├── test_modeling_efficientformer.py │ │ └── test_modeling_tf_efficientformer.py │ ├── efficientnet │ │ ├── __init__.py │ │ ├── test_image_processing_efficientnet.py │ │ └── test_modeling_efficientnet.py │ ├── electra │ │ ├── __init__.py │ │ ├── test_modeling_electra.py │ │ ├── test_modeling_flax_electra.py │ │ ├── test_modeling_tf_electra.py │ │ └── test_tokenization_electra.py │ ├── encodec │ │ ├── __init__.py │ │ ├── test_feature_extraction_encodec.py │ │ └── test_modeling_encodec.py │ ├── encoder_decoder │ │ ├── __init__.py │ │ ├── test_modeling_encoder_decoder.py │ │ ├── test_modeling_flax_encoder_decoder.py │ │ └── test_modeling_tf_encoder_decoder.py │ ├── ernie │ │ ├── __init__.py │ │ └── test_modeling_ernie.py │ ├── ernie_m │ │ ├── __init__.py │ │ ├── test_modeling_ernie_m.py │ │ └── test_tokenization_ernie_m.py │ ├── esm │ │ ├── __init__.py │ │ ├── test_modeling_esm.py │ │ ├── test_modeling_esmfold.py │ │ ├── test_modeling_tf_esm.py │ │ └── test_tokenization_esm.py │ ├── falcon │ │ ├── __init__.py │ │ └── test_modeling_falcon.py │ ├── fastspeech2_conformer │ │ ├── __init__.py │ │ ├── test_modeling_fastspeech2_conformer.py │ │ └── test_tokenization_fastspeech2_conformer.py │ ├── flaubert │ │ ├── __init__.py │ │ ├── test_modeling_flaubert.py │ │ └── test_modeling_tf_flaubert.py │ ├── flava │ │ ├── __init__.py │ │ ├── test_image_processing_flava.py │ │ ├── test_modeling_flava.py │ │ └── test_processor_flava.py │ ├── fnet │ │ ├── __init__.py │ │ ├── test_modeling_fnet.py │ │ └── test_tokenization_fnet.py │ ├── focalnet │ │ ├── __init__.py │ │ └── test_modeling_focalnet.py │ ├── fsmt │ │ ├── __init__.py │ │ ├── test_modeling_fsmt.py │ │ └── test_tokenization_fsmt.py │ ├── funnel │ │ ├── __init__.py │ │ ├── test_modeling_funnel.py │ │ ├── test_modeling_tf_funnel.py │ │ └── test_tokenization_funnel.py │ ├── fuyu │ │ ├── __init__.py │ │ ├── test_image_processing_fuyu.py │ │ ├── test_modeling_fuyu.py │ │ └── test_processing_fuyu.py │ ├── gemma │ │ ├── __init__.py │ │ ├── test_modeling_flax_gemma.py │ │ ├── test_modeling_gemma.py │ │ └── test_tokenization_gemma.py │ ├── git │ │ ├── __init__.py │ │ ├── test_modeling_git.py │ │ └── test_processor_git.py │ ├── glpn │ │ ├── __init__.py │ │ ├── test_image_processing_glpn.py │ │ └── test_modeling_glpn.py │ ├── gpt2 │ │ ├── __init__.py │ │ ├── test_modeling_flax_gpt2.py │ │ ├── test_modeling_gpt2.py │ │ ├── test_modeling_tf_gpt2.py │ │ ├── test_tokenization_gpt2.py │ │ └── test_tokenization_gpt2_tf.py │ ├── gpt_bigcode │ │ ├── __init__.py │ │ └── test_modeling_gpt_bigcode.py │ ├── gpt_neo │ │ ├── __init__.py │ │ ├── test_modeling_flax_gpt_neo.py │ │ └── test_modeling_gpt_neo.py │ ├── gpt_neox │ │ ├── __init__.py │ │ └── test_modeling_gpt_neox.py │ ├── gpt_neox_japanese │ │ ├── __init__.py │ │ ├── test_modeling_gpt_neox_japanese.py │ │ └── test_tokenization_gpt_neox_japanese.py │ ├── gpt_sw3 │ │ ├── __init__.py │ │ └── test_tokenization_gpt_sw3.py │ ├── gptj │ │ ├── __init__.py │ │ ├── test_modeling_flax_gptj.py │ │ ├── test_modeling_gptj.py │ │ └── test_modeling_tf_gptj.py │ ├── gptsan_japanese │ │ ├── __init__.py │ │ ├── test_modeling_gptsan_japanese.py │ │ └── test_tokenization_gptsan_japanese.py │ ├── graphormer │ │ ├── __init__.py │ │ └── test_modeling_graphormer.py │ ├── grounding_dino │ │ ├── __init__.py │ │ ├── test_image_processing_grounding_dino.py │ │ ├── test_modeling_grounding_dino.py │ │ └── test_processor_grounding_dino.py │ ├── groupvit │ │ ├── __init__.py │ │ ├── test_modeling_groupvit.py │ │ └── test_modeling_tf_groupvit.py │ ├── herbert │ │ ├── __init__.py │ │ └── test_tokenization_herbert.py │ ├── hubert │ │ ├── __init__.py │ │ ├── test_modeling_hubert.py │ │ └── test_modeling_tf_hubert.py │ ├── ibert │ │ ├── __init__.py │ │ └── test_modeling_ibert.py │ ├── idefics │ │ ├── __init__.py │ │ ├── test_image_processing_idefics.py │ │ ├── test_modeling_idefics.py │ │ └── test_processor_idefics.py │ ├── idefics2 │ │ ├── __init__.py │ │ ├── test_image_processing_idefics2.py │ │ ├── test_modeling_idefics2.py │ │ └── test_processing_idefics2.py │ ├── imagegpt │ │ ├── __init__.py │ │ ├── test_image_processing_imagegpt.py │ │ └── test_modeling_imagegpt.py │ ├── informer │ │ ├── __init__.py │ │ └── test_modeling_informer.py │ ├── instructblip │ │ ├── __init__.py │ │ ├── test_modeling_instructblip.py │ │ └── test_processor_instructblip.py │ ├── jamba │ │ ├── __init__.py │ │ └── test_modeling_jamba.py │ ├── jukebox │ │ ├── __init__.py │ │ ├── test_modeling_jukebox.py │ │ └── test_tokenization_jukebox.py │ ├── kosmos2 │ │ ├── __init__.py │ │ ├── test_modeling_kosmos2.py │ │ └── test_processor_kosmos2.py │ ├── layoutlm │ │ ├── __init__.py │ │ ├── test_modeling_layoutlm.py │ │ ├── test_modeling_tf_layoutlm.py │ │ └── test_tokenization_layoutlm.py │ ├── layoutlmv2 │ │ ├── __init__.py │ │ ├── test_image_processing_layoutlmv2.py │ │ ├── test_modeling_layoutlmv2.py │ │ ├── test_processor_layoutlmv2.py │ │ └── test_tokenization_layoutlmv2.py │ ├── layoutlmv3 │ │ ├── __init__.py │ │ ├── test_image_processing_layoutlmv3.py │ │ ├── test_modeling_layoutlmv3.py │ │ ├── test_modeling_tf_layoutlmv3.py │ │ ├── test_processor_layoutlmv3.py │ │ └── test_tokenization_layoutlmv3.py │ ├── layoutxlm │ │ ├── __init__.py │ │ ├── test_processor_layoutxlm.py │ │ └── test_tokenization_layoutxlm.py │ ├── led │ │ ├── __init__.py │ │ ├── test_modeling_led.py │ │ ├── test_modeling_tf_led.py │ │ └── test_tokenization_led.py │ ├── levit │ │ ├── __init__.py │ │ ├── test_image_processing_levit.py │ │ └── test_modeling_levit.py │ ├── lilt │ │ ├── __init__.py │ │ └── test_modeling_lilt.py │ ├── llama │ │ ├── __init__.py │ │ ├── test_modeling_flax_llama.py │ │ ├── test_modeling_llama.py │ │ └── test_tokenization_llama.py │ ├── llava │ │ ├── __init__.py │ │ └── test_modeling_llava.py │ ├── llava_next │ │ ├── __init__.py │ │ ├── test_image_processor_llava_next.py │ │ └── test_modeling_llava_next.py │ ├── longformer │ │ ├── __init__.py │ │ ├── test_modeling_longformer.py │ │ ├── test_modeling_tf_longformer.py │ │ └── test_tokenization_longformer.py │ ├── longt5 │ │ ├── __init__.py │ │ ├── test_modeling_flax_longt5.py │ │ └── test_modeling_longt5.py │ ├── luke │ │ ├── __init__.py │ │ ├── test_modeling_luke.py │ │ └── test_tokenization_luke.py │ ├── lxmert │ │ ├── __init__.py │ │ ├── test_modeling_lxmert.py │ │ ├── test_modeling_tf_lxmert.py │ │ └── test_tokenization_lxmert.py │ ├── m2m_100 │ │ ├── __init__.py │ │ ├── test_modeling_m2m_100.py │ │ └── test_tokenization_m2m_100.py │ ├── mamba │ │ ├── __init__.py │ │ └── test_modeling_mamba.py │ ├── marian │ │ ├── __init__.py │ │ ├── test_modeling_flax_marian.py │ │ ├── test_modeling_marian.py │ │ ├── test_modeling_tf_marian.py │ │ └── test_tokenization_marian.py │ ├── markuplm │ │ ├── __init__.py │ │ ├── test_feature_extraction_markuplm.py │ │ ├── test_modeling_markuplm.py │ │ ├── test_processor_markuplm.py │ │ └── test_tokenization_markuplm.py │ ├── mask2former │ │ ├── __init__.py │ │ ├── test_image_processing_mask2former.py │ │ └── test_modeling_mask2former.py │ ├── maskformer │ │ ├── __init__.py │ │ ├── test_image_processing_maskformer.py │ │ ├── test_modeling_maskformer.py │ │ └── test_modeling_maskformer_swin.py │ ├── mbart │ │ ├── __init__.py │ │ ├── test_modeling_flax_mbart.py │ │ ├── test_modeling_mbart.py │ │ ├── test_modeling_tf_mbart.py │ │ └── test_tokenization_mbart.py │ ├── mbart50 │ │ ├── __init__.py │ │ └── test_tokenization_mbart50.py │ ├── mega │ │ ├── __init__.py │ │ └── test_modeling_mega.py │ ├── megatron_bert │ │ ├── __init__.py │ │ └── test_modeling_megatron_bert.py │ ├── megatron_gpt2 │ │ ├── __init__.py │ │ └── test_modeling_megatron_gpt2.py │ ├── mgp_str │ │ ├── __init__.py │ │ ├── test_modeling_mgp_str.py │ │ ├── test_processor_mgp_str.py │ │ └── test_tokenization_mgp_str.py │ ├── mistral │ │ ├── __init__.py │ │ ├── test_modeling_flax_mistral.py │ │ └── test_modeling_mistral.py │ ├── mixtral │ │ ├── __init__.py │ │ └── test_modeling_mixtral.py │ ├── mluke │ │ ├── __init__.py │ │ └── test_tokenization_mluke.py │ ├── mobilebert │ │ ├── __init__.py │ │ ├── test_modeling_mobilebert.py │ │ ├── test_modeling_tf_mobilebert.py │ │ └── test_tokenization_mobilebert.py │ ├── mobilenet_v1 │ │ ├── __init__.py │ │ ├── test_image_processing_mobilenet_v1.py │ │ └── test_modeling_mobilenet_v1.py │ ├── mobilenet_v2 │ │ ├── __init__.py │ │ ├── test_image_processing_mobilenet_v2.py │ │ └── test_modeling_mobilenet_v2.py │ ├── mobilevit │ │ ├── __init__.py │ │ ├── test_image_processing_mobilevit.py │ │ ├── test_modeling_mobilevit.py │ │ └── test_modeling_tf_mobilevit.py │ ├── mobilevitv2 │ │ ├── __init__.py │ │ └── test_modeling_mobilevitv2.py │ ├── mpnet │ │ ├── __init__.py │ │ ├── test_modeling_mpnet.py │ │ ├── test_modeling_tf_mpnet.py │ │ └── test_tokenization_mpnet.py │ ├── mpt │ │ ├── __init__.py │ │ └── test_modeling_mpt.py │ ├── mra │ │ ├── __init__.py │ │ └── test_modeling_mra.py │ ├── mt5 │ │ ├── __init__.py │ │ ├── test_modeling_flax_mt5.py │ │ ├── test_modeling_mt5.py │ │ └── test_modeling_tf_mt5.py │ ├── musicgen │ │ ├── __init__.py │ │ ├── test_modeling_musicgen.py │ │ └── test_processing_musicgen.py │ ├── musicgen_melody │ │ ├── __init__.py │ │ ├── test_feature_extraction_musicgen_melody.py │ │ ├── test_modeling_musicgen_melody.py │ │ └── test_processor_musicgen_melody.py │ ├── mvp │ │ ├── __init__.py │ │ ├── test_modeling_mvp.py │ │ └── test_tokenization_mvp.py │ ├── nat │ │ ├── __init__.py │ │ └── test_modeling_nat.py │ ├── nezha │ │ ├── __init__.py │ │ └── test_modeling_nezha.py │ ├── nllb │ │ ├── __init__.py │ │ └── test_tokenization_nllb.py │ ├── nllb_moe │ │ ├── __init__.py │ │ └── test_modeling_nllb_moe.py │ ├── nougat │ │ ├── __init__.py │ │ ├── test_image_processing_nougat.py │ │ └── test_tokenization_nougat.py │ ├── nystromformer │ │ ├── __init__.py │ │ └── test_modeling_nystromformer.py │ ├── olmo │ │ ├── __init__.py │ │ └── test_modeling_olmo.py │ ├── oneformer │ │ ├── __init__.py │ │ ├── test_image_processing_oneformer.py │ │ ├── test_modeling_oneformer.py │ │ └── test_processor_oneformer.py │ ├── openai │ │ ├── __init__.py │ │ ├── test_modeling_openai.py │ │ ├── test_modeling_tf_openai.py │ │ └── test_tokenization_openai.py │ ├── opt │ │ ├── __init__.py │ │ ├── test_modeling_flax_opt.py │ │ ├── test_modeling_opt.py │ │ └── test_modeling_tf_opt.py │ ├── owlv2 │ │ ├── __init__.py │ │ ├── test_image_processor_owlv2.py │ │ └── test_modeling_owlv2.py │ ├── owlvit │ │ ├── __init__.py │ │ ├── test_image_processing_owlvit.py │ │ ├── test_modeling_owlvit.py │ │ └── test_processor_owlvit.py │ ├── patchtsmixer │ │ ├── __init__.py │ │ └── test_modeling_patchtsmixer.py │ ├── patchtst │ │ ├── __init__.py │ │ └── test_modeling_patchtst.py │ ├── pegasus │ │ ├── __init__.py │ │ ├── test_modeling_flax_pegasus.py │ │ ├── test_modeling_pegasus.py │ │ ├── test_modeling_tf_pegasus.py │ │ └── test_tokenization_pegasus.py │ ├── pegasus_x │ │ ├── __init__.py │ │ └── test_modeling_pegasus_x.py │ ├── perceiver │ │ ├── __init__.py │ │ ├── test_modeling_perceiver.py │ │ └── test_tokenization_perceiver.py │ ├── persimmon │ │ ├── __init__.py │ │ └── test_modeling_persimmon.py │ ├── phi │ │ ├── __init__.py │ │ └── test_modeling_phi.py │ ├── phobert │ │ ├── __init__.py │ │ └── test_tokenization_phobert.py │ ├── pix2struct │ │ ├── __init__.py │ │ ├── test_image_processing_pix2struct.py │ │ ├── test_modeling_pix2struct.py │ │ └── test_processor_pix2struct.py │ ├── plbart │ │ ├── __init__.py │ │ ├── test_modeling_plbart.py │ │ └── test_tokenization_plbart.py │ ├── poolformer │ │ ├── __init__.py │ │ ├── test_image_processing_poolformer.py │ │ └── test_modeling_poolformer.py │ ├── pop2piano │ │ ├── __init__.py │ │ ├── test_feature_extraction_pop2piano.py │ │ ├── test_modeling_pop2piano.py │ │ ├── test_processor_pop2piano.py │ │ └── test_tokenization_pop2piano.py │ ├── prophetnet │ │ ├── __init__.py │ │ ├── test_modeling_prophetnet.py │ │ └── test_tokenization_prophetnet.py │ ├── pvt │ │ ├── __init__.py │ │ ├── test_image_processing_pvt.py │ │ └── test_modeling_pvt.py │ ├── pvt_v2 │ │ ├── __init__.py │ │ └── test_modeling_pvt_v2.py │ ├── qdqbert │ │ ├── __init__.py │ │ └── test_modeling_qdqbert.py │ ├── qwen2 │ │ ├── __init__.py │ │ ├── test_modeling_qwen2.py │ │ └── test_tokenization_qwen2.py │ ├── qwen2_moe │ │ ├── __init__.py │ │ └── test_modeling_qwen2_moe.py │ ├── rag │ │ ├── __init__.py │ │ ├── test_modeling_rag.py │ │ ├── test_modeling_tf_rag.py │ │ ├── test_retrieval_rag.py │ │ └── test_tokenization_rag.py │ ├── realm │ │ ├── __init__.py │ │ ├── test_modeling_realm.py │ │ ├── test_retrieval_realm.py │ │ └── test_tokenization_realm.py │ ├── recurrent_gemma │ │ ├── __init__.py │ │ └── test_modeling_recurrent_gemma.py │ ├── reformer │ │ ├── __init__.py │ │ ├── test_modeling_reformer.py │ │ └── test_tokenization_reformer.py │ ├── regnet │ │ ├── __init__.py │ │ ├── test_modeling_flax_regnet.py │ │ ├── test_modeling_regnet.py │ │ └── test_modeling_tf_regnet.py │ ├── rembert │ │ ├── __init__.py │ │ ├── test_modeling_rembert.py │ │ ├── test_modeling_tf_rembert.py │ │ └── test_tokenization_rembert.py │ ├── resnet │ │ ├── __init__.py │ │ ├── test_modeling_flax_resnet.py │ │ ├── test_modeling_resnet.py │ │ └── test_modeling_tf_resnet.py │ ├── roberta │ │ ├── __init__.py │ │ ├── test_modeling_flax_roberta.py │ │ ├── test_modeling_roberta.py │ │ ├── test_modeling_tf_roberta.py │ │ └── test_tokenization_roberta.py │ ├── roberta_prelayernorm │ │ ├── __init__.py │ │ ├── test_modeling_flax_roberta_prelayernorm.py │ │ ├── test_modeling_roberta_prelayernorm.py │ │ └── test_modeling_tf_roberta_prelayernorm.py │ ├── roc_bert │ │ ├── __init__.py │ │ ├── test_modeling_roc_bert.py │ │ └── test_tokenization_roc_bert.py │ ├── roformer │ │ ├── __init__.py │ │ ├── test_modeling_flax_roformer.py │ │ ├── test_modeling_roformer.py │ │ ├── test_modeling_tf_roformer.py │ │ └── test_tokenization_roformer.py │ ├── rwkv │ │ ├── __init__.py │ │ └── test_modeling_rwkv.py │ ├── sam │ │ ├── __init__.py │ │ ├── test_modeling_sam.py │ │ ├── test_modeling_tf_sam.py │ │ └── test_processor_sam.py │ ├── seamless_m4t │ │ ├── __init__.py │ │ ├── test_feature_extraction_seamless_m4t.py │ │ ├── test_modeling_seamless_m4t.py │ │ ├── test_processor_seamless_m4t.py │ │ └── test_tokenization_seamless_m4t.py │ ├── seamless_m4t_v2 │ │ ├── __init__.py │ │ └── test_modeling_seamless_m4t_v2.py │ ├── segformer │ │ ├── __init__.py │ │ ├── test_image_processing_segformer.py │ │ ├── test_modeling_segformer.py │ │ └── test_modeling_tf_segformer.py │ ├── seggpt │ │ ├── __init__.py │ │ ├── test_image_processing_seggpt.py │ │ └── test_modeling_seggpt.py │ ├── sew │ │ ├── __init__.py │ │ └── test_modeling_sew.py │ ├── sew_d │ │ ├── __init__.py │ │ └── test_modeling_sew_d.py │ ├── siglip │ │ ├── __init__.py │ │ ├── test_image_processor_siglip.py │ │ ├── test_modeling_siglip.py │ │ └── test_tokenization_siglip.py │ ├── speech_encoder_decoder │ │ ├── __init__.py │ │ ├── test_modeling_flax_speech_encoder_decoder.py │ │ └── test_modeling_speech_encoder_decoder.py │ ├── speech_to_text │ │ ├── __init__.py │ │ ├── test_feature_extraction_speech_to_text.py │ │ ├── test_modeling_speech_to_text.py │ │ ├── test_modeling_tf_speech_to_text.py │ │ ├── test_processor_speech_to_text.py │ │ └── test_tokenization_speech_to_text.py │ ├── speech_to_text_2 │ │ ├── __init__.py │ │ ├── test_modeling_speech_to_text_2.py │ │ └── test_tokenization_speech_to_text_2.py │ ├── speecht5 │ │ ├── __init__.py │ │ ├── test_feature_extraction_speecht5.py │ │ ├── test_modeling_speecht5.py │ │ ├── test_processor_speecht5.py │ │ └── test_tokenization_speecht5.py │ ├── splinter │ │ ├── __init__.py │ │ └── test_modeling_splinter.py │ ├── squeezebert │ │ ├── __init__.py │ │ ├── test_modeling_squeezebert.py │ │ └── test_tokenization_squeezebert.py │ ├── stablelm │ │ ├── __init__.py │ │ └── test_modeling_stablelm.py │ ├── starcoder2 │ │ ├── __init__.py │ │ └── test_modeling_starcoder2.py │ ├── superpoint │ │ ├── __init__.py │ │ ├── test_image_processing_superpoint.py │ │ └── test_modeling_superpoint.py │ ├── swiftformer │ │ ├── __init__.py │ │ ├── test_modeling_swiftformer.py │ │ └── test_modeling_tf_swiftformer.py │ ├── swin │ │ ├── __init__.py │ │ ├── test_modeling_swin.py │ │ └── test_modeling_tf_swin.py │ ├── swin2sr │ │ ├── __init__.py │ │ ├── test_image_processing_swin2sr.py │ │ └── test_modeling_swin2sr.py │ ├── swinv2 │ │ ├── __init__.py │ │ └── test_modeling_swinv2.py │ ├── switch_transformers │ │ ├── __init__.py │ │ └── test_modeling_switch_transformers.py │ ├── t5 │ │ ├── __init__.py │ │ ├── test_modeling_flax_t5.py │ │ ├── test_modeling_t5.py │ │ ├── test_modeling_tf_t5.py │ │ └── test_tokenization_t5.py │ ├── table_transformer │ │ ├── __init__.py │ │ └── test_modeling_table_transformer.py │ ├── tapas │ │ ├── __init__.py │ │ ├── test_modeling_tapas.py │ │ ├── test_modeling_tf_tapas.py │ │ └── test_tokenization_tapas.py │ ├── time_series_transformer │ │ ├── __init__.py │ │ └── test_modeling_time_series_transformer.py │ ├── timesformer │ │ ├── __init__.py │ │ └── test_modeling_timesformer.py │ ├── timm_backbone │ │ ├── __init__.py │ │ └── test_modeling_timm_backbone.py │ ├── trocr │ │ ├── __init__.py │ │ └── test_modeling_trocr.py │ ├── tvlt │ │ ├── __init__.py │ │ ├── test_feature_extraction_tvlt.py │ │ ├── test_image_processor_tvlt.py │ │ ├── test_modeling_tvlt.py │ │ └── test_processor_tvlt.py │ ├── tvp │ │ ├── __init__.py │ │ ├── test_image_processing_tvp.py │ │ └── test_modeling_tvp.py │ ├── udop │ │ ├── __init__.py │ │ ├── test_modeling_udop.py │ │ ├── test_processor_udop.py │ │ └── test_tokenization_udop.py │ ├── umt5 │ │ ├── __init__.py │ │ └── test_modeling_umt5.py │ ├── unispeech │ │ ├── __init__.py │ │ └── test_modeling_unispeech.py │ ├── unispeech_sat │ │ ├── __init__.py │ │ └── test_modeling_unispeech_sat.py │ ├── univnet │ │ ├── __init__.py │ │ ├── test_feature_extraction_univnet.py │ │ └── test_modeling_univnet.py │ ├── upernet │ │ ├── __init__.py │ │ └── test_modeling_upernet.py │ ├── videomae │ │ ├── __init__.py │ │ ├── test_image_processing_videomae.py │ │ └── test_modeling_videomae.py │ ├── vilt │ │ ├── __init__.py │ │ ├── test_image_processing_vilt.py │ │ └── test_modeling_vilt.py │ ├── vipllava │ │ ├── __init__.py │ │ └── test_modeling_vipllava.py │ ├── vision_encoder_decoder │ │ ├── __init__.py │ │ ├── test_modeling_flax_vision_encoder_decoder.py │ │ ├── test_modeling_tf_vision_encoder_decoder.py │ │ └── test_modeling_vision_encoder_decoder.py │ ├── vision_text_dual_encoder │ │ ├── __init__.py │ │ ├── test_modeling_flax_vision_text_dual_encoder.py │ │ ├── test_modeling_tf_vision_text_dual_encoder.py │ │ ├── test_modeling_vision_text_dual_encoder.py │ │ └── test_processor_vision_text_dual_encoder.py │ ├── visual_bert │ │ ├── __init__.py │ │ └── test_modeling_visual_bert.py │ ├── vit │ │ ├── __init__.py │ │ ├── test_image_processing_vit.py │ │ ├── test_modeling_flax_vit.py │ │ ├── test_modeling_tf_vit.py │ │ └── test_modeling_vit.py │ ├── vit_hybrid │ │ ├── __init__.py │ │ └── test_modeling_vit_hybrid.py │ ├── vit_mae │ │ ├── __init__.py │ │ ├── test_modeling_tf_vit_mae.py │ │ └── test_modeling_vit_mae.py │ ├── vit_msn │ │ ├── __init__.py │ │ └── test_modeling_vit_msn.py │ ├── vitdet │ │ ├── __init__.py │ │ └── test_modeling_vitdet.py │ ├── vitmatte │ │ ├── __init__.py │ │ ├── test_image_processing_vitmatte.py │ │ └── test_modeling_vitmatte.py │ ├── vits │ │ ├── __init__.py │ │ ├── test_modeling_vits.py │ │ └── test_tokenization_vits.py │ ├── vivit │ │ ├── __init__.py │ │ ├── test_image_processing_vivit.py │ │ └── test_modeling_vivit.py │ ├── wav2vec2 │ │ ├── __init__.py │ │ ├── test_feature_extraction_wav2vec2.py │ │ ├── test_modeling_flax_wav2vec2.py │ │ ├── test_modeling_tf_wav2vec2.py │ │ ├── test_modeling_wav2vec2.py │ │ ├── test_processor_wav2vec2.py │ │ └── test_tokenization_wav2vec2.py │ ├── wav2vec2_bert │ │ ├── __init__.py │ │ ├── test_modeling_wav2vec2_bert.py │ │ └── test_processor_wav2vec2_bert.py │ ├── wav2vec2_conformer │ │ ├── __init__.py │ │ └── test_modeling_wav2vec2_conformer.py │ ├── wav2vec2_phoneme │ │ ├── __init__.py │ │ └── test_tokenization_wav2vec2_phoneme.py │ ├── wav2vec2_with_lm │ │ ├── __init__.py │ │ └── test_processor_wav2vec2_with_lm.py │ ├── wavlm │ │ ├── __init__.py │ │ └── test_modeling_wavlm.py │ ├── whisper │ │ ├── __init__.py │ │ ├── test_feature_extraction_whisper.py │ │ ├── test_modeling_flax_whisper.py │ │ ├── test_modeling_tf_whisper.py │ │ ├── test_modeling_whisper.py │ │ ├── test_processor_whisper.py │ │ └── test_tokenization_whisper.py │ ├── x_clip │ │ ├── __init__.py │ │ └── test_modeling_x_clip.py │ ├── xglm │ │ ├── __init__.py │ │ ├── test_modeling_flax_xglm.py │ │ ├── test_modeling_tf_xglm.py │ │ ├── test_modeling_xglm.py │ │ └── test_tokenization_xglm.py │ ├── xlm │ │ ├── __init__.py │ │ ├── test_modeling_tf_xlm.py │ │ ├── test_modeling_xlm.py │ │ └── test_tokenization_xlm.py │ ├── xlm_prophetnet │ │ ├── __init__.py │ │ ├── test_modeling_xlm_prophetnet.py │ │ └── test_tokenization_xlm_prophetnet.py │ ├── xlm_roberta │ │ ├── __init__.py │ │ ├── test_modeling_flax_xlm_roberta.py │ │ ├── test_modeling_tf_xlm_roberta.py │ │ ├── test_modeling_xlm_roberta.py │ │ └── test_tokenization_xlm_roberta.py │ ├── xlm_roberta_xl │ │ ├── __init__.py │ │ └── test_modeling_xlm_roberta_xl.py │ ├── xlnet │ │ ├── __init__.py │ │ ├── test_modeling_tf_xlnet.py │ │ ├── test_modeling_xlnet.py │ │ └── test_tokenization_xlnet.py │ ├── xmod │ │ ├── __init__.py │ │ └── test_modeling_xmod.py │ ├── yolos │ │ ├── __init__.py │ │ ├── test_image_processing_yolos.py │ │ └── test_modeling_yolos.py │ └── yoso │ │ ├── __init__.py │ │ └── test_modeling_yoso.py ├── optimization │ ├── __init__.py │ ├── test_optimization.py │ └── test_optimization_tf.py ├── peft_integration │ └── test_peft_integration.py ├── pipelines │ ├── __init__.py │ ├── test_pipelines_audio_classification.py │ ├── test_pipelines_automatic_speech_recognition.py │ ├── test_pipelines_common.py │ ├── test_pipelines_conversational.py │ ├── test_pipelines_depth_estimation.py │ ├── test_pipelines_document_question_answering.py │ ├── test_pipelines_feature_extraction.py │ ├── test_pipelines_fill_mask.py │ ├── test_pipelines_image_classification.py │ ├── test_pipelines_image_feature_extraction.py │ ├── test_pipelines_image_segmentation.py │ ├── test_pipelines_image_to_image.py │ ├── test_pipelines_image_to_text.py │ ├── test_pipelines_mask_generation.py │ ├── test_pipelines_object_detection.py │ ├── test_pipelines_question_answering.py │ ├── test_pipelines_summarization.py │ ├── test_pipelines_table_question_answering.py │ ├── test_pipelines_text2text_generation.py │ ├── test_pipelines_text_classification.py │ ├── test_pipelines_text_generation.py │ ├── test_pipelines_text_to_audio.py │ ├── test_pipelines_token_classification.py │ ├── test_pipelines_translation.py │ ├── test_pipelines_video_classification.py │ ├── test_pipelines_visual_question_answering.py │ ├── test_pipelines_zero_shot.py │ ├── test_pipelines_zero_shot_audio_classification.py │ ├── test_pipelines_zero_shot_image_classification.py │ └── test_pipelines_zero_shot_object_detection.py ├── quantization │ ├── aqlm_integration │ │ ├── __init__.py │ │ └── test_aqlm.py │ ├── autoawq │ │ ├── __init__.py │ │ └── test_awq.py │ ├── bnb │ │ ├── README.md │ │ ├── __init__.py │ │ ├── test_4bit.py │ │ └── test_mixed_int8.py │ ├── gptq │ │ ├── __init__.py │ │ └── test_gptq.py │ └── quanto_integration │ │ ├── __init__.py │ │ └── test_quanto.py ├── repo_utils │ ├── test_check_copies.py │ ├── test_check_docstrings.py │ ├── test_check_dummies.py │ ├── test_get_test_info.py │ └── test_tests_fetcher.py ├── sagemaker │ ├── README.md │ ├── __init__.py │ ├── conftest.py │ ├── scripts │ │ ├── pytorch │ │ │ ├── requirements.txt │ │ │ ├── run_ddp.py │ │ │ └── run_glue_model_parallelism.py │ │ └── tensorflow │ │ │ ├── requirements.txt │ │ │ ├── run_tf.py │ │ │ └── run_tf_dist.py │ ├── test_multi_node_data_parallel.py │ ├── test_multi_node_model_parallel.py │ └── test_single_node_gpu.py ├── test_backbone_common.py ├── test_cache_utils.py ├── test_configuration_common.py ├── test_configuration_utils.py ├── test_feature_extraction_common.py ├── test_feature_extraction_utils.py ├── test_image_processing_common.py ├── test_image_processing_utils.py ├── test_image_transforms.py ├── test_modeling_common.py ├── test_modeling_flax_common.py ├── test_modeling_flax_utils.py ├── test_modeling_tf_common.py ├── test_modeling_tf_utils.py ├── test_modeling_utils.py ├── test_pipeline_mixin.py ├── test_processing_common.py ├── test_sequence_feature_extraction_common.py ├── test_tokenization_common.py ├── test_tokenization_utils.py ├── tokenization │ ├── __init__.py │ ├── test_tokenization_fast.py │ └── test_tokenization_utils.py ├── tools │ ├── __init__.py │ ├── test_agent_types.py │ ├── test_document_question_answering.py │ ├── test_image_captioning.py │ ├── test_image_question_answering.py │ ├── test_image_segmentation.py │ ├── test_python_interpreter.py │ ├── test_speech_to_text.py │ ├── test_text_classification.py │ ├── test_text_question_answering.py │ ├── test_text_summarization.py │ ├── test_text_to_speech.py │ ├── test_tools_common.py │ └── test_translation.py ├── trainer │ ├── __init__.py │ ├── test_data_collator.py │ ├── test_trainer.py │ ├── test_trainer_callback.py │ ├── test_trainer_distributed.py │ ├── test_trainer_seq2seq.py │ ├── test_trainer_tpu.py │ └── test_trainer_utils.py └── utils │ ├── __init__.py │ ├── test_activations.py │ ├── test_activations_tf.py │ ├── test_add_new_model_like.py │ ├── test_audio_utils.py │ ├── test_backbone_utils.py │ ├── test_cli.py │ ├── test_convert_slow_tokenizer.py │ ├── test_doc_samples.py │ ├── test_dynamic_module_utils.py │ ├── test_file_utils.py │ ├── test_generic.py │ ├── test_hf_argparser.py │ ├── test_hub_utils.py │ ├── test_image_processing_utils.py │ ├── test_image_utils.py │ ├── test_logging.py │ ├── test_model_card.py │ ├── test_model_output.py │ ├── test_modeling_tf_core.py │ ├── test_offline.py │ ├── test_skip_decorators.py │ ├── test_versions_utils.py │ └── tiny_model_summary.json └── utils ├── add_pipeline_model_mapping_to_test.py ├── check_build.py ├── check_config_attributes.py ├── check_config_docstrings.py ├── check_copies.py ├── check_doc_toc.py ├── check_docstrings.py ├── check_doctest_list.py ├── check_dummies.py ├── check_inits.py ├── check_model_tester.py ├── check_repo.py ├── check_self_hosted_runner.py ├── check_support_list.py ├── check_table.py ├── check_task_guides.py ├── check_tf_ops.py ├── create_dummy_models.py ├── custom_init_isort.py ├── download_glue_data.py ├── extract_warnings.py ├── get_ci_error_statistics.py ├── get_github_job_time.py ├── get_modified_files.py ├── get_previous_daily_ci.py ├── get_test_info.py ├── important_models.txt ├── not_doctested.txt ├── notification_service.py ├── notification_service_doc_tests.py ├── notification_service_quantization.py ├── past_ci_versions.py ├── print_env.py ├── release.py ├── slow_documentation_tests.txt ├── sort_auto_mappings.py ├── split_doctest_jobs.py ├── split_model_tests.py ├── test_module ├── __init__.py ├── custom_configuration.py ├── custom_feature_extraction.py ├── custom_image_processing.py ├── custom_modeling.py ├── custom_pipeline.py ├── custom_processing.py ├── custom_tokenization.py └── custom_tokenization_fast.py ├── tests_fetcher.py ├── tf_ops └── onnx.json ├── update_metadata.py └── update_tiny_models.py /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/README.md -------------------------------------------------------------------------------- /img/Background.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/img/Background.png -------------------------------------------------------------------------------- /img/equation.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/img/equation.png -------------------------------------------------------------------------------- /img/hyperparameter.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/img/hyperparameter.png -------------------------------------------------------------------------------- /img/overview.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/img/overview.png -------------------------------------------------------------------------------- /reasoning_evaluation/gsm8k/topp/top95_13B_gsm8k.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/reasoning_evaluation/gsm8k/topp/top95_13B_gsm8k.json -------------------------------------------------------------------------------- /reasoning_evaluation/gsm8k/topp/top95_70B_gsm8k.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/reasoning_evaluation/gsm8k/topp/top95_70B_gsm8k.json -------------------------------------------------------------------------------- /reasoning_evaluation/gsm8k/topp/top95_7B_gsm8k.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/reasoning_evaluation/gsm8k/topp/top95_7B_gsm8k.json -------------------------------------------------------------------------------- /test.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/test.ipynb -------------------------------------------------------------------------------- /transformers-main/.coveragerc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/.coveragerc -------------------------------------------------------------------------------- /transformers-main/.gitattributes: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/.gitattributes -------------------------------------------------------------------------------- /transformers-main/.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/.gitignore -------------------------------------------------------------------------------- /transformers-main/CITATION.cff: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/CITATION.cff -------------------------------------------------------------------------------- /transformers-main/CODE_OF_CONDUCT.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/CODE_OF_CONDUCT.md -------------------------------------------------------------------------------- /transformers-main/CONTRIBUTING.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/CONTRIBUTING.md -------------------------------------------------------------------------------- /transformers-main/ISSUES.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/ISSUES.md -------------------------------------------------------------------------------- /transformers-main/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/LICENSE -------------------------------------------------------------------------------- /transformers-main/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/Makefile -------------------------------------------------------------------------------- /transformers-main/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/README.md -------------------------------------------------------------------------------- /transformers-main/README_de.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/README_de.md -------------------------------------------------------------------------------- /transformers-main/README_es.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/README_es.md -------------------------------------------------------------------------------- /transformers-main/README_fr.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/README_fr.md -------------------------------------------------------------------------------- /transformers-main/README_hd.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/README_hd.md -------------------------------------------------------------------------------- /transformers-main/README_ja.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/README_ja.md -------------------------------------------------------------------------------- /transformers-main/README_ko.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/README_ko.md -------------------------------------------------------------------------------- /transformers-main/README_pt-br.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/README_pt-br.md -------------------------------------------------------------------------------- /transformers-main/README_ru.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/README_ru.md -------------------------------------------------------------------------------- /transformers-main/README_te.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/README_te.md -------------------------------------------------------------------------------- /transformers-main/README_vi.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/README_vi.md -------------------------------------------------------------------------------- /transformers-main/README_zh-hans.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/README_zh-hans.md -------------------------------------------------------------------------------- /transformers-main/README_zh-hant.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/README_zh-hant.md -------------------------------------------------------------------------------- /transformers-main/SECURITY.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/SECURITY.md -------------------------------------------------------------------------------- /transformers-main/awesome-transformers.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/awesome-transformers.md -------------------------------------------------------------------------------- /transformers-main/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/conftest.py -------------------------------------------------------------------------------- /transformers-main/docker/transformers-gpu/Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docker/transformers-gpu/Dockerfile -------------------------------------------------------------------------------- /transformers-main/docs/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/README.md -------------------------------------------------------------------------------- /transformers-main/docs/TRANSLATING.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/TRANSLATING.md -------------------------------------------------------------------------------- /transformers-main/docs/source/_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/_config.py -------------------------------------------------------------------------------- /transformers-main/docs/source/de/_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/de/_config.py -------------------------------------------------------------------------------- /transformers-main/docs/source/de/_toctree.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/de/_toctree.yml -------------------------------------------------------------------------------- /transformers-main/docs/source/de/accelerate.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/de/accelerate.md -------------------------------------------------------------------------------- /transformers-main/docs/source/de/add_new_model.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/de/add_new_model.md -------------------------------------------------------------------------------- /transformers-main/docs/source/de/add_new_pipeline.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/de/add_new_pipeline.md -------------------------------------------------------------------------------- /transformers-main/docs/source/de/contributing.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/de/contributing.md -------------------------------------------------------------------------------- /transformers-main/docs/source/de/index.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/de/index.md -------------------------------------------------------------------------------- /transformers-main/docs/source/de/installation.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/de/installation.md -------------------------------------------------------------------------------- /transformers-main/docs/source/de/llm_tutorial.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/de/llm_tutorial.md -------------------------------------------------------------------------------- /transformers-main/docs/source/de/model_sharing.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/de/model_sharing.md -------------------------------------------------------------------------------- /transformers-main/docs/source/de/peft.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/de/peft.md -------------------------------------------------------------------------------- /transformers-main/docs/source/de/pr_checks.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/de/pr_checks.md -------------------------------------------------------------------------------- /transformers-main/docs/source/de/preprocessing.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/de/preprocessing.md -------------------------------------------------------------------------------- /transformers-main/docs/source/de/quicktour.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/de/quicktour.md -------------------------------------------------------------------------------- /transformers-main/docs/source/de/run_scripts.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/de/run_scripts.md -------------------------------------------------------------------------------- /transformers-main/docs/source/de/testing.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/de/testing.md -------------------------------------------------------------------------------- /transformers-main/docs/source/de/training.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/de/training.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/_config.py -------------------------------------------------------------------------------- /transformers-main/docs/source/en/_redirects.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/_redirects.yml -------------------------------------------------------------------------------- /transformers-main/docs/source/en/_toctree.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/_toctree.yml -------------------------------------------------------------------------------- /transformers-main/docs/source/en/accelerate.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/accelerate.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/add_new_model.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/add_new_model.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/add_new_pipeline.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/add_new_pipeline.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/attention.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/attention.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/benchmarks.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/benchmarks.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/bertology.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/bertology.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/big_models.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/big_models.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/chat_templating.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/chat_templating.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/community.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/community.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/contributing.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/contributing.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/create_a_model.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/create_a_model.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/custom_models.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/custom_models.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/custom_tools.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/custom_tools.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/debugging.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/debugging.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/deepspeed.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/deepspeed.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/fast_tokenizers.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/fast_tokenizers.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/fsdp.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/fsdp.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/glossary.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/glossary.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/hf_quantizer.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/hf_quantizer.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/hpo_train.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/hpo_train.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/index.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/index.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/installation.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/installation.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/llm_tutorial.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/llm_tutorial.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/albert.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/albert.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/align.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/align.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/auto.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/auto.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/bark.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/bark.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/bart.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/bart.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/beit.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/beit.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/bert.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/bert.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/biogpt.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/biogpt.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/bit.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/bit.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/blip-2.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/blip-2.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/blip.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/blip.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/bloom.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/bloom.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/bort.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/bort.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/bros.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/bros.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/byt5.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/byt5.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/canine.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/canine.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/clap.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/clap.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/clip.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/clip.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/clvp.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/clvp.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/cohere.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/cohere.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/cpm.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/cpm.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/cpmant.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/cpmant.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/ctrl.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/ctrl.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/cvt.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/cvt.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/dbrx.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/dbrx.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/deit.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/deit.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/deplot.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/deplot.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/deta.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/deta.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/detr.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/detr.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/dinat.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/dinat.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/dinov2.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/dinov2.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/dit.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/dit.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/donut.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/donut.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/dpr.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/dpr.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/dpt.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/dpt.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/ernie.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/ernie.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/esm.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/esm.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/falcon.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/falcon.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/flava.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/flava.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/fnet.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/fnet.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/fsmt.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/fsmt.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/funnel.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/funnel.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/fuyu.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/fuyu.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/gemma.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/gemma.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/git.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/git.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/glpn.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/glpn.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/gpt2.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/gpt2.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/gptj.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/gptj.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/hubert.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/hubert.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/ibert.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/ibert.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/jamba.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/jamba.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/led.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/led.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/levit.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/levit.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/lilt.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/lilt.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/llama.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/llama.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/llama2.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/llama2.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/llava.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/llava.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/longt5.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/longt5.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/luke.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/luke.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/lxmert.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/lxmert.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/mamba.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/mamba.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/marian.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/marian.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/matcha.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/matcha.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/mbart.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/mbart.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/mctct.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/mctct.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/mega.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/mega.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/mluke.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/mluke.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/mms.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/mms.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/mpnet.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/mpnet.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/mpt.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/mpt.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/mra.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/mra.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/mt5.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/mt5.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/mvp.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/mvp.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/nat.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/nat.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/nezha.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/nezha.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/nllb.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/nllb.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/nougat.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/nougat.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/olmo.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/olmo.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/opt.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/opt.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/owlv2.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/owlv2.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/owlvit.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/owlvit.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/phi.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/phi.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/plbart.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/plbart.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/pvt.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/pvt.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/pvt_v2.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/pvt_v2.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/qwen2.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/qwen2.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/rag.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/rag.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/realm.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/realm.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/regnet.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/regnet.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/resnet.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/resnet.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/rwkv.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/rwkv.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/sam.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/sam.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/seggpt.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/seggpt.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/sew-d.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/sew-d.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/sew.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/sew.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/swin.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/swin.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/t5.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/t5.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/tvlt.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/tvlt.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/tvp.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/tvp.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/udop.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/udop.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/ul2.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/ul2.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/umt5.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/umt5.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/van.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/van.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/vilt.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/vilt.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/vit.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/vit.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/vits.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/vits.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/xglm.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/xglm.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/xlm.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/xlm.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/xmod.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/xmod.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_doc/yoso.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_doc/yoso.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_sharing.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_sharing.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/model_summary.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/model_summary.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/multilingual.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/multilingual.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/notebooks.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/notebooks.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/pad_truncation.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/pad_truncation.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/peft.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/peft.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/perf_hardware.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/perf_hardware.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/perf_infer_cpu.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/perf_infer_cpu.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/perf_train_cpu.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/perf_train_cpu.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/performance.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/performance.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/perplexity.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/perplexity.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/philosophy.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/philosophy.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/pr_checks.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/pr_checks.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/preprocessing.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/preprocessing.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/quantization.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/quantization.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/quicktour.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/quicktour.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/run_scripts.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/run_scripts.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/sagemaker.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/sagemaker.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/serialization.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/serialization.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/task_summary.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/task_summary.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/tasks/asr.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/tasks/asr.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/tasks/idefics.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/tasks/idefics.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/testing.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/testing.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/tf_xla.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/tf_xla.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/tflite.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/tflite.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/torchscript.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/torchscript.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/trainer.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/trainer.md -------------------------------------------------------------------------------- /transformers-main/docs/source/en/training.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/en/training.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/_config.py -------------------------------------------------------------------------------- /transformers-main/docs/source/es/_toctree.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/_toctree.yml -------------------------------------------------------------------------------- /transformers-main/docs/source/es/accelerate.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/accelerate.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/attention.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/attention.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/bertology.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/bertology.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/community.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/community.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/create_a_model.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/create_a_model.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/custom_models.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/custom_models.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/debugging.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/debugging.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/glossary.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/glossary.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/index.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/index.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/installation.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/installation.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/model_sharing.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/model_sharing.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/multilingual.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/multilingual.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/pad_truncation.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/pad_truncation.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/performance.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/performance.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/perplexity.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/perplexity.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/philosophy.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/philosophy.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/pr_checks.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/pr_checks.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/preprocessing.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/preprocessing.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/quicktour.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/quicktour.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/run_scripts.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/run_scripts.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/sagemaker.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/sagemaker.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/serialization.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/serialization.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/task_summary.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/task_summary.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/tasks/asr.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/tasks/asr.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/torchscript.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/torchscript.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/trainer.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/trainer.md -------------------------------------------------------------------------------- /transformers-main/docs/source/es/training.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/es/training.md -------------------------------------------------------------------------------- /transformers-main/docs/source/fr/_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/fr/_config.py -------------------------------------------------------------------------------- /transformers-main/docs/source/fr/_toctree.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/fr/_toctree.yml -------------------------------------------------------------------------------- /transformers-main/docs/source/fr/in_translation.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/fr/in_translation.md -------------------------------------------------------------------------------- /transformers-main/docs/source/fr/index.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/fr/index.md -------------------------------------------------------------------------------- /transformers-main/docs/source/fr/installation.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/fr/installation.md -------------------------------------------------------------------------------- /transformers-main/docs/source/fr/quicktour.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/fr/quicktour.md -------------------------------------------------------------------------------- /transformers-main/docs/source/hi/_toctree.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/hi/_toctree.yml -------------------------------------------------------------------------------- /transformers-main/docs/source/it/_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/_config.py -------------------------------------------------------------------------------- /transformers-main/docs/source/it/_toctree.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/_toctree.yml -------------------------------------------------------------------------------- /transformers-main/docs/source/it/accelerate.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/accelerate.md -------------------------------------------------------------------------------- /transformers-main/docs/source/it/add_new_model.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/add_new_model.md -------------------------------------------------------------------------------- /transformers-main/docs/source/it/big_models.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/big_models.md -------------------------------------------------------------------------------- /transformers-main/docs/source/it/community.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/community.md -------------------------------------------------------------------------------- /transformers-main/docs/source/it/create_a_model.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/create_a_model.md -------------------------------------------------------------------------------- /transformers-main/docs/source/it/custom_models.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/custom_models.md -------------------------------------------------------------------------------- /transformers-main/docs/source/it/debugging.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/debugging.md -------------------------------------------------------------------------------- /transformers-main/docs/source/it/index.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/index.md -------------------------------------------------------------------------------- /transformers-main/docs/source/it/installation.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/installation.md -------------------------------------------------------------------------------- /transformers-main/docs/source/it/migration.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/migration.md -------------------------------------------------------------------------------- /transformers-main/docs/source/it/model_sharing.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/model_sharing.md -------------------------------------------------------------------------------- /transformers-main/docs/source/it/multilingual.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/multilingual.md -------------------------------------------------------------------------------- /transformers-main/docs/source/it/perf_hardware.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/perf_hardware.md -------------------------------------------------------------------------------- /transformers-main/docs/source/it/perf_infer_cpu.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/perf_infer_cpu.md -------------------------------------------------------------------------------- /transformers-main/docs/source/it/perf_train_cpu.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/perf_train_cpu.md -------------------------------------------------------------------------------- /transformers-main/docs/source/it/perf_train_tpu.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/perf_train_tpu.md -------------------------------------------------------------------------------- /transformers-main/docs/source/it/pr_checks.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/pr_checks.md -------------------------------------------------------------------------------- /transformers-main/docs/source/it/preprocessing.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/preprocessing.md -------------------------------------------------------------------------------- /transformers-main/docs/source/it/quicktour.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/quicktour.md -------------------------------------------------------------------------------- /transformers-main/docs/source/it/run_scripts.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/run_scripts.md -------------------------------------------------------------------------------- /transformers-main/docs/source/it/serialization.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/serialization.md -------------------------------------------------------------------------------- /transformers-main/docs/source/it/training.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/it/training.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/_toctree.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/_toctree.yml -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/accelerate.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/accelerate.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/add_new_model.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/add_new_model.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/attention.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/attention.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/benchmarks.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/benchmarks.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/bertology.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/bertology.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/big_models.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/big_models.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/community.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/community.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/create_a_model.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/create_a_model.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/custom_models.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/custom_models.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/custom_tools.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/custom_tools.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/glossary.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/glossary.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/hpo_train.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/hpo_train.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/index.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/index.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/installation.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/installation.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/llm_tutorial.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/llm_tutorial.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/model_doc/auto.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/model_doc/auto.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/model_doc/bark.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/model_doc/bark.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/model_doc/bart.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/model_doc/bart.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/model_doc/beit.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/model_doc/beit.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/model_doc/bert.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/model_doc/bert.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/model_doc/bit.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/model_doc/bit.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/model_doc/blip.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/model_doc/blip.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/model_doc/bort.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/model_doc/bort.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/model_doc/bros.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/model_doc/bros.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/model_doc/byt5.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/model_doc/byt5.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/model_doc/clap.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/model_doc/clap.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/model_doc/clip.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/model_doc/clip.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/model_doc/clvp.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/model_doc/clvp.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/model_doc/cpm.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/model_doc/cpm.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/model_doc/ctrl.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/model_doc/ctrl.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/model_doc/cvt.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/model_doc/cvt.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/model_doc/deit.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/model_doc/deit.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/model_doc/deta.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/model_doc/deta.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/model_doc/detr.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/model_doc/detr.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/model_sharing.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/model_sharing.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/model_summary.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/model_summary.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/multilingual.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/multilingual.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/pad_truncation.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/pad_truncation.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/peft.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/peft.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/perf_hardware.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/perf_hardware.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/perf_infer_cpu.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/perf_infer_cpu.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/perf_train_cpu.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/perf_train_cpu.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/perf_train_tpu.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/perf_train_tpu.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/performance.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/performance.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/perplexity.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/perplexity.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/philosophy.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/philosophy.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/pr_checks.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/pr_checks.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/preprocessing.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/preprocessing.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/quicktour.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/quicktour.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/run_scripts.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/run_scripts.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/serialization.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/serialization.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/task_summary.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/task_summary.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/tasks/asr.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/tasks/asr.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/tasks/idefics.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/tasks/idefics.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/testing.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/testing.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/tf_xla.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/tf_xla.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/tflite.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/tflite.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/torchscript.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/torchscript.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ja/training.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ja/training.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/_config.py -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/_toctree.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/_toctree.yml -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/accelerate.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/accelerate.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/add_new_model.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/add_new_model.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/attention.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/attention.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/bertology.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/bertology.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/big_models.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/big_models.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/community.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/community.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/contributing.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/contributing.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/create_a_model.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/create_a_model.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/custom_models.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/custom_models.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/custom_tools.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/custom_tools.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/debugging.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/debugging.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/hpo_train.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/hpo_train.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/in_translation.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/in_translation.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/index.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/index.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/installation.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/installation.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/llm_tutorial.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/llm_tutorial.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/model_sharing.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/model_sharing.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/model_summary.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/model_summary.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/multilingual.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/multilingual.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/pad_truncation.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/pad_truncation.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/peft.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/peft.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/perf_hardware.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/perf_hardware.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/perf_infer_cpu.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/perf_infer_cpu.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/perf_train_cpu.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/perf_train_cpu.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/performance.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/performance.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/perplexity.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/perplexity.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/philosophy.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/philosophy.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/pr_checks.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/pr_checks.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/preprocessing.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/preprocessing.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/quicktour.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/quicktour.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/run_scripts.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/run_scripts.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/sagemaker.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/sagemaker.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/serialization.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/serialization.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/task_summary.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/task_summary.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/tasks/asr.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/tasks/asr.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/testing.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/testing.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/tf_xla.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/tf_xla.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/tflite.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/tflite.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/torchscript.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/torchscript.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ko/training.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ko/training.md -------------------------------------------------------------------------------- /transformers-main/docs/source/ms/_toctree.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ms/_toctree.yml -------------------------------------------------------------------------------- /transformers-main/docs/source/ms/index.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/ms/index.md -------------------------------------------------------------------------------- /transformers-main/docs/source/pt/_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/pt/_config.py -------------------------------------------------------------------------------- /transformers-main/docs/source/pt/_toctree.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/pt/_toctree.yml -------------------------------------------------------------------------------- /transformers-main/docs/source/pt/accelerate.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/pt/accelerate.md -------------------------------------------------------------------------------- /transformers-main/docs/source/pt/create_a_model.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/pt/create_a_model.md -------------------------------------------------------------------------------- /transformers-main/docs/source/pt/custom_models.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/pt/custom_models.md -------------------------------------------------------------------------------- /transformers-main/docs/source/pt/index.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/pt/index.md -------------------------------------------------------------------------------- /transformers-main/docs/source/pt/installation.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/pt/installation.md -------------------------------------------------------------------------------- /transformers-main/docs/source/pt/multilingual.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/pt/multilingual.md -------------------------------------------------------------------------------- /transformers-main/docs/source/pt/quicktour.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/pt/quicktour.md -------------------------------------------------------------------------------- /transformers-main/docs/source/pt/run_scripts.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/pt/run_scripts.md -------------------------------------------------------------------------------- /transformers-main/docs/source/pt/serialization.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/pt/serialization.md -------------------------------------------------------------------------------- /transformers-main/docs/source/pt/training.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/pt/training.md -------------------------------------------------------------------------------- /transformers-main/docs/source/te/_toctree.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/te/_toctree.yml -------------------------------------------------------------------------------- /transformers-main/docs/source/te/index.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/te/index.md -------------------------------------------------------------------------------- /transformers-main/docs/source/te/quicktour.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/te/quicktour.md -------------------------------------------------------------------------------- /transformers-main/docs/source/tr/_toctree.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/tr/_toctree.yml -------------------------------------------------------------------------------- /transformers-main/docs/source/tr/index.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/tr/index.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/_toctree.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/_toctree.yml -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/accelerate.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/accelerate.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/big_models.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/big_models.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/contributing.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/contributing.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/create_a_model.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/create_a_model.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/custom_models.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/custom_models.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/debugging.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/debugging.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/fsdp.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/fsdp.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/hpo_train.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/hpo_train.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/index.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/index.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/installation.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/installation.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/llm_tutorial.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/llm_tutorial.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/model_sharing.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/model_sharing.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/multilingual.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/multilingual.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/peft.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/peft.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/perf_hardware.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/perf_hardware.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/performance.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/performance.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/preprocessing.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/preprocessing.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/quicktour.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/quicktour.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/run_scripts.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/run_scripts.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/serialization.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/serialization.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/task_summary.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/task_summary.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/tasks/asr.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/tasks/asr.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/tf_xla.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/tf_xla.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/tflite.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/tflite.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/torchscript.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/torchscript.md -------------------------------------------------------------------------------- /transformers-main/docs/source/zh/training.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/docs/source/zh/training.md -------------------------------------------------------------------------------- /transformers-main/examples/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/examples/README.md -------------------------------------------------------------------------------- /transformers-main/examples/flax/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/examples/flax/README.md -------------------------------------------------------------------------------- /transformers-main/examples/flax/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/examples/flax/conftest.py -------------------------------------------------------------------------------- /transformers-main/examples/flax/vision/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/examples/flax/vision/README.md -------------------------------------------------------------------------------- /transformers-main/examples/legacy/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/examples/legacy/README.md -------------------------------------------------------------------------------- /transformers-main/examples/legacy/benchmarking/requirements.txt: -------------------------------------------------------------------------------- 1 | torch >= 1.3 -------------------------------------------------------------------------------- /transformers-main/examples/legacy/run_camembert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/examples/legacy/run_camembert.py -------------------------------------------------------------------------------- /transformers-main/examples/legacy/run_swag.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/examples/legacy/run_swag.py -------------------------------------------------------------------------------- /transformers-main/examples/legacy/seq2seq/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/examples/legacy/seq2seq/utils.py -------------------------------------------------------------------------------- /transformers-main/examples/pytorch/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/examples/pytorch/README.md -------------------------------------------------------------------------------- /transformers-main/examples/pytorch/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/examples/pytorch/conftest.py -------------------------------------------------------------------------------- /transformers-main/examples/pytorch/xla_spawn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/examples/pytorch/xla_spawn.py -------------------------------------------------------------------------------- /transformers-main/examples/research_projects/adversarial/requirements.txt: -------------------------------------------------------------------------------- 1 | transformers == 3.5.1 2 | -------------------------------------------------------------------------------- /transformers-main/examples/research_projects/bert-loses-patience/pabee/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/examples/research_projects/bert-loses-patience/requirements.txt: -------------------------------------------------------------------------------- 1 | transformers == 3.5.1 -------------------------------------------------------------------------------- /transformers-main/examples/research_projects/bertabs/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/examples/research_projects/bertabs/requirements.txt: -------------------------------------------------------------------------------- 1 | transformers == 3.5.1 2 | 3 | # For ROUGE 4 | nltk 5 | py-rouge 6 | -------------------------------------------------------------------------------- /transformers-main/examples/research_projects/bertology/requirements.txt: -------------------------------------------------------------------------------- 1 | transformers == 3.5.1 2 | -------------------------------------------------------------------------------- /transformers-main/examples/research_projects/codeparrot/scripts/tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/examples/research_projects/deebert/requirements.txt: -------------------------------------------------------------------------------- 1 | transformers == 3.5.1 2 | -------------------------------------------------------------------------------- /transformers-main/examples/research_projects/deebert/src/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/examples/research_projects/fsner/requirements.txt: -------------------------------------------------------------------------------- 1 | transformers>=4.9.2 -------------------------------------------------------------------------------- /transformers-main/examples/research_projects/information-gain-filtration/igf/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/examples/research_projects/layoutlmv3/requirements.txt: -------------------------------------------------------------------------------- 1 | datasets 2 | seqeval 3 | pillow 4 | -------------------------------------------------------------------------------- /transformers-main/examples/research_projects/longform-qa/requirements.txt: -------------------------------------------------------------------------------- 1 | datasets >= 1.1.3 2 | faiss-cpu 3 | streamlit 4 | elasticsearch 5 | -------------------------------------------------------------------------------- /transformers-main/examples/research_projects/mlm_wwm/requirements.txt: -------------------------------------------------------------------------------- 1 | datasets >= 1.1.3 2 | sentencepiece != 0.1.92 3 | protobuf 4 | ltp 5 | -------------------------------------------------------------------------------- /transformers-main/examples/research_projects/onnx/summarization/requirements.txt: -------------------------------------------------------------------------------- 1 | torch >= 1.10 -------------------------------------------------------------------------------- /transformers-main/examples/research_projects/tapex/requirements.txt: -------------------------------------------------------------------------------- 1 | numpy 2 | datasets 3 | pandas 4 | nltk -------------------------------------------------------------------------------- /transformers-main/examples/run_on_remote.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/examples/run_on_remote.py -------------------------------------------------------------------------------- /transformers-main/examples/tensorflow/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/examples/tensorflow/README.md -------------------------------------------------------------------------------- /transformers-main/examples/tensorflow/benchmarking/requirements.txt: -------------------------------------------------------------------------------- 1 | tensorflow >= 2.3 -------------------------------------------------------------------------------- /transformers-main/examples/tensorflow/contrastive-image-text/requirements.txt: -------------------------------------------------------------------------------- 1 | tensorflow>=2.6.0 2 | datasets>=1.8.0 -------------------------------------------------------------------------------- /transformers-main/examples/tensorflow/image-classification/requirements.txt: -------------------------------------------------------------------------------- 1 | datasets>=1.17.0 2 | evaluate 3 | tensorflow>=2.4 4 | -------------------------------------------------------------------------------- /transformers-main/examples/tensorflow/language-modeling/requirements.txt: -------------------------------------------------------------------------------- 1 | datasets >= 1.8.0 2 | sentencepiece != 0.1.92 -------------------------------------------------------------------------------- /transformers-main/examples/tensorflow/multiple-choice/requirements.txt: -------------------------------------------------------------------------------- 1 | sentencepiece != 0.1.92 2 | protobuf 3 | tensorflow >= 2.3 4 | -------------------------------------------------------------------------------- /transformers-main/hubconf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/hubconf.py -------------------------------------------------------------------------------- /transformers-main/model_cards/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/model_cards/README.md -------------------------------------------------------------------------------- /transformers-main/notebooks/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/notebooks/README.md -------------------------------------------------------------------------------- /transformers-main/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/pyproject.toml -------------------------------------------------------------------------------- /transformers-main/scripts/check_tokenizers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/scripts/check_tokenizers.py -------------------------------------------------------------------------------- /transformers-main/scripts/fsmt/s3-move.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/scripts/fsmt/s3-move.sh -------------------------------------------------------------------------------- /transformers-main/scripts/fsmt/tests-to-run.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/scripts/fsmt/tests-to-run.sh -------------------------------------------------------------------------------- /transformers-main/scripts/stale.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/scripts/stale.py -------------------------------------------------------------------------------- /transformers-main/scripts/tatoeba/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/scripts/tatoeba/README.md -------------------------------------------------------------------------------- /transformers-main/scripts/tatoeba/upload_models.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/scripts/tatoeba/upload_models.sh -------------------------------------------------------------------------------- /transformers-main/setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/setup.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/__init__.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/activations.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/activations.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/audio_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/audio_utils.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/benchmark/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/src/transformers/cache_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/cache_utils.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/commands/env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/commands/env.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/commands/lfs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/commands/lfs.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/commands/run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/commands/run.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/debug_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/debug_utils.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/deepspeed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/deepspeed.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/file_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/file_utils.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/hf_argparser.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/hf_argparser.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/image_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/image_utils.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/modelcard.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/modelcard.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/models/deprecated/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/src/transformers/models/deprecated/bort/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/src/transformers/models/dialogpt/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/src/transformers/models/dit/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/src/transformers/onnx/config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/onnx/config.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/onnx/convert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/onnx/convert.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/onnx/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/onnx/utils.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/optimization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/optimization.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/tf_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/tf_utils.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/tools/agents.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/tools/agents.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/tools/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/tools/base.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/trainer.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/utils/doc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/utils/doc.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/utils/fx.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/utils/fx.py -------------------------------------------------------------------------------- /transformers-main/src/transformers/utils/hub.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/src/transformers/utils/hub.py -------------------------------------------------------------------------------- /transformers-main/tests/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/benchmark/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/bettertransformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/fixtures/dummy-config.json: -------------------------------------------------------------------------------- 1 | { 2 | "model_type": "roberta" 3 | } -------------------------------------------------------------------------------- /transformers-main/tests/fixtures/empty.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/fixtures/input.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/fixtures/input.txt -------------------------------------------------------------------------------- /transformers-main/tests/fixtures/merges.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/fixtures/merges.txt -------------------------------------------------------------------------------- /transformers-main/tests/fixtures/sample_text.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/fixtures/sample_text.txt -------------------------------------------------------------------------------- /transformers-main/tests/fixtures/spiece.model: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/fixtures/spiece.model -------------------------------------------------------------------------------- /transformers-main/tests/fixtures/vocab.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/fixtures/vocab.json -------------------------------------------------------------------------------- /transformers-main/tests/fixtures/vocab.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/fixtures/vocab.txt -------------------------------------------------------------------------------- /transformers-main/tests/fsdp/test_fsdp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/fsdp/test_fsdp.py -------------------------------------------------------------------------------- /transformers-main/tests/generation/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/generation/test_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/generation/test_utils.py -------------------------------------------------------------------------------- /transformers-main/tests/models/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/albert/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/align/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/altclip/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/audio_spectrogram_transformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/auto/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/autoformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/bark/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/bart/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/barthez/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/bartpho/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/beit/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/bert/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/bert_generation/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/bert_japanese/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/bertweet/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/big_bird/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/bigbird_pegasus/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/biogpt/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/bit/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/blenderbot/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/blenderbot_small/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/blip/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/blip_2/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/bloom/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/bridgetower/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/bros/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/byt5/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/camembert/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/canine/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/chinese_clip/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/clap/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/clip/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/clipseg/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/clvp/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/code_llama/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/codegen/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/cohere/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/conditional_detr/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/convbert/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/convnext/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/convnextv2/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/cpm/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/cpmant/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/ctrl/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/cvt/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/data2vec/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/dbrx/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/deberta/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/deberta_v2/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/decision_transformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/deformable_detr/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/deit/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/depth_anything/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/deta/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/detr/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/dinat/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/dinov2/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/distilbert/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/dit/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/donut/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/dpr/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/dpt/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/efficientformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/efficientnet/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/electra/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/encodec/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/encoder_decoder/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/ernie/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/ernie_m/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/esm/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/falcon/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/fastspeech2_conformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/flaubert/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/flava/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/fnet/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/focalnet/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/fsmt/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/funnel/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/fuyu/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/gemma/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/git/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/glpn/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/gpt2/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/gpt_bigcode/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/gpt_neo/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/gpt_neox/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/gpt_neox_japanese/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/gpt_sw3/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/gptj/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/gptsan_japanese/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/graphormer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/grounding_dino/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/groupvit/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/herbert/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/hubert/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/ibert/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/idefics/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/idefics2/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/imagegpt/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/informer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/instructblip/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/jamba/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/jukebox/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/kosmos2/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/layoutlm/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/layoutlmv2/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/layoutlmv3/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/layoutxlm/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/led/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/levit/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/lilt/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/llama/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/llava/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/llava_next/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/longformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/longt5/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/luke/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/lxmert/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/m2m_100/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/mamba/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/marian/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/markuplm/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/mask2former/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/maskformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/mbart/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/mbart50/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/mega/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/megatron_bert/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/megatron_gpt2/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/mgp_str/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/mistral/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/mixtral/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/mluke/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/mobilebert/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/mobilenet_v1/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/mobilenet_v2/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/mobilevit/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/mobilevitv2/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/mpnet/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/mpt/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/mra/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/mt5/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/musicgen/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/musicgen_melody/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/mvp/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/nat/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/nezha/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/nllb/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/nllb_moe/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/nougat/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/nystromformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/olmo/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/oneformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/openai/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/opt/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/owlv2/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/owlvit/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/patchtsmixer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/patchtst/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/pegasus/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/pegasus_x/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/perceiver/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/persimmon/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/phi/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/phobert/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/pix2struct/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/plbart/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/poolformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/pop2piano/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/prophetnet/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/pvt/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/pvt_v2/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/qdqbert/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/qwen2/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/qwen2_moe/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/rag/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/realm/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/recurrent_gemma/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/reformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/regnet/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/rembert/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/resnet/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/roberta/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/roberta_prelayernorm/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/roc_bert/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/roformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/rwkv/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/sam/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/seamless_m4t/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/seamless_m4t_v2/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/segformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/seggpt/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/sew/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/sew_d/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/siglip/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/speech_encoder_decoder/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/speech_to_text/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/speech_to_text_2/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/speecht5/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/splinter/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/squeezebert/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/stablelm/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/starcoder2/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/superpoint/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/swiftformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/swin/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/swin2sr/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/swinv2/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/switch_transformers/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/t5/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/table_transformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/tapas/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/time_series_transformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/timesformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/timm_backbone/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/trocr/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/tvlt/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/tvp/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/udop/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/umt5/__init__.py: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /transformers-main/tests/models/unispeech/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/unispeech_sat/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/univnet/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/upernet/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/videomae/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/vilt/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/vipllava/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/vision_encoder_decoder/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/vision_text_dual_encoder/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/visual_bert/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/vit/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/vit_hybrid/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/vit_mae/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/vit_msn/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/vitdet/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/vitmatte/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/vits/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/vivit/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/wav2vec2/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/wav2vec2_bert/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/wav2vec2_conformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/wav2vec2_phoneme/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/wav2vec2_with_lm/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/wavlm/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/whisper/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/x_clip/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/xglm/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/xlm/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/xlm_prophetnet/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/xlm_roberta/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/xlm_roberta_xl/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/xlnet/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/xmod/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/yolos/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/models/yoso/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/optimization/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/pipelines/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/quantization/aqlm_integration/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/quantization/autoawq/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/quantization/bnb/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/quantization/bnb/README.md -------------------------------------------------------------------------------- /transformers-main/tests/quantization/bnb/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/quantization/gptq/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/quantization/quanto_integration/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/sagemaker/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/sagemaker/README.md -------------------------------------------------------------------------------- /transformers-main/tests/sagemaker/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/sagemaker/__init__.py -------------------------------------------------------------------------------- /transformers-main/tests/sagemaker/conftest.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/sagemaker/conftest.py -------------------------------------------------------------------------------- /transformers-main/tests/test_backbone_common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/test_backbone_common.py -------------------------------------------------------------------------------- /transformers-main/tests/test_cache_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/test_cache_utils.py -------------------------------------------------------------------------------- /transformers-main/tests/test_image_transforms.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/test_image_transforms.py -------------------------------------------------------------------------------- /transformers-main/tests/test_modeling_common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/test_modeling_common.py -------------------------------------------------------------------------------- /transformers-main/tests/test_modeling_tf_common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/test_modeling_tf_common.py -------------------------------------------------------------------------------- /transformers-main/tests/test_modeling_tf_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/test_modeling_tf_utils.py -------------------------------------------------------------------------------- /transformers-main/tests/test_modeling_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/test_modeling_utils.py -------------------------------------------------------------------------------- /transformers-main/tests/test_pipeline_mixin.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/test_pipeline_mixin.py -------------------------------------------------------------------------------- /transformers-main/tests/test_processing_common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/test_processing_common.py -------------------------------------------------------------------------------- /transformers-main/tests/test_tokenization_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/test_tokenization_utils.py -------------------------------------------------------------------------------- /transformers-main/tests/tokenization/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/tools/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/tools/test_agent_types.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/tools/test_agent_types.py -------------------------------------------------------------------------------- /transformers-main/tests/tools/test_tools_common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/tools/test_tools_common.py -------------------------------------------------------------------------------- /transformers-main/tests/tools/test_translation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/tools/test_translation.py -------------------------------------------------------------------------------- /transformers-main/tests/trainer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/trainer/test_trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/trainer/test_trainer.py -------------------------------------------------------------------------------- /transformers-main/tests/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/tests/utils/test_activations.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/utils/test_activations.py -------------------------------------------------------------------------------- /transformers-main/tests/utils/test_audio_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/utils/test_audio_utils.py -------------------------------------------------------------------------------- /transformers-main/tests/utils/test_cli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/utils/test_cli.py -------------------------------------------------------------------------------- /transformers-main/tests/utils/test_doc_samples.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/utils/test_doc_samples.py -------------------------------------------------------------------------------- /transformers-main/tests/utils/test_file_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/utils/test_file_utils.py -------------------------------------------------------------------------------- /transformers-main/tests/utils/test_generic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/utils/test_generic.py -------------------------------------------------------------------------------- /transformers-main/tests/utils/test_hf_argparser.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/utils/test_hf_argparser.py -------------------------------------------------------------------------------- /transformers-main/tests/utils/test_hub_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/utils/test_hub_utils.py -------------------------------------------------------------------------------- /transformers-main/tests/utils/test_image_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/utils/test_image_utils.py -------------------------------------------------------------------------------- /transformers-main/tests/utils/test_logging.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/utils/test_logging.py -------------------------------------------------------------------------------- /transformers-main/tests/utils/test_model_card.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/utils/test_model_card.py -------------------------------------------------------------------------------- /transformers-main/tests/utils/test_model_output.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/utils/test_model_output.py -------------------------------------------------------------------------------- /transformers-main/tests/utils/test_offline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/tests/utils/test_offline.py -------------------------------------------------------------------------------- /transformers-main/utils/check_build.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/check_build.py -------------------------------------------------------------------------------- /transformers-main/utils/check_config_attributes.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/check_config_attributes.py -------------------------------------------------------------------------------- /transformers-main/utils/check_config_docstrings.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/check_config_docstrings.py -------------------------------------------------------------------------------- /transformers-main/utils/check_copies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/check_copies.py -------------------------------------------------------------------------------- /transformers-main/utils/check_doc_toc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/check_doc_toc.py -------------------------------------------------------------------------------- /transformers-main/utils/check_docstrings.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/check_docstrings.py -------------------------------------------------------------------------------- /transformers-main/utils/check_doctest_list.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/check_doctest_list.py -------------------------------------------------------------------------------- /transformers-main/utils/check_dummies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/check_dummies.py -------------------------------------------------------------------------------- /transformers-main/utils/check_inits.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/check_inits.py -------------------------------------------------------------------------------- /transformers-main/utils/check_model_tester.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/check_model_tester.py -------------------------------------------------------------------------------- /transformers-main/utils/check_repo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/check_repo.py -------------------------------------------------------------------------------- /transformers-main/utils/check_support_list.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/check_support_list.py -------------------------------------------------------------------------------- /transformers-main/utils/check_table.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/check_table.py -------------------------------------------------------------------------------- /transformers-main/utils/check_task_guides.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/check_task_guides.py -------------------------------------------------------------------------------- /transformers-main/utils/check_tf_ops.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/check_tf_ops.py -------------------------------------------------------------------------------- /transformers-main/utils/create_dummy_models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/create_dummy_models.py -------------------------------------------------------------------------------- /transformers-main/utils/custom_init_isort.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/custom_init_isort.py -------------------------------------------------------------------------------- /transformers-main/utils/download_glue_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/download_glue_data.py -------------------------------------------------------------------------------- /transformers-main/utils/extract_warnings.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/extract_warnings.py -------------------------------------------------------------------------------- /transformers-main/utils/get_ci_error_statistics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/get_ci_error_statistics.py -------------------------------------------------------------------------------- /transformers-main/utils/get_github_job_time.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/get_github_job_time.py -------------------------------------------------------------------------------- /transformers-main/utils/get_modified_files.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/get_modified_files.py -------------------------------------------------------------------------------- /transformers-main/utils/get_previous_daily_ci.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/get_previous_daily_ci.py -------------------------------------------------------------------------------- /transformers-main/utils/get_test_info.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/get_test_info.py -------------------------------------------------------------------------------- /transformers-main/utils/important_models.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/important_models.txt -------------------------------------------------------------------------------- /transformers-main/utils/not_doctested.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/not_doctested.txt -------------------------------------------------------------------------------- /transformers-main/utils/notification_service.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/notification_service.py -------------------------------------------------------------------------------- /transformers-main/utils/past_ci_versions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/past_ci_versions.py -------------------------------------------------------------------------------- /transformers-main/utils/print_env.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/print_env.py -------------------------------------------------------------------------------- /transformers-main/utils/release.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/release.py -------------------------------------------------------------------------------- /transformers-main/utils/sort_auto_mappings.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/sort_auto_mappings.py -------------------------------------------------------------------------------- /transformers-main/utils/split_doctest_jobs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/split_doctest_jobs.py -------------------------------------------------------------------------------- /transformers-main/utils/split_model_tests.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/split_model_tests.py -------------------------------------------------------------------------------- /transformers-main/utils/test_module/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /transformers-main/utils/tests_fetcher.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/tests_fetcher.py -------------------------------------------------------------------------------- /transformers-main/utils/tf_ops/onnx.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/tf_ops/onnx.json -------------------------------------------------------------------------------- /transformers-main/utils/update_metadata.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/update_metadata.py -------------------------------------------------------------------------------- /transformers-main/utils/update_tiny_models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/zwhong714/adaptive_decoding/HEAD/transformers-main/utils/update_tiny_models.py --------------------------------------------------------------------------------