.coveragerc
.gitattributes
.gitignore
CITATION.cff
CODE_OF_CONDUCT.md
CONTRIBUTING.md
ISSUES.md
LICENSE
MANIFEST.in
Makefile
README.md
README_ko.md
README_zh-hans.md
README_zh-hant.md
hubconf.py
pyproject.toml
setup.cfg
setup.py
valohai.yaml
.circleci/TROUBLESHOOT.md
.circleci/config.yml
.github/PULL_REQUEST_TEMPLATE.md
.github/ISSUE_TEMPLATE/---new-benchmark.md
.github/ISSUE_TEMPLATE/--new-model-addition.md
.github/ISSUE_TEMPLATE/bug-report.md
.github/ISSUE_TEMPLATE/feature-request.md
.github/ISSUE_TEMPLATE/migration.md
.github/ISSUE_TEMPLATE/question-help.md
.github/conda/build.sh
.github/conda/meta.yaml
.github/workflows/TROUBLESHOOT.md
.github/workflows/build_doc_test.yml
.github/workflows/build_documentation.yml
.github/workflows/doctests.yml
.github/workflows/github-torch-hub.yml
.github/workflows/model-templates.yml
.github/workflows/release-conda.yml
.github/workflows/self-nightly-scheduled.yml
.github/workflows/self-push.yml
.github/workflows/self-scheduled.yml
.github/workflows/stale.yml
docker/transformers-cpu/Dockerfile
docker/transformers-gpu/Dockerfile
docker/transformers-pytorch-cpu/Dockerfile
docker/transformers-pytorch-gpu/Dockerfile
docker/transformers-pytorch-tpu/Dockerfile
docker/transformers-pytorch-tpu/bert-base-cased.jsonnet
docker/transformers-pytorch-tpu/dataset.yaml
docker/transformers-pytorch-tpu/docker-entrypoint.sh
docker/transformers-tensorflow-cpu/Dockerfile
docker/transformers-tensorflow-gpu/Dockerfile
docs/Makefile
docs/README.md
docs/source/_toctree.yml
docs/source/add_new_model.rst
docs/source/add_new_pipeline.rst
docs/source/benchmarks.mdx
docs/source/bertology.rst
docs/source/community.md
docs/source/contributing.md
docs/source/converting_tensorflow_models.rst
docs/source/custom_datasets.mdx
docs/source/debugging.rst
docs/source/examples.md
docs/source/fast_tokenizers.rst
docs/source/glossary.rst
docs/source/index.mdx
docs/source/index.rst
docs/source/installation.md
docs/source/migration.md
docs/source/model_sharing.rst
docs/source/model_summary.rst
docs/source/multilingual.mdx
docs/source/notebooks.md
docs/source/parallelism.md
docs/source/performance.md
docs/source/perplexity.mdx
docs/source/philosophy.rst
docs/source/pr_checks.md
docs/source/preprocessing.mdx
docs/source/quicktour.mdx
docs/source/sagemaker.md
docs/source/serialization.rst
docs/source/task_summary.mdx
docs/source/testing.rst
docs/source/tokenizer_summary.mdx
docs/source/training.mdx
docs/source/troubleshooting.md
docs/source/imgs/course_banner.png
docs/source/imgs/local_attention_mask.png
docs/source/imgs/parallelism-deepspeed-3d.png
docs/source/imgs/parallelism-flexflow.jpeg
docs/source/imgs/parallelism-gpipe-bubble.png
docs/source/imgs/parallelism-sagemaker-interleaved-pipeline.png
docs/source/imgs/parallelism-tp-independent-gelu.png
docs/source/imgs/parallelism-tp-parallel_gemm.png
docs/source/imgs/parallelism-tp-parallel_self_attention.png
docs/source/imgs/parallelism-tp-parallel_shard_processing.png
docs/source/imgs/parallelism-zero-dp-pp.png
docs/source/imgs/parallelism-zero.png
docs/source/imgs/ppl_chunked.gif
docs/source/imgs/ppl_full.gif
docs/source/imgs/ppl_sliding.gif
docs/source/imgs/tf32-bf16-fp16-fp32.png
docs/source/imgs/transformers_logo_name.png
docs/source/imgs/transformers_overview.png
docs/source/imgs/warmup_constant_schedule.png
docs/source/imgs/warmup_cosine_hard_restarts_schedule.png
docs/source/imgs/warmup_cosine_schedule.png
docs/source/imgs/warmup_cosine_warm_restarts_schedule.png
docs/source/imgs/warmup_linear_schedule.png
docs/source/internal/file_utils.rst
docs/source/internal/generation_utils.rst
docs/source/internal/modeling_utils.rst
docs/source/internal/pipelines_utils.rst
docs/source/internal/tokenization_utils.rst
docs/source/internal/trainer_utils.rst
docs/source/main_classes/callback.rst
docs/source/main_classes/configuration.rst
docs/source/main_classes/data_collator.rst
docs/source/main_classes/deepspeed.rst
docs/source/main_classes/feature_extractor.rst
docs/source/main_classes/keras_callbacks.rst
docs/source/main_classes/logging.rst
docs/source/main_classes/model.rst
docs/source/main_classes/optimizer_schedules.rst
docs/source/main_classes/output.rst
docs/source/main_classes/pipelines.rst
docs/source/main_classes/processors.rst
docs/source/main_classes/tokenizer.rst
docs/source/main_classes/trainer.rst
docs/source/model_doc/albert.rst
docs/source/model_doc/auto.rst
docs/source/model_doc/bart.rst
docs/source/model_doc/barthez.rst
docs/source/model_doc/bartpho.rst
docs/source/model_doc/beit.rst
docs/source/model_doc/bert.rst
docs/source/model_doc/bert_japanese.rst
docs/source/model_doc/bertgeneration.rst
docs/source/model_doc/bertweet.rst
docs/source/model_doc/bigbird.rst
docs/source/model_doc/bigbird_pegasus.rst
docs/source/model_doc/blenderbot.rst
docs/source/model_doc/blenderbot_small.rst
docs/source/model_doc/bort.rst
docs/source/model_doc/byt5.rst
docs/source/model_doc/camembert.rst
docs/source/model_doc/canine.rst
docs/source/model_doc/clip.rst
docs/source/model_doc/convbert.rst
docs/source/model_doc/cpm.rst
docs/source/model_doc/ctrl.rst
docs/source/model_doc/deberta.rst
docs/source/model_doc/deberta_v2.rst
docs/source/model_doc/deit.rst
docs/source/model_doc/detr.mdx
docs/source/model_doc/dialogpt.rst
docs/source/model_doc/distilbert.rst
docs/source/model_doc/dpr.rst
docs/source/model_doc/electra.rst
docs/source/model_doc/encoderdecoder.rst
docs/source/model_doc/flaubert.rst
docs/source/model_doc/fnet.rst
docs/source/model_doc/fsmt.rst
docs/source/model_doc/funnel.rst
docs/source/model_doc/gpt.rst
docs/source/model_doc/gpt2.rst
docs/source/model_doc/gpt_neo.rst
docs/source/model_doc/gptj.rst
docs/source/model_doc/herbert.rst
docs/source/model_doc/hubert.rst
docs/source/model_doc/ibert.rst
docs/source/model_doc/imagegpt.rst
docs/source/model_doc/layoutlm.rst
docs/source/model_doc/layoutlmv2.rst
docs/source/model_doc/layoutxlm.rst
docs/source/model_doc/led.rst
docs/source/model_doc/longformer.rst
docs/source/model_doc/luke.rst
docs/source/model_doc/lxmert.rst
docs/source/model_doc/m2m_100.rst
docs/source/model_doc/marian.rst
docs/source/model_doc/mbart.rst
docs/source/model_doc/megatron_bert.rst
docs/source/model_doc/megatron_gpt2.rst
docs/source/model_doc/mluke.rst
docs/source/model_doc/mobilebert.rst
docs/source/model_doc/mpnet.rst
docs/source/model_doc/mt5.rst
docs/source/model_doc/pegasus.rst
docs/source/model_doc/perceiver.rst
docs/source/model_doc/phobert.rst
docs/source/model_doc/prophetnet.rst
docs/source/model_doc/qdqbert.rst
docs/source/model_doc/rag.rst
docs/source/model_doc/reformer.rst
docs/source/model_doc/rembert.rst
docs/source/model_doc/retribert.rst
docs/source/model_doc/roberta.rst
docs/source/model_doc/roformer.rst
docs/source/model_doc/segformer.rst
docs/source/model_doc/sew.rst
docs/source/model_doc/sew_d.rst
docs/source/model_doc/speech_to_text.rst
docs/source/model_doc/speech_to_text_2.rst
docs/source/model_doc/speechencoderdecoder.rst
docs/source/model_doc/splinter.rst
docs/source/model_doc/squeezebert.rst
docs/source/model_doc/t5.rst
docs/source/model_doc/t5v1.1.rst
docs/source/model_doc/tapas.rst
docs/source/model_doc/transformerxl.rst
docs/source/model_doc/trocr.rst
docs/source/model_doc/unispeech.rst
docs/source/model_doc/unispeech_sat.rst
docs/source/model_doc/vision_text_dual_encoder.rst
docs/source/model_doc/visionencoderdecoder.rst
docs/source/model_doc/visual_bert.rst
docs/source/model_doc/vit.rst
docs/source/model_doc/wav2vec2.rst
docs/source/model_doc/xlm.rst
docs/source/model_doc/xlmprophetnet.rst
docs/source/model_doc/xlmroberta.rst
docs/source/model_doc/xlnet.rst
docs/source/model_doc/xlsr_wav2vec2.rst
examples/README.md
examples/flax/README.md
examples/flax/_tests_requirements.txt
examples/flax/conftest.py
examples/flax/test_examples.py
examples/flax/language-modeling/README.md
examples/flax/language-modeling/requirements.txt
examples/flax/language-modeling/run_clm_flax.py
examples/flax/language-modeling/run_mlm_flax.py
examples/flax/language-modeling/run_t5_mlm_flax.py
examples/flax/language-modeling/t5_tokenizer_model.py
examples/flax/question-answering/README.md
examples/flax/question-answering/requirements.txt
examples/flax/question-answering/run_qa.py
examples/flax/question-answering/utils_qa.py
examples/flax/summarization/README.md
examples/flax/summarization/requirements.txt
examples/flax/summarization/run_summarization_flax.py
examples/flax/text-classification/README.md
examples/flax/text-classification/requirements.txt
examples/flax/text-classification/run_flax_glue.py
examples/flax/token-classification/README.md
examples/flax/token-classification/requirements.txt
examples/flax/token-classification/run_flax_ner.py
examples/flax/vision/README.md
examples/flax/vision/requirements.txt
examples/flax/vision/run_image_classification.py
examples/legacy/README.md
examples/legacy/run_camembert.py
examples/legacy/run_chinese_ref.py
examples/legacy/run_language_modeling.py
examples/legacy/run_openai_gpt.py
examples/legacy/run_swag.py
examples/legacy/run_transfo_xl.py
examples/legacy/multiple_choice/run_multiple_choice.py
examples/legacy/multiple_choice/utils_multiple_choice.py
examples/legacy/pytorch-lightning/lightning_base.py
examples/legacy/pytorch-lightning/requirements.txt
examples/legacy/pytorch-lightning/run_glue.py
examples/legacy/pytorch-lightning/run_glue.sh
examples/legacy/pytorch-lightning/run_ner.py
examples/legacy/pytorch-lightning/run_ner.sh
examples/legacy/pytorch-lightning/run_pos.sh
examples/legacy/question-answering/README.md
examples/legacy/question-answering/run_squad.py
examples/legacy/question-answering/run_squad_trainer.py
examples/legacy/seq2seq/README.md
examples/legacy/seq2seq/__init__.py
examples/legacy/seq2seq/convert_model_to_fp16.py
examples/legacy/seq2seq/download_wmt.py
examples/legacy/seq2seq/finetune.sh
examples/legacy/seq2seq/finetune_tpu.sh
examples/legacy/seq2seq/finetune_trainer.py
examples/legacy/seq2seq/minify_dataset.py
examples/legacy/seq2seq/old_test_calculate_rouge.py
examples/legacy/seq2seq/old_test_datasets.py
examples/legacy/seq2seq/old_test_fsmt_bleu_score.py
examples/legacy/seq2seq/old_test_seq2seq_examples.py
examples/legacy/seq2seq/old_test_seq2seq_examples_multi_gpu.py
examples/legacy/seq2seq/old_test_tatoeba_conversion.py
examples/legacy/seq2seq/pack_dataset.py
examples/legacy/seq2seq/requirements.txt
examples/legacy/seq2seq/romanian_postprocessing.md
examples/legacy/seq2seq/rouge_cli.py
examples/legacy/seq2seq/run_distributed_eval.py
examples/legacy/seq2seq/run_eval.py
examples/legacy/seq2seq/run_eval_search.py
examples/legacy/seq2seq/save_len_file.py
examples/legacy/seq2seq/save_randomly_initialized_model.py
examples/legacy/seq2seq/sentence_splitter.py
examples/legacy/seq2seq/seq2seq_trainer.py
examples/legacy/seq2seq/seq2seq_training_args.py
examples/legacy/seq2seq/train_distil_marian_enro.sh
examples/legacy/seq2seq/train_distil_marian_enro_tpu.sh
examples/legacy/seq2seq/train_distilbart_cnn.sh
examples/legacy/seq2seq/train_mbart_cc25_enro.sh
examples/legacy/seq2seq/utils.py
examples/legacy/seq2seq/xla_spawn.py
examples/legacy/seq2seq/test_data/fsmt/build-eval-data.py
examples/legacy/seq2seq/test_data/fsmt/fsmt_val_data.json
examples/legacy/seq2seq/test_data/wmt_en_ro/test.source
examples/legacy/seq2seq/test_data/wmt_en_ro/test.target
examples/legacy/seq2seq/test_data/wmt_en_ro/train.len
examples/legacy/seq2seq/test_data/wmt_en_ro/train.source
examples/legacy/seq2seq/test_data/wmt_en_ro/train.target
examples/legacy/seq2seq/test_data/wmt_en_ro/val.len
examples/legacy/seq2seq/test_data/wmt_en_ro/val.source
examples/legacy/seq2seq/test_data/wmt_en_ro/val.target
examples/legacy/text-classification/run_tf_text_classification.py
examples/legacy/token-classification/README.md
examples/legacy/token-classification/run.sh
examples/legacy/token-classification/run_chunk.sh
examples/legacy/token-classification/run_ner.py
examples/legacy/token-classification/run_pos.sh
examples/legacy/token-classification/run_tf_ner.py
examples/legacy/token-classification/tasks.py
examples/legacy/token-classification/utils_ner.py
examples/legacy/token-classification/scripts/preprocess.py
examples/onnx/pytorch/summarization/README.md
examples/onnx/pytorch/summarization/requirements.txt
examples/onnx/pytorch/summarization/run_onnx_exporter.py
examples/onnx/pytorch/summarization/bart_onnx/generation_onnx.py
examples/onnx/pytorch/summarization/bart_onnx/reduce_onnx_size.py
examples/pytorch/README.md
examples/pytorch/_tests_requirements.txt
examples/pytorch/conftest.py
examples/pytorch/test_examples.py
examples/pytorch/test_xla_examples.py
examples/pytorch/xla_spawn.py
examples/pytorch/audio-classification/README.md
examples/pytorch/audio-classification/requirements.txt
examples/pytorch/audio-classification/run_audio_classification.py
examples/pytorch/benchmarking/README.md
examples/pytorch/benchmarking/plot_csv_file.py
examples/pytorch/benchmarking/requirements.txt
examples/pytorch/benchmarking/run_benchmark.py
examples/pytorch/image-classification/README.md
examples/pytorch/image-classification/requirements.txt
examples/pytorch/image-classification/run_image_classification.py
examples/pytorch/language-modeling/README.md
examples/pytorch/language-modeling/requirements.txt
examples/pytorch/language-modeling/run_clm.py
examples/pytorch/language-modeling/run_clm_no_trainer.py
examples/pytorch/language-modeling/run_mlm.py
examples/pytorch/language-modeling/run_mlm_no_trainer.py
examples/pytorch/language-modeling/run_plm.py
examples/pytorch/multiple-choice/README.md
examples/pytorch/multiple-choice/requirements.txt
examples/pytorch/multiple-choice/run_no_trainer.sh
examples/pytorch/multiple-choice/run_swag.py
examples/pytorch/multiple-choice/run_swag_no_trainer.py
examples/pytorch/question-answering/README.md
examples/pytorch/question-answering/requirements.txt
examples/pytorch/question-answering/run_qa.py
examples/pytorch/question-answering/run_qa_beam_search.py
examples/pytorch/question-answering/run_qa_beam_search_no_trainer.py
examples/pytorch/question-answering/run_qa_no_trainer.py
examples/pytorch/question-answering/run_seq2seq_qa.py
examples/pytorch/question-answering/trainer_qa.py
examples/pytorch/question-answering/trainer_seq2seq_qa.py
examples/pytorch/question-answering/utils_qa.py
examples/pytorch/speech-pretraining/README.md
examples/pytorch/speech-pretraining/requirements.txt
examples/pytorch/speech-pretraining/run_wav2vec2_pretraining_no_trainer.py
examples/pytorch/speech-recognition/README.md
examples/pytorch/speech-recognition/requirements.txt
examples/pytorch/speech-recognition/run_speech_recognition_ctc.py
examples/pytorch/summarization/README.md
examples/pytorch/summarization/requirements.txt
examples/pytorch/summarization/run_summarization.py
examples/pytorch/summarization/run_summarization_no_trainer.py
examples/pytorch/text-classification/README.md
examples/pytorch/text-classification/requirements.txt
examples/pytorch/text-classification/run_glue.py
examples/pytorch/text-classification/run_glue_no_trainer.py
examples/pytorch/text-classification/run_xnli.py
examples/pytorch/text-generation/README.md
examples/pytorch/text-generation/requirements.txt
examples/pytorch/text-generation/run_generation.py
examples/pytorch/token-classification/README.md
examples/pytorch/token-classification/requirements.txt
examples/pytorch/token-classification/run.sh
examples/pytorch/token-classification/run_ner.py
examples/pytorch/token-classification/run_ner_no_trainer.py
examples/pytorch/token-classification/run_no_trainer.sh
examples/pytorch/translation/README.md
examples/pytorch/translation/requirements.txt
examples/pytorch/translation/run_translation.py
examples/pytorch/translation/run_translation_no_trainer.py
examples/research_projects/README.md
examples/research_projects/adversarial/README.md
examples/research_projects/adversarial/requirements.txt
examples/research_projects/adversarial/run_hans.py
examples/research_projects/adversarial/utils_hans.py
examples/research_projects/bert-loses-patience/README.md
examples/research_projects/bert-loses-patience/requirements.txt
examples/research_projects/bert-loses-patience/run_glue_with_pabee.py
examples/research_projects/bert-loses-patience/test_run_glue_with_pabee.py
examples/research_projects/bert-loses-patience/pabee/__init__.py
examples/research_projects/bert-loses-patience/pabee/modeling_pabee_albert.py
examples/research_projects/bert-loses-patience/pabee/modeling_pabee_bert.py
examples/research_projects/bertabs/README.md
examples/research_projects/bertabs/__init__.py
examples/research_projects/bertabs/configuration_bertabs.py
examples/research_projects/bertabs/convert_bertabs_original_pytorch_checkpoint.py
examples/research_projects/bertabs/modeling_bertabs.py
examples/research_projects/bertabs/requirements.txt
examples/research_projects/bertabs/run_summarization.py
examples/research_projects/bertabs/test_utils_summarization.py
examples/research_projects/bertabs/utils_summarization.py
examples/research_projects/bertology/requirements.txt
examples/research_projects/bertology/run_bertology.py
examples/research_projects/bertology/run_prune_gpt.py
examples/research_projects/codeparrot/README.md
examples/research_projects/codeparrot/requirements.txt
examples/research_projects/codeparrot/scripts/arguments.py
examples/research_projects/codeparrot/scripts/bpe_training.py
examples/research_projects/codeparrot/scripts/codeparrot_training.py
examples/research_projects/codeparrot/scripts/human_eval.py
examples/research_projects/codeparrot/scripts/initialize_model.py
examples/research_projects/codeparrot/scripts/preprocessing.py
examples/research_projects/codeparrot/scripts/validation_loss.py
examples/research_projects/deebert/README.md
examples/research_projects/deebert/entropy_eval.sh
examples/research_projects/deebert/eval_deebert.sh
examples/research_projects/deebert/requirements.txt
examples/research_projects/deebert/run_glue_deebert.py
examples/research_projects/deebert/test_glue_deebert.py
examples/research_projects/deebert/train_deebert.sh
examples/research_projects/deebert/src/__init__.py
examples/research_projects/deebert/src/modeling_highway_bert.py
examples/research_projects/deebert/src/modeling_highway_roberta.py
examples/research_projects/distillation/README.md
examples/research_projects/distillation/distiller.py
examples/research_projects/distillation/grouped_batch_sampler.py
examples/research_projects/distillation/lm_seqs_dataset.py
examples/research_projects/distillation/requirements.txt
examples/research_projects/distillation/run_squad_w_distillation.py
examples/research_projects/distillation/train.py
examples/research_projects/distillation/utils.py
examples/research_projects/distillation/scripts/binarized_data.py
examples/research_projects/distillation/scripts/extract.py
examples/research_projects/distillation/scripts/extract_distilbert.py
examples/research_projects/distillation/scripts/token_counts.py
examples/research_projects/distillation/training_configs/distilbert-base-cased.json
examples/research_projects/distillation/training_configs/distilbert-base-multilingual-cased.json
examples/research_projects/distillation/training_configs/distilbert-base-uncased.json
examples/research_projects/distillation/training_configs/distilgpt2.json
examples/research_projects/distillation/training_configs/distilroberta-base.json
examples/research_projects/fsner/README.md
examples/research_projects/fsner/pyproject.toml
examples/research_projects/fsner/requirements.txt
examples/research_projects/fsner/setup.py
examples/research_projects/fsner/src/fsner/__init__.py
examples/research_projects/fsner/src/fsner/model.py
examples/research_projects/fsner/src/fsner/tokenizer_utils.py
examples/research_projects/jax-projects/HOW_TO_PROPOSE_PROJECT.md
examples/research_projects/jax-projects/README.md
examples/research_projects/jax-projects/big_bird/README.md
examples/research_projects/jax-projects/big_bird/bigbird_flax.py
examples/research_projects/jax-projects/big_bird/evaluate.py
examples/research_projects/jax-projects/big_bird/prepare_natural_questions.py
examples/research_projects/jax-projects/big_bird/requirements.txt
examples/research_projects/jax-projects/big_bird/sweep_flax.yaml
examples/research_projects/jax-projects/big_bird/train.py
examples/research_projects/jax-projects/dataset-streaming/README.md
examples/research_projects/jax-projects/dataset-streaming/run_mlm_flax_stream.py
examples/research_projects/jax-projects/hybrid_clip/README.md
examples/research_projects/jax-projects/hybrid_clip/configuration_hybrid_clip.py
examples/research_projects/jax-projects/hybrid_clip/modeling_hybrid_clip.py
examples/research_projects/jax-projects/hybrid_clip/requirements.txt
examples/research_projects/jax-projects/hybrid_clip/run_hybrid_clip.py
examples/research_projects/jax-projects/model_parallel/README.md
examples/research_projects/jax-projects/model_parallel/partitions.py
examples/research_projects/jax-projects/model_parallel/run_clm_mp.py
examples/research_projects/jax-projects/wav2vec2/README.md
examples/research_projects/jax-projects/wav2vec2/run_wav2vec2_pretrain_flax.py
examples/research_projects/longform-qa/README.md
examples/research_projects/longform-qa/eli5_app.py
examples/research_projects/longform-qa/eli5_utils.py
examples/research_projects/longform-qa/requirements.txt
examples/research_projects/lxmert/README.md
examples/research_projects/lxmert/demo.ipynb
examples/research_projects/lxmert/extracting_data.py
examples/research_projects/lxmert/modeling_frcnn.py
examples/research_projects/lxmert/processing_image.py
examples/research_projects/lxmert/requirements.txt
examples/research_projects/lxmert/utils.py
examples/research_projects/lxmert/visualizing_image.py
examples/research_projects/mlm_wwm/README.md
examples/research_projects/mlm_wwm/requirements.txt
examples/research_projects/mlm_wwm/run_chinese_ref.py
examples/research_projects/mlm_wwm/run_mlm_wwm.py
examples/research_projects/mm-imdb/README.md
examples/research_projects/mm-imdb/run_mmimdb.py
examples/research_projects/mm-imdb/utils_mmimdb.py
examples/research_projects/movement-pruning/README.md
examples/research_projects/movement-pruning/Saving_PruneBERT.ipynb
examples/research_projects/movement-pruning/bertarize.py
examples/research_projects/movement-pruning/counts_parameters.py
examples/research_projects/movement-pruning/masked_run_glue.py
examples/research_projects/movement-pruning/masked_run_squad.py
examples/research_projects/movement-pruning/requirements.txt
examples/research_projects/movement-pruning/emmental/__init__.py
examples/research_projects/movement-pruning/emmental/configuration_bert_masked.py
examples/research_projects/movement-pruning/emmental/modeling_bert_masked.py
examples/research_projects/movement-pruning/emmental/modules/__init__.py
examples/research_projects/movement-pruning/emmental/modules/binarizer.py
examples/research_projects/movement-pruning/emmental/modules/masked_nn.py
examples/research_projects/performer/README.md
examples/research_projects/performer/full_script.sh
examples/research_projects/performer/modeling_flax_performer.py
examples/research_projects/performer/modeling_flax_performer_utils.py
examples/research_projects/performer/run_mlm_performer.py
examples/research_projects/performer/sanity_script.sh
examples/research_projects/pplm/README.md
examples/research_projects/pplm/pplm_classification_head.py
examples/research_projects/pplm/requirements.txt
examples/research_projects/pplm/run_pplm.py
examples/research_projects/pplm/run_pplm_discrim_train.py
examples/research_projects/pplm/imgs/headfigure.png
examples/research_projects/pplm/imgs/wooly.png
examples/research_projects/quantization-qdqbert/Dockerfile
examples/research_projects/quantization-qdqbert/README.md
examples/research_projects/quantization-qdqbert/evaluate-hf-trt-qa.py
examples/research_projects/quantization-qdqbert/quant_trainer.py
examples/research_projects/quantization-qdqbert/run_quant_qa.py
examples/research_projects/quantization-qdqbert/trainer_quant_qa.py
examples/research_projects/quantization-qdqbert/utils_qa.py
examples/research_projects/rag/README.md
examples/research_projects/rag/__init__.py
examples/research_projects/rag/_test_finetune_rag.py
examples/research_projects/rag/callbacks_rag.py
examples/research_projects/rag/consolidate_rag_checkpoint.py
examples/research_projects/rag/distributed_pytorch_retriever.py
examples/research_projects/rag/distributed_ray_retriever.py
examples/research_projects/rag/eval_rag.py
examples/research_projects/rag/finetune_rag.py
examples/research_projects/rag/finetune_rag.sh
examples/research_projects/rag/finetune_rag_ray.sh
examples/research_projects/rag/lightning_base.py
examples/research_projects/rag/parse_dpr_relevance_data.py
examples/research_projects/rag/requirements.txt
examples/research_projects/rag/test_distributed_retriever.py
examples/research_projects/rag/use_own_knowledge_dataset.py
examples/research_projects/rag/utils_rag.py
examples/research_projects/rag-end2end-retriever/README.md
examples/research_projects/rag-end2end-retriever/callbacks_rag.py
examples/research_projects/rag-end2end-retriever/distributed_ray_retriever.py
examples/research_projects/rag-end2end-retriever/eval_rag.py
examples/research_projects/rag-end2end-retriever/finetune_rag.py
examples/research_projects/rag-end2end-retriever/finetune_rag_ray_end2end.sh
examples/research_projects/rag-end2end-retriever/kb_encode_utils.py
examples/research_projects/rag-end2end-retriever/lightning_base.py
examples/research_projects/rag-end2end-retriever/requirements.txt
examples/research_projects/rag-end2end-retriever/use_own_knowledge_dataset.py
examples/research_projects/rag-end2end-retriever/utils_rag.py
examples/research_projects/rag-end2end-retriever/test_run/test_finetune.sh
examples/research_projects/rag-end2end-retriever/test_run/test_rag_new_features.sh
examples/research_projects/rag-end2end-retriever/test_run/dummy-kb/my_knowledge_dataset.csv
examples/research_projects/rag-end2end-retriever/test_run/dummy-train-data/train.source
examples/research_projects/rag-end2end-retriever/test_run/dummy-train-data/train.target
examples/research_projects/rag-end2end-retriever/test_run/dummy-train-data/val.source
examples/research_projects/rag-end2end-retriever/test_run/dummy-train-data/val.target
examples/research_projects/rag/test_data/my_knowledge_dataset.csv
examples/research_projects/seq2seq-distillation/README.md
examples/research_projects/seq2seq-distillation/_test_bash_script.py
examples/research_projects/seq2seq-distillation/_test_make_student.py
examples/research_projects/seq2seq-distillation/_test_seq2seq_examples.py
examples/research_projects/seq2seq-distillation/_test_seq2seq_examples_multi_gpu.py
examples/research_projects/seq2seq-distillation/callbacks.py
examples/research_projects/seq2seq-distillation/convert_pl_checkpoint_to_hf.py
examples/research_projects/seq2seq-distillation/distil_marian_enro_teacher.sh
examples/research_projects/seq2seq-distillation/distil_marian_no_teacher.sh
examples/research_projects/seq2seq-distillation/distillation.py
examples/research_projects/seq2seq-distillation/dynamic_bs_example.sh
examples/research_projects/seq2seq-distillation/finetune.py
examples/research_projects/seq2seq-distillation/finetune.sh
examples/research_projects/seq2seq-distillation/finetune_bart_tiny.sh
examples/research_projects/seq2seq-distillation/finetune_pegasus_xsum.sh
examples/research_projects/seq2seq-distillation/finetune_t5.sh
examples/research_projects/seq2seq-distillation/lightning_base.py
examples/research_projects/seq2seq-distillation/make_student.py
examples/research_projects/seq2seq-distillation/precomputed_pseudo_labels.md
examples/research_projects/seq2seq-distillation/requirements.txt
examples/research_projects/seq2seq-distillation/run_eval.py
examples/research_projects/seq2seq-distillation/sentence_splitter.py
examples/research_projects/seq2seq-distillation/train_distilbart_cnn.sh
examples/research_projects/seq2seq-distillation/train_distilbart_xsum.sh
examples/research_projects/seq2seq-distillation/train_mbart_cc25_enro.sh
examples/research_projects/seq2seq-distillation/utils.py
examples/research_projects/visual_bert/README.md
examples/research_projects/visual_bert/demo.ipynb
examples/research_projects/visual_bert/extracting_data.py
examples/research_projects/visual_bert/modeling_frcnn.py
examples/research_projects/visual_bert/processing_image.py
examples/research_projects/visual_bert/requirements.txt
examples/research_projects/visual_bert/utils.py
examples/research_projects/visual_bert/visualizing_image.py
examples/research_projects/wav2vec2/FINE_TUNE_XLSR_WAV2VEC2.md
examples/research_projects/wav2vec2/README.md
examples/research_projects/wav2vec2/ds_config_wav2vec2_zero2.json
examples/research_projects/wav2vec2/ds_config_wav2vec2_zero3.json
examples/research_projects/wav2vec2/finetune_base_100.sh
examples/research_projects/wav2vec2/finetune_base_timit_asr.sh
examples/research_projects/wav2vec2/finetune_large_lv60_100.sh
examples/research_projects/wav2vec2/finetune_large_lv60_timit_asr.sh
examples/research_projects/wav2vec2/finetune_large_xlsr_53_arabic_speech_corpus.sh
examples/research_projects/wav2vec2/finetune_wav2vec2_xlsr_turkish.sh
examples/research_projects/wav2vec2/requirements.txt
examples/research_projects/wav2vec2/run_asr.py
examples/research_projects/wav2vec2/run_common_voice.py
examples/research_projects/wav2vec2/run_pretrain.py
examples/research_projects/wav2vec2/test_wav2vec2_deepspeed.py
examples/research_projects/wav2vec2/vocab/buckwalter.json
examples/research_projects/zero-shot-distillation/README.md
examples/research_projects/zero-shot-distillation/distill_classifier.py
examples/tensorflow/README.md
examples/tensorflow/benchmarking/README.md
examples/tensorflow/benchmarking/plot_csv_file.py
examples/tensorflow/benchmarking/requirements.txt
examples/tensorflow/benchmarking/run_benchmark_tf.py
examples/tensorflow/language-modeling/README.md
examples/tensorflow/language-modeling/requirements.txt
examples/tensorflow/language-modeling/run_clm.py
examples/tensorflow/language-modeling/run_mlm.py
examples/tensorflow/multiple-choice/README.md
examples/tensorflow/multiple-choice/requirements.txt
examples/tensorflow/multiple-choice/run_swag.py
examples/tensorflow/question-answering/README.md
examples/tensorflow/question-answering/requirements.txt
examples/tensorflow/question-answering/run_qa.py
examples/tensorflow/question-answering/utils_qa.py
examples/tensorflow/summarization/README.md
examples/tensorflow/summarization/run_summarization.py
examples/tensorflow/text-classification/README.md
examples/tensorflow/text-classification/requirements.txt
examples/tensorflow/text-classification/run_glue.py
examples/tensorflow/text-classification/run_text_classification.py
examples/tensorflow/token-classification/README.md
examples/tensorflow/token-classification/run_ner.py
examples/tensorflow/translation/README.md
examples/tensorflow/translation/run_translation.py
model_cards/README.md
notebooks/README.md
scripts/check_tokenizers.py
scripts/stale.py
scripts/fsmt/convert-allenai-wmt16.sh
scripts/fsmt/convert-allenai-wmt19.sh
scripts/fsmt/convert-facebook-wmt19.sh
scripts/fsmt/eval-allenai-wmt16.sh
scripts/fsmt/eval-allenai-wmt19.sh
scripts/fsmt/eval-facebook-wmt19.sh
scripts/fsmt/fsmt-make-super-tiny-model.py
scripts/fsmt/fsmt-make-tiny-model.py
scripts/fsmt/gen-card-allenai-wmt16.py
scripts/fsmt/gen-card-allenai-wmt19.py
scripts/fsmt/gen-card-facebook-wmt19.py
scripts/fsmt/s3-move.sh
scripts/fsmt/tests-to-run.sh
scripts/pegasus/build_test_sample_spm_no_bos.py
scripts/tatoeba/README.md
scripts/tatoeba/upload_models.sh
src/transformers/__init__.py
src/transformers/activations.py
src/transformers/activations_tf.py
src/transformers/configuration_utils.py
src/transformers/convert_graph_to_onnx.py
src/transformers/convert_pytorch_checkpoint_to_tf2.py
src/transformers/convert_slow_tokenizer.py
src/transformers/convert_slow_tokenizers_checkpoints_to_fast.py
src/transformers/convert_tf_hub_seq_to_seq_bert_to_pytorch.py
src/transformers/debug_utils.py
src/transformers/deepspeed.py
src/transformers/dependency_versions_check.py
src/transformers/dependency_versions_table.py
src/transformers/feature_extraction_sequence_utils.py
src/transformers/feature_extraction_utils.py
src/transformers/file_utils.py
src/transformers/generation_beam_search.py
src/transformers/generation_flax_logits_process.py
src/transformers/generation_flax_utils.py
src/transformers/generation_logits_process.py
src/transformers/generation_stopping_criteria.py
src/transformers/generation_tf_utils.py
src/transformers/generation_utils.py
src/transformers/hf_argparser.py
src/transformers/image_utils.py
src/transformers/integrations.py
src/transformers/keras_callbacks.py
src/transformers/modelcard.py
src/transformers/modeling_flax_outputs.py
src/transformers/modeling_flax_pytorch_utils.py
src/transformers/modeling_flax_utils.py
src/transformers/modeling_outputs.py
src/transformers/modeling_tf_outputs.py
src/transformers/modeling_tf_pytorch_utils.py
src/transformers/modeling_tf_utils.py
src/transformers/modeling_utils.py
src/transformers/optimization.py
src/transformers/optimization_tf.py
src/transformers/py.typed
src/transformers/testing_utils.py
src/transformers/tokenization_utils.py
src/transformers/tokenization_utils_base.py
src/transformers/tokenization_utils_fast.py
src/transformers/trainer.py
src/transformers/trainer_callback.py
src/transformers/trainer_pt_utils.py
src/transformers/trainer_seq2seq.py
src/transformers/trainer_tf.py
src/transformers/trainer_utils.py
src/transformers/training_args.py
src/transformers/training_args_seq2seq.py
src/transformers/training_args_tf.py
src/transformers.egg-info/PKG-INFO
src/transformers.egg-info/SOURCES.txt
src/transformers.egg-info/dependency_links.txt
src/transformers.egg-info/entry_points.txt
src/transformers.egg-info/not-zip-safe
src/transformers.egg-info/requires.txt
src/transformers.egg-info/top_level.txt
src/transformers/benchmark/__init__.py
src/transformers/benchmark/benchmark.py
src/transformers/benchmark/benchmark_args.py
src/transformers/benchmark/benchmark_args_tf.py
src/transformers/benchmark/benchmark_args_utils.py
src/transformers/benchmark/benchmark_tf.py
src/transformers/benchmark/benchmark_utils.py
src/transformers/commands/__init__.py
src/transformers/commands/add_new_model.py
src/transformers/commands/convert.py
src/transformers/commands/download.py
src/transformers/commands/env.py
src/transformers/commands/lfs.py
src/transformers/commands/run.py
src/transformers/commands/serving.py
src/transformers/commands/train.py
src/transformers/commands/transformers_cli.py
src/transformers/commands/user.py
src/transformers/data/__init__.py
src/transformers/data/data_collator.py
src/transformers/data/test_generation_utils.py
src/transformers/data/datasets/__init__.py
src/transformers/data/datasets/glue.py
src/transformers/data/datasets/language_modeling.py
src/transformers/data/datasets/squad.py
src/transformers/data/metrics/__init__.py
src/transformers/data/metrics/squad_metrics.py
src/transformers/data/processors/__init__.py
src/transformers/data/processors/glue.py
src/transformers/data/processors/squad.py
src/transformers/data/processors/utils.py
src/transformers/data/processors/xnli.py
src/transformers/models/__init__.py
src/transformers/models/albert/__init__.py
src/transformers/models/albert/configuration_albert.py
src/transformers/models/albert/convert_albert_original_tf_checkpoint_to_pytorch.py
src/transformers/models/albert/modeling_albert.py
src/transformers/models/albert/modeling_flax_albert.py
src/transformers/models/albert/modeling_tf_albert.py
src/transformers/models/albert/tokenization_albert.py
src/transformers/models/albert/tokenization_albert_fast.py
src/transformers/models/auto/__init__.py
src/transformers/models/auto/auto_factory.py
src/transformers/models/auto/configuration_auto.py
src/transformers/models/auto/dynamic.py
src/transformers/models/auto/feature_extraction_auto.py
src/transformers/models/auto/modeling_auto.py
src/transformers/models/auto/modeling_flax_auto.py
src/transformers/models/auto/modeling_tf_auto.py
src/transformers/models/auto/processing_auto.py
src/transformers/models/auto/tokenization_auto.py
src/transformers/models/bart/__init__.py
src/transformers/models/bart/configuration_bart.py
src/transformers/models/bart/convert_bart_original_pytorch_checkpoint_to_pytorch.py
src/transformers/models/bart/modeling_bart.py
src/transformers/models/bart/modeling_flax_bart.py
src/transformers/models/bart/modeling_tf_bart.py
src/transformers/models/bart/tokenization_bart.py
src/transformers/models/bart/tokenization_bart_fast.py
src/transformers/models/barthez/__init__.py
src/transformers/models/barthez/tokenization_barthez.py
src/transformers/models/barthez/tokenization_barthez_fast.py
src/transformers/models/bartpho/__init__.py
src/transformers/models/bartpho/tokenization_bartpho.py
src/transformers/models/beit/__init__.py
src/transformers/models/beit/configuration_beit.py
src/transformers/models/beit/convert_beit_unilm_to_pytorch.py
src/transformers/models/beit/feature_extraction_beit.py
src/transformers/models/beit/modeling_beit.py
src/transformers/models/beit/modeling_flax_beit.py
src/transformers/models/bert/__init__.py
src/transformers/models/bert/configuration_bert.py
src/transformers/models/bert/convert_bert_original_tf2_checkpoint_to_pytorch.py
src/transformers/models/bert/convert_bert_original_tf_checkpoint_to_pytorch.py
src/transformers/models/bert/convert_bert_pytorch_checkpoint_to_original_tf.py
src/transformers/models/bert/modeling_bert.py
src/transformers/models/bert/modeling_flax_bert.py
src/transformers/models/bert/modeling_tf_bert.py
src/transformers/models/bert/tokenization_bert.py
src/transformers/models/bert/tokenization_bert_fast.py
src/transformers/models/bert_generation/__init__.py
src/transformers/models/bert_generation/configuration_bert_generation.py
src/transformers/models/bert_generation/modeling_bert_generation.py
src/transformers/models/bert_generation/tokenization_bert_generation.py
src/transformers/models/bert_japanese/__init__.py
src/transformers/models/bert_japanese/tokenization_bert_japanese.py
src/transformers/models/bertweet/__init__.py
src/transformers/models/bertweet/tokenization_bertweet.py
src/transformers/models/big_bird/__init__.py
src/transformers/models/big_bird/configuration_big_bird.py
src/transformers/models/big_bird/convert_bigbird_original_tf_checkpoint_to_pytorch.py
src/transformers/models/big_bird/modeling_big_bird.py
src/transformers/models/big_bird/modeling_flax_big_bird.py
src/transformers/models/big_bird/tokenization_big_bird.py
src/transformers/models/big_bird/tokenization_big_bird_fast.py
src/transformers/models/bigbird_pegasus/__init__.py
src/transformers/models/bigbird_pegasus/configuration_bigbird_pegasus.py
src/transformers/models/bigbird_pegasus/convert_bigbird_pegasus_tf_to_pytorch.py
src/transformers/models/bigbird_pegasus/modeling_bigbird_pegasus.py
src/transformers/models/blenderbot/__init__.py
src/transformers/models/blenderbot/configuration_blenderbot.py
src/transformers/models/blenderbot/convert_blenderbot_original_pytorch_checkpoint_to_pytorch.py
src/transformers/models/blenderbot/modeling_blenderbot.py
src/transformers/models/blenderbot/modeling_flax_blenderbot.py
src/transformers/models/blenderbot/modeling_tf_blenderbot.py
src/transformers/models/blenderbot/tokenization_blenderbot.py
src/transformers/models/blenderbot/tokenization_blenderbot_fast.py
src/transformers/models/blenderbot_small/__init__.py
src/transformers/models/blenderbot_small/configuration_blenderbot_small.py
src/transformers/models/blenderbot_small/modeling_blenderbot_small.py
src/transformers/models/blenderbot_small/modeling_flax_blenderbot_small.py
src/transformers/models/blenderbot_small/modeling_tf_blenderbot_small.py
src/transformers/models/blenderbot_small/tokenization_blenderbot_small.py
src/transformers/models/blenderbot_small/tokenization_blenderbot_small_fast.py
src/transformers/models/bort/convert_bort_original_gluonnlp_checkpoint_to_pytorch.py
src/transformers/models/byt5/__init__.py
src/transformers/models/byt5/convert_byt5_original_tf_checkpoint_to_pytorch.py
src/transformers/models/byt5/tokenization_byt5.py
src/transformers/models/camembert/__init__.py
src/transformers/models/camembert/configuration_camembert.py
src/transformers/models/camembert/modeling_camembert.py
src/transformers/models/camembert/modeling_tf_camembert.py
src/transformers/models/camembert/tokenization_camembert.py
src/transformers/models/camembert/tokenization_camembert_fast.py
src/transformers/models/canine/__init__.py
src/transformers/models/canine/configuration_canine.py
src/transformers/models/canine/convert_canine_original_tf_checkpoint_to_pytorch.py
src/transformers/models/canine/modeling_canine.py
src/transformers/models/canine/tokenization_canine.py
src/transformers/models/clip/__init__.py
src/transformers/models/clip/configuration_clip.py
src/transformers/models/clip/convert_clip_original_pytorch_to_hf.py
src/transformers/models/clip/feature_extraction_clip.py
src/transformers/models/clip/modeling_clip.py
src/transformers/models/clip/modeling_flax_clip.py
src/transformers/models/clip/processing_clip.py
src/transformers/models/clip/tokenization_clip.py
src/transformers/models/clip/tokenization_clip_fast.py
src/transformers/models/convbert/__init__.py
src/transformers/models/convbert/configuration_convbert.py
src/transformers/models/convbert/convert_convbert_original_tf1_checkpoint_to_pytorch_and_tf2.py
src/transformers/models/convbert/modeling_convbert.py
src/transformers/models/convbert/modeling_tf_convbert.py
src/transformers/models/convbert/tokenization_convbert.py
src/transformers/models/convbert/tokenization_convbert_fast.py
src/transformers/models/cpm/__init__.py
src/transformers/models/cpm/tokenization_cpm.py
src/transformers/models/cpm/tokenization_cpm_fast.py
src/transformers/models/ctrl/__init__.py
src/transformers/models/ctrl/configuration_ctrl.py
src/transformers/models/ctrl/modeling_ctrl.py
src/transformers/models/ctrl/modeling_tf_ctrl.py
src/transformers/models/ctrl/tokenization_ctrl.py
src/transformers/models/deberta/__init__.py
src/transformers/models/deberta/configuration_deberta.py
src/transformers/models/deberta/modeling_deberta.py
src/transformers/models/deberta/modeling_tf_deberta.py
src/transformers/models/deberta/tokenization_deberta.py
src/transformers/models/deberta/tokenization_deberta_fast.py
src/transformers/models/deberta_v2/__init__.py
src/transformers/models/deberta_v2/configuration_deberta_v2.py
src/transformers/models/deberta_v2/modeling_deberta_v2.py
src/transformers/models/deberta_v2/modeling_tf_deberta_v2.py
src/transformers/models/deberta_v2/tokenization_deberta_v2.py
src/transformers/models/deit/__init__.py
src/transformers/models/deit/configuration_deit.py
src/transformers/models/deit/convert_deit_timm_to_pytorch.py
src/transformers/models/deit/feature_extraction_deit.py
src/transformers/models/deit/modeling_deit.py
src/transformers/models/detr/__init__.py
src/transformers/models/detr/configuration_detr.py
src/transformers/models/detr/convert_detr_original_pytorch_checkpoint_to_pytorch.py
src/transformers/models/detr/feature_extraction_detr.py
src/transformers/models/detr/modeling_detr.py
src/transformers/models/dialogpt/__init__.py
src/transformers/models/dialogpt/convert_dialogpt_original_pytorch_checkpoint_to_pytorch.py
src/transformers/models/distilbert/__init__.py
src/transformers/models/distilbert/configuration_distilbert.py
src/transformers/models/distilbert/modeling_distilbert.py
src/transformers/models/distilbert/modeling_flax_distilbert.py
src/transformers/models/distilbert/modeling_tf_distilbert.py
src/transformers/models/distilbert/tokenization_distilbert.py
src/transformers/models/distilbert/tokenization_distilbert_fast.py
src/transformers/models/dpr/__init__.py
src/transformers/models/dpr/configuration_dpr.py
src/transformers/models/dpr/convert_dpr_original_checkpoint_to_pytorch.py
src/transformers/models/dpr/modeling_dpr.py
src/transformers/models/dpr/modeling_tf_dpr.py
src/transformers/models/dpr/tokenization_dpr.py
src/transformers/models/dpr/tokenization_dpr_fast.py
src/transformers/models/electra/__init__.py
src/transformers/models/electra/configuration_electra.py
src/transformers/models/electra/convert_electra_original_tf_checkpoint_to_pytorch.py
src/transformers/models/electra/modeling_electra.py
src/transformers/models/electra/modeling_flax_electra.py
src/transformers/models/electra/modeling_tf_electra.py
src/transformers/models/electra/tokenization_electra.py
src/transformers/models/electra/tokenization_electra_fast.py
src/transformers/models/encoder_decoder/__init__.py
src/transformers/models/encoder_decoder/configuration_encoder_decoder.py
src/transformers/models/encoder_decoder/modeling_encoder_decoder.py
src/transformers/models/encoder_decoder/modeling_flax_encoder_decoder.py
src/transformers/models/encoder_decoder/modeling_tf_encoder_decoder.py
src/transformers/models/flaubert/__init__.py
src/transformers/models/flaubert/configuration_flaubert.py
src/transformers/models/flaubert/modeling_flaubert.py
src/transformers/models/flaubert/modeling_tf_flaubert.py
src/transformers/models/flaubert/tokenization_flaubert.py
src/transformers/models/fnet/__init__.py
src/transformers/models/fnet/configuration_fnet.py
src/transformers/models/fnet/convert_fnet_original_flax_checkpoint_to_pytorch.py
src/transformers/models/fnet/modeling_fnet.py
src/transformers/models/fnet/tokenization_fnet.py
src/transformers/models/fnet/tokenization_fnet_fast.py
src/transformers/models/fsmt/__init__.py
src/transformers/models/fsmt/configuration_fsmt.py
src/transformers/models/fsmt/convert_fsmt_original_pytorch_checkpoint_to_pytorch.py
src/transformers/models/fsmt/modeling_fsmt.py
src/transformers/models/fsmt/tokenization_fsmt.py
src/transformers/models/funnel/__init__.py
src/transformers/models/funnel/configuration_funnel.py
src/transformers/models/funnel/convert_funnel_original_tf_checkpoint_to_pytorch.py
src/transformers/models/funnel/modeling_funnel.py
src/transformers/models/funnel/modeling_tf_funnel.py
src/transformers/models/funnel/tokenization_funnel.py
src/transformers/models/funnel/tokenization_funnel_fast.py
src/transformers/models/gpt2/__init__.py
src/transformers/models/gpt2/configuration_gpt2.py
src/transformers/models/gpt2/convert_gpt2_original_tf_checkpoint_to_pytorch.py
src/transformers/models/gpt2/modeling_flax_gpt2.py
src/transformers/models/gpt2/modeling_gpt2.py
src/transformers/models/gpt2/modeling_tf_gpt2.py
src/transformers/models/gpt2/tokenization_gpt2.py
src/transformers/models/gpt2/tokenization_gpt2_fast.py
src/transformers/models/gpt_neo/__init__.py
src/transformers/models/gpt_neo/configuration_gpt_neo.py
src/transformers/models/gpt_neo/convert_gpt_neo_mesh_tf_to_pytorch.py
src/transformers/models/gpt_neo/modeling_flax_gpt_neo.py
src/transformers/models/gpt_neo/modeling_gpt_neo.py
src/transformers/models/gptj/__init__.py
src/transformers/models/gptj/configuration_gptj.py
src/transformers/models/gptj/modeling_flax_gptj.py
src/transformers/models/gptj/modeling_gptj.py
src/transformers/models/herbert/__init__.py
src/transformers/models/herbert/tokenization_herbert.py
src/transformers/models/herbert/tokenization_herbert_fast.py
src/transformers/models/hubert/__init__.py
src/transformers/models/hubert/configuration_hubert.py
src/transformers/models/hubert/convert_distilhubert_original_s3prl_checkpoint_to_pytorch.py
src/transformers/models/hubert/convert_hubert_original_pytorch_checkpoint_to_pytorch.py
src/transformers/models/hubert/convert_hubert_original_s3prl_checkpoint_to_pytorch.py
src/transformers/models/hubert/modeling_hubert.py
src/transformers/models/hubert/modeling_tf_hubert.py
src/transformers/models/ibert/__init__.py
src/transformers/models/ibert/configuration_ibert.py
src/transformers/models/ibert/modeling_ibert.py
src/transformers/models/ibert/quant_modules.py
src/transformers/models/imagegpt/__init__.py
src/transformers/models/imagegpt/configuration_imagegpt.py
src/transformers/models/imagegpt/convert_imagegpt_original_tf2_to_pytorch.py
src/transformers/models/imagegpt/feature_extraction_imagegpt.py
src/transformers/models/imagegpt/modeling_imagegpt.py
src/transformers/models/layoutlm/__init__.py
src/transformers/models/layoutlm/configuration_layoutlm.py
src/transformers/models/layoutlm/modeling_layoutlm.py
src/transformers/models/layoutlm/modeling_tf_layoutlm.py
src/transformers/models/layoutlm/tokenization_layoutlm.py
src/transformers/models/layoutlm/tokenization_layoutlm_fast.py
src/transformers/models/layoutlmv2/__init__.py
src/transformers/models/layoutlmv2/configuration_layoutlmv2.py
src/transformers/models/layoutlmv2/feature_extraction_layoutlmv2.py
src/transformers/models/layoutlmv2/modeling_layoutlmv2.py
src/transformers/models/layoutlmv2/processing_layoutlmv2.py
src/transformers/models/layoutlmv2/tokenization_layoutlmv2.py
src/transformers/models/layoutlmv2/tokenization_layoutlmv2_fast.py
src/transformers/models/layoutxlm/__init__.py
src/transformers/models/layoutxlm/processing_layoutxlm.py
src/transformers/models/layoutxlm/tokenization_layoutxlm.py
src/transformers/models/layoutxlm/tokenization_layoutxlm_fast.py
src/transformers/models/led/__init__.py
src/transformers/models/led/configuration_led.py
src/transformers/models/led/modeling_led.py
src/transformers/models/led/modeling_tf_led.py
src/transformers/models/led/tokenization_led.py
src/transformers/models/led/tokenization_led_fast.py
src/transformers/models/longformer/__init__.py
src/transformers/models/longformer/configuration_longformer.py
src/transformers/models/longformer/convert_longformer_original_pytorch_lightning_to_pytorch.py
src/transformers/models/longformer/modeling_longformer.py
src/transformers/models/longformer/modeling_tf_longformer.py
src/transformers/models/longformer/tokenization_longformer.py
src/transformers/models/longformer/tokenization_longformer_fast.py
src/transformers/models/luke/__init__.py
src/transformers/models/luke/configuration_luke.py
src/transformers/models/luke/convert_luke_original_pytorch_checkpoint_to_pytorch.py
src/transformers/models/luke/modeling_luke.py
src/transformers/models/luke/tokenization_luke.py
src/transformers/models/lxmert/__init__.py
src/transformers/models/lxmert/configuration_lxmert.py
src/transformers/models/lxmert/convert_lxmert_original_tf_checkpoint_to_pytorch.py
src/transformers/models/lxmert/modeling_lxmert.py
src/transformers/models/lxmert/modeling_tf_lxmert.py
src/transformers/models/lxmert/tokenization_lxmert.py
src/transformers/models/lxmert/tokenization_lxmert_fast.py
src/transformers/models/m2m_100/__init__.py
src/transformers/models/m2m_100/configuration_m2m_100.py
src/transformers/models/m2m_100/convert_m2m100_original_checkpoint_to_pytorch.py
src/transformers/models/m2m_100/modeling_m2m_100.py
src/transformers/models/m2m_100/tokenization_m2m_100.py
src/transformers/models/marian/__init__.py
src/transformers/models/marian/configuration_marian.py
src/transformers/models/marian/convert_marian_tatoeba_to_pytorch.py
src/transformers/models/marian/convert_marian_to_pytorch.py
src/transformers/models/marian/modeling_flax_marian.py
src/transformers/models/marian/modeling_marian.py
src/transformers/models/marian/modeling_tf_marian.py
src/transformers/models/marian/tokenization_marian.py
src/transformers/models/mbart/__init__.py
src/transformers/models/mbart/configuration_mbart.py
src/transformers/models/mbart/convert_mbart_original_checkpoint_to_pytorch.py
src/transformers/models/mbart/modeling_flax_mbart.py
src/transformers/models/mbart/modeling_mbart.py
src/transformers/models/mbart/modeling_tf_mbart.py
src/transformers/models/mbart/tokenization_mbart.py
src/transformers/models/mbart/tokenization_mbart_fast.py
src/transformers/models/mbart50/__init__.py
src/transformers/models/mbart50/tokenization_mbart50.py
src/transformers/models/mbart50/tokenization_mbart50_fast.py
src/transformers/models/megatron_bert/__init__.py
src/transformers/models/megatron_bert/configuration_megatron_bert.py
src/transformers/models/megatron_bert/convert_megatron_bert_checkpoint.py
src/transformers/models/megatron_bert/modeling_megatron_bert.py
src/transformers/models/megatron_gpt2/__init__.py
src/transformers/models/megatron_gpt2/convert_megatron_gpt2_checkpoint.py
src/transformers/models/mluke/__init__.py
src/transformers/models/mluke/convert_mluke_original_pytorch_checkpoint_to_pytorch.py
src/transformers/models/mluke/tokenization_mluke.py
src/transformers/models/mmbt/__init__.py
src/transformers/models/mmbt/configuration_mmbt.py
src/transformers/models/mmbt/modeling_mmbt.py
src/transformers/models/mobilebert/__init__.py
src/transformers/models/mobilebert/configuration_mobilebert.py
src/transformers/models/mobilebert/convert_mobilebert_original_tf_checkpoint_to_pytorch.py
src/transformers/models/mobilebert/modeling_mobilebert.py
src/transformers/models/mobilebert/modeling_tf_mobilebert.py
src/transformers/models/mobilebert/tokenization_mobilebert.py
src/transformers/models/mobilebert/tokenization_mobilebert_fast.py
src/transformers/models/mpnet/__init__.py
src/transformers/models/mpnet/configuration_mpnet.py
src/transformers/models/mpnet/modeling_mpnet.py
src/transformers/models/mpnet/modeling_tf_mpnet.py
src/transformers/models/mpnet/tokenization_mpnet.py
src/transformers/models/mpnet/tokenization_mpnet_fast.py
src/transformers/models/mt5/__init__.py
src/transformers/models/mt5/configuration_mt5.py
src/transformers/models/mt5/modeling_flax_mt5.py
src/transformers/models/mt5/modeling_mt5.py
src/transformers/models/mt5/modeling_tf_mt5.py
src/transformers/models/openai/__init__.py
src/transformers/models/openai/configuration_openai.py
src/transformers/models/openai/convert_openai_original_tf_checkpoint_to_pytorch.py
src/transformers/models/openai/modeling_openai.py
src/transformers/models/openai/modeling_tf_openai.py
src/transformers/models/openai/tokenization_openai.py
src/transformers/models/openai/tokenization_openai_fast.py
src/transformers/models/pegasus/__init__.py
src/transformers/models/pegasus/configuration_pegasus.py
src/transformers/models/pegasus/convert_pegasus_tf_to_pytorch.py
src/transformers/models/pegasus/modeling_flax_pegasus.py
src/transformers/models/pegasus/modeling_pegasus.py
src/transformers/models/pegasus/modeling_tf_pegasus.py
src/transformers/models/pegasus/tokenization_pegasus.py
src/transformers/models/pegasus/tokenization_pegasus_fast.py
src/transformers/models/perceiver/__init__.py
src/transformers/models/perceiver/configuration_perceiver.py
src/transformers/models/perceiver/convert_perceiver_haiku_to_pytorch.py
src/transformers/models/perceiver/feature_extraction_perceiver.py
src/transformers/models/perceiver/modeling_perceiver.py
src/transformers/models/perceiver/tokenization_perceiver.py
src/transformers/models/phobert/__init__.py
src/transformers/models/phobert/tokenization_phobert.py
src/transformers/models/prophetnet/__init__.py
src/transformers/models/prophetnet/configuration_prophetnet.py
src/transformers/models/prophetnet/convert_prophetnet_original_pytorch_checkpoint_to_pytorch.py
src/transformers/models/prophetnet/modeling_prophetnet.py
src/transformers/models/prophetnet/tokenization_prophetnet.py
src/transformers/models/qdqbert/__init__.py
src/transformers/models/qdqbert/configuration_qdqbert.py
src/transformers/models/qdqbert/modeling_qdqbert.py
src/transformers/models/rag/__init__.py
src/transformers/models/rag/configuration_rag.py
src/transformers/models/rag/modeling_rag.py
src/transformers/models/rag/modeling_tf_rag.py
src/transformers/models/rag/retrieval_rag.py
src/transformers/models/rag/tokenization_rag.py
src/transformers/models/reformer/__init__.py
src/transformers/models/reformer/configuration_reformer.py
src/transformers/models/reformer/convert_reformer_trax_checkpoint_to_pytorch.py
src/transformers/models/reformer/modeling_reformer.py
src/transformers/models/reformer/tokenization_reformer.py
src/transformers/models/reformer/tokenization_reformer_fast.py
src/transformers/models/rembert/__init__.py
src/transformers/models/rembert/configuration_rembert.py
src/transformers/models/rembert/convert_rembert_tf_checkpoint_to_pytorch.py
src/transformers/models/rembert/modeling_rembert.py
src/transformers/models/rembert/modeling_tf_rembert.py
src/transformers/models/rembert/tokenization_rembert.py
src/transformers/models/rembert/tokenization_rembert_fast.py
src/transformers/models/retribert/__init__.py
src/transformers/models/retribert/configuration_retribert.py
src/transformers/models/retribert/modeling_retribert.py
src/transformers/models/retribert/tokenization_retribert.py
src/transformers/models/retribert/tokenization_retribert_fast.py
src/transformers/models/roberta/__init__.py
src/transformers/models/roberta/configuration_roberta.py
src/transformers/models/roberta/convert_roberta_original_pytorch_checkpoint_to_pytorch.py
src/transformers/models/roberta/modeling_flax_roberta.py
src/transformers/models/roberta/modeling_roberta.py
src/transformers/models/roberta/modeling_tf_roberta.py
src/transformers/models/roberta/tokenization_roberta.py
src/transformers/models/roberta/tokenization_roberta_fast.py
src/transformers/models/roformer/__init__.py
src/transformers/models/roformer/configuration_roformer.py
src/transformers/models/roformer/convert_roformer_original_tf_checkpoint_to_pytorch.py
src/transformers/models/roformer/modeling_roformer.py
src/transformers/models/roformer/modeling_tf_roformer.py
src/transformers/models/roformer/tokenization_roformer.py
src/transformers/models/roformer/tokenization_roformer_fast.py
src/transformers/models/roformer/tokenization_utils.py
src/transformers/models/segformer/__init__.py
src/transformers/models/segformer/configuration_segformer.py
src/transformers/models/segformer/convert_segformer_original_to_pytorch.py
src/transformers/models/segformer/feature_extraction_segformer.py
src/transformers/models/segformer/modeling_segformer.py
src/transformers/models/sew/__init__.py
src/transformers/models/sew/configuration_sew.py
src/transformers/models/sew/convert_sew_original_pytorch_checkpoint_to_pytorch.py
src/transformers/models/sew/modeling_sew.py
src/transformers/models/sew_d/__init__.py
src/transformers/models/sew_d/configuration_sew_d.py
src/transformers/models/sew_d/convert_sew_d_original_pytorch_checkpoint_to_pytorch.py
src/transformers/models/sew_d/modeling_sew_d.py
src/transformers/models/speech_encoder_decoder/__init__.py
src/transformers/models/speech_encoder_decoder/configuration_speech_encoder_decoder.py
src/transformers/models/speech_encoder_decoder/convert_mbart_wav2vec2_seq2seq_original_to_pytorch.py
src/transformers/models/speech_encoder_decoder/convert_speech_to_text_wav2vec2_seq2seq_original_to_pytorch.py
src/transformers/models/speech_encoder_decoder/modeling_speech_encoder_decoder.py
src/transformers/models/speech_to_text/__init__.py
src/transformers/models/speech_to_text/configuration_speech_to_text.py
src/transformers/models/speech_to_text/convert_s2t_fairseq_to_tfms.py
src/transformers/models/speech_to_text/feature_extraction_speech_to_text.py
src/transformers/models/speech_to_text/modeling_speech_to_text.py
src/transformers/models/speech_to_text/processing_speech_to_text.py
src/transformers/models/speech_to_text/tokenization_speech_to_text.py
src/transformers/models/speech_to_text_2/__init__.py
src/transformers/models/speech_to_text_2/configuration_speech_to_text_2.py
src/transformers/models/speech_to_text_2/modeling_speech_to_text_2.py
src/transformers/models/speech_to_text_2/processing_speech_to_text_2.py
src/transformers/models/speech_to_text_2/tokenization_speech_to_text_2.py
src/transformers/models/splinter/__init__.py
src/transformers/models/splinter/configuration_splinter.py
src/transformers/models/splinter/modeling_splinter.py
src/transformers/models/splinter/tokenization_splinter.py
src/transformers/models/splinter/tokenization_splinter_fast.py
src/transformers/models/squeezebert/__init__.py
src/transformers/models/squeezebert/configuration_squeezebert.py
src/transformers/models/squeezebert/modeling_squeezebert.py
src/transformers/models/squeezebert/tokenization_squeezebert.py
src/transformers/models/squeezebert/tokenization_squeezebert_fast.py
src/transformers/models/t5/__init__.py
src/transformers/models/t5/configuration_t5.py
src/transformers/models/t5/convert_t5_original_tf_checkpoint_to_pytorch.py
src/transformers/models/t5/modeling_flax_t5.py
src/transformers/models/t5/modeling_t5.py
src/transformers/models/t5/modeling_tf_t5.py
src/transformers/models/t5/tokenization_t5.py
src/transformers/models/t5/tokenization_t5_fast.py
src/transformers/models/tapas/__init__.py
src/transformers/models/tapas/configuration_tapas.py
src/transformers/models/tapas/convert_tapas_original_tf_checkpoint_to_pytorch.py
src/transformers/models/tapas/modeling_tapas.py
src/transformers/models/tapas/modeling_tf_tapas.py
src/transformers/models/tapas/tokenization_tapas.py
src/transformers/models/transfo_xl/__init__.py
src/transformers/models/transfo_xl/configuration_transfo_xl.py
src/transformers/models/transfo_xl/convert_transfo_xl_original_tf_checkpoint_to_pytorch.py
src/transformers/models/transfo_xl/modeling_tf_transfo_xl.py
src/transformers/models/transfo_xl/modeling_tf_transfo_xl_utilities.py
src/transformers/models/transfo_xl/modeling_transfo_xl.py
src/transformers/models/transfo_xl/modeling_transfo_xl_utilities.py
src/transformers/models/transfo_xl/tokenization_transfo_xl.py
src/transformers/models/trocr/__init__.py
src/transformers/models/trocr/configuration_trocr.py
src/transformers/models/trocr/modeling_trocr.py
src/transformers/models/trocr/processing_trocr.py
src/transformers/models/unispeech/__init__.py
src/transformers/models/unispeech/configuration_unispeech.py
src/transformers/models/unispeech/convert_unispeech_original_pytorch_checkpoint_to_pytorch.py
src/transformers/models/unispeech/modeling_unispeech.py
src/transformers/models/unispeech_sat/__init__.py
src/transformers/models/unispeech_sat/configuration_unispeech_sat.py
src/transformers/models/unispeech_sat/convert_unispeech_sat_original_pytorch_checkpoint_to_pytorch.py
src/transformers/models/unispeech_sat/modeling_unispeech_sat.py
src/transformers/models/vision_encoder_decoder/__init__.py
src/transformers/models/vision_encoder_decoder/configuration_vision_encoder_decoder.py
src/transformers/models/vision_encoder_decoder/convert_trocr_unilm_to_pytorch.py
src/transformers/models/vision_encoder_decoder/modeling_flax_vision_encoder_decoder.py
src/transformers/models/vision_encoder_decoder/modeling_vision_encoder_decoder.py
src/transformers/models/vision_text_dual_encoder/__init__.py
src/transformers/models/vision_text_dual_encoder/configuration_vision_text_dual_encoder.py
src/transformers/models/vision_text_dual_encoder/modeling_flax_vision_text_dual_encoder.py
src/transformers/models/vision_text_dual_encoder/modeling_vision_text_dual_encoder.py
src/transformers/models/vision_text_dual_encoder/processing_vision_text_dual_encoder.py
src/transformers/models/visual_bert/__init__.py
src/transformers/models/visual_bert/configuration_visual_bert.py
src/transformers/models/visual_bert/convert_visual_bert_original_pytorch_checkpoint_to_pytorch.py
src/transformers/models/visual_bert/modeling_visual_bert.py
src/transformers/models/vit/__init__.py
src/transformers/models/vit/configuration_vit.py
src/transformers/models/vit/convert_dino_to_pytorch.py
src/transformers/models/vit/convert_vit_timm_to_pytorch.py
src/transformers/models/vit/feature_extraction_vit.py
src/transformers/models/vit/modeling_flax_vit.py
src/transformers/models/vit/modeling_tf_vit.py
src/transformers/models/vit/modeling_vit.py
src/transformers/models/wav2vec2/__init__.py
src/transformers/models/wav2vec2/configuration_wav2vec2.py
src/transformers/models/wav2vec2/convert_wav2vec2_original_pytorch_checkpoint_to_pytorch.py
src/transformers/models/wav2vec2/convert_wav2vec2_original_s3prl_checkpoint_to_pytorch.py
src/transformers/models/wav2vec2/feature_extraction_wav2vec2.py
src/transformers/models/wav2vec2/modeling_flax_wav2vec2.py
src/transformers/models/wav2vec2/modeling_tf_wav2vec2.py
src/transformers/models/wav2vec2/modeling_wav2vec2.py
src/transformers/models/wav2vec2/processing_wav2vec2.py
src/transformers/models/wav2vec2/tokenization_wav2vec2.py
src/transformers/models/wav2vec2_with_lm/__init__.py
src/transformers/models/wav2vec2_with_lm/processing_wav2vec2_with_lm.py
src/transformers/models/xlm/__init__.py
src/transformers/models/xlm/configuration_xlm.py
src/transformers/models/xlm/convert_xlm_original_pytorch_checkpoint_to_pytorch.py
src/transformers/models/xlm/modeling_tf_xlm.py
src/transformers/models/xlm/modeling_xlm.py
src/transformers/models/xlm/tokenization_xlm.py
src/transformers/models/xlm_prophetnet/__init__.py
src/transformers/models/xlm_prophetnet/configuration_xlm_prophetnet.py
src/transformers/models/xlm_prophetnet/modeling_xlm_prophetnet.py
src/transformers/models/xlm_prophetnet/tokenization_xlm_prophetnet.py
src/transformers/models/xlm_roberta/__init__.py
src/transformers/models/xlm_roberta/configuration_xlm_roberta.py
src/transformers/models/xlm_roberta/modeling_tf_xlm_roberta.py
src/transformers/models/xlm_roberta/modeling_xlm_roberta.py
src/transformers/models/xlm_roberta/tokenization_xlm_roberta.py
src/transformers/models/xlm_roberta/tokenization_xlm_roberta_fast.py
src/transformers/models/xlnet/__init__.py
src/transformers/models/xlnet/configuration_xlnet.py
src/transformers/models/xlnet/convert_xlnet_original_tf_checkpoint_to_pytorch.py
src/transformers/models/xlnet/modeling_tf_xlnet.py
src/transformers/models/xlnet/modeling_xlnet.py
src/transformers/models/xlnet/tokenization_xlnet.py
src/transformers/models/xlnet/tokenization_xlnet_fast.py
src/transformers/onnx/__init__.py
src/transformers/onnx/__main__.py
src/transformers/onnx/config.py
src/transformers/onnx/convert.py
src/transformers/onnx/features.py
src/transformers/onnx/utils.py
src/transformers/pipelines/__init__.py
src/transformers/pipelines/audio_classification.py
src/transformers/pipelines/automatic_speech_recognition.py
src/transformers/pipelines/base.py
src/transformers/pipelines/conversational.py
src/transformers/pipelines/feature_extraction.py
src/transformers/pipelines/fill_mask.py
src/transformers/pipelines/image_classification.py
src/transformers/pipelines/image_segmentation.py
src/transformers/pipelines/object_detection.py
src/transformers/pipelines/question_answering.py
src/transformers/pipelines/table_question_answering.py
src/transformers/pipelines/text2text_generation.py
src/transformers/pipelines/text_classification.py
src/transformers/pipelines/text_generation.py
src/transformers/pipelines/token_classification.py
src/transformers/pipelines/zero_shot_classification.py
src/transformers/sagemaker/__init__.py
src/transformers/sagemaker/trainer_sm.py
src/transformers/sagemaker/training_args_sm.py
src/transformers/utils/__init__.py
src/transformers/utils/dummy_detectron2_objects.py
src/transformers/utils/dummy_flax_objects.py
src/transformers/utils/dummy_pt_objects.py
src/transformers/utils/dummy_pytorch_quantization_and_torch_objects.py
src/transformers/utils/dummy_scatter_objects.py
src/transformers/utils/dummy_sentencepiece_and_speech_objects.py
src/transformers/utils/dummy_sentencepiece_and_tokenizers_objects.py
src/transformers/utils/dummy_sentencepiece_objects.py
src/transformers/utils/dummy_speech_objects.py
src/transformers/utils/dummy_tf_objects.py
src/transformers/utils/dummy_timm_and_vision_objects.py
src/transformers/utils/dummy_timm_objects.py
src/transformers/utils/dummy_tokenizers_objects.py
src/transformers/utils/dummy_vision_objects.py
src/transformers/utils/fx.py
src/transformers/utils/fx_transformations.py
src/transformers/utils/hp_naming.py
src/transformers/utils/logging.py
src/transformers/utils/model_parallel_utils.py
src/transformers/utils/notebook.py
src/transformers/utils/sentencepiece_model_pb2.py
src/transformers/utils/versions.py
templates/adding_a_new_example_script/README.md
templates/adding_a_new_example_script/cookiecutter.json
templates/adding_a_new_example_script/{{cookiecutter.directory_name}}/run_{{cookiecutter.example_shortcut}}.py
templates/adding_a_new_model/ADD_NEW_MODEL_PROPOSAL_TEMPLATE.md
templates/adding_a_new_model/README.md
templates/adding_a_new_model/cookiecutter.json
templates/adding_a_new_model/cookiecutter-template-{{cookiecutter.modelname}}/__init__.py
templates/adding_a_new_model/cookiecutter-template-{{cookiecutter.modelname}}/configuration.json
templates/adding_a_new_model/cookiecutter-template-{{cookiecutter.modelname}}/configuration_{{cookiecutter.lowercase_modelname}}.py
templates/adding_a_new_model/cookiecutter-template-{{cookiecutter.modelname}}/modeling_flax_{{cookiecutter.lowercase_modelname}}.py
templates/adding_a_new_model/cookiecutter-template-{{cookiecutter.modelname}}/modeling_tf_{{cookiecutter.lowercase_modelname}}.py
templates/adding_a_new_model/cookiecutter-template-{{cookiecutter.modelname}}/modeling_{{cookiecutter.lowercase_modelname}}.py
templates/adding_a_new_model/cookiecutter-template-{{cookiecutter.modelname}}/test_modeling_flax_{{cookiecutter.lowercase_modelname}}.py
templates/adding_a_new_model/cookiecutter-template-{{cookiecutter.modelname}}/test_modeling_tf_{{cookiecutter.lowercase_modelname}}.py
templates/adding_a_new_model/cookiecutter-template-{{cookiecutter.modelname}}/test_modeling_{{cookiecutter.lowercase_modelname}}.py
templates/adding_a_new_model/cookiecutter-template-{{cookiecutter.modelname}}/to_replace_{{cookiecutter.lowercase_modelname}}.py
templates/adding_a_new_model/cookiecutter-template-{{cookiecutter.modelname}}/tokenization_fast_{{cookiecutter.lowercase_modelname}}.py
templates/adding_a_new_model/cookiecutter-template-{{cookiecutter.modelname}}/tokenization_{{cookiecutter.lowercase_modelname}}.py
templates/adding_a_new_model/cookiecutter-template-{{cookiecutter.modelname}}/{{cookiecutter.lowercase_modelname}}.rst
templates/adding_a_new_model/open_model_proposals/ADD_BIG_BIRD.md
templates/adding_a_new_model/open_model_proposals/README.md
templates/adding_a_new_model/tests/encoder-bert-tokenizer.json
templates/adding_a_new_model/tests/flax-encoder-bert-tokenizer.json
templates/adding_a_new_model/tests/flax-seq-2-seq-bart-tokenizer.json
templates/adding_a_new_model/tests/pt-encoder-bert-tokenizer.json
templates/adding_a_new_model/tests/pt-seq-2-seq-bart-tokenizer.json
templates/adding_a_new_model/tests/standalone.json
templates/adding_a_new_model/tests/tf-encoder-bert-tokenizer.json
templates/adding_a_new_model/tests/tf-seq-2-seq-bart-tokenizer.json
tests/__init__.py
tests/conftest.py
tests/test_activations.py
tests/test_activations_tf.py
tests/test_benchmark.py
tests/test_benchmark_tf.py
tests/test_cli.py
tests/test_configuration_auto.py
tests/test_configuration_common.py
tests/test_data_collator.py
tests/test_doc_samples.py
tests/test_feature_extraction_auto.py
tests/test_feature_extraction_beit.py
tests/test_feature_extraction_clip.py
tests/test_feature_extraction_common.py
tests/test_feature_extraction_deit.py
tests/test_feature_extraction_detr.py
tests/test_feature_extraction_imagegpt.py
tests/test_feature_extraction_layoutlmv2.py
tests/test_feature_extraction_segformer.py
tests/test_feature_extraction_speech_to_text.py
tests/test_feature_extraction_vit.py
tests/test_feature_extraction_wav2vec2.py
tests/test_file_utils.py
tests/test_flax_auto.py
tests/test_generation_beam_search.py
tests/test_generation_flax_logits_process.py
tests/test_generation_flax_utils.py
tests/test_generation_logits_process.py
tests/test_generation_stopping_criteria.py
tests/test_generation_utils.py
tests/test_hf_argparser.py
tests/test_image_utils.py
tests/test_logging.py
tests/test_model_card.py
tests/test_model_output.py
tests/test_modeling_albert.py
tests/test_modeling_auto.py
tests/test_modeling_bart.py
tests/test_modeling_beit.py
tests/test_modeling_bert.py
tests/test_modeling_bert_generation.py
tests/test_modeling_big_bird.py
tests/test_modeling_bigbird_pegasus.py
tests/test_modeling_blenderbot.py
tests/test_modeling_blenderbot_small.py
tests/test_modeling_bort.py
tests/test_modeling_camembert.py
tests/test_modeling_canine.py
tests/test_modeling_clip.py
tests/test_modeling_common.py
tests/test_modeling_convbert.py
tests/test_modeling_ctrl.py
tests/test_modeling_deberta.py
tests/test_modeling_deberta_v2.py
tests/test_modeling_deit.py
tests/test_modeling_detr.py
tests/test_modeling_distilbert.py
tests/test_modeling_dpr.py
tests/test_modeling_electra.py
tests/test_modeling_encoder_decoder.py
tests/test_modeling_flaubert.py
tests/test_modeling_flax_albert.py
tests/test_modeling_flax_bart.py
tests/test_modeling_flax_beit.py
tests/test_modeling_flax_bert.py
tests/test_modeling_flax_big_bird.py
tests/test_modeling_flax_blenderbot.py
tests/test_modeling_flax_blenderbot_small.py
tests/test_modeling_flax_clip.py
tests/test_modeling_flax_common.py
tests/test_modeling_flax_distilbert.py
tests/test_modeling_flax_electra.py
tests/test_modeling_flax_encoder_decoder.py
tests/test_modeling_flax_gpt2.py
tests/test_modeling_flax_gpt_neo.py
tests/test_modeling_flax_gptj.py
tests/test_modeling_flax_marian.py
tests/test_modeling_flax_mbart.py
tests/test_modeling_flax_mt5.py
tests/test_modeling_flax_pegasus.py
tests/test_modeling_flax_roberta.py
tests/test_modeling_flax_t5.py
tests/test_modeling_flax_vision_encoder_decoder.py
tests/test_modeling_flax_vision_text_dual_encoder.py
tests/test_modeling_flax_vit.py
tests/test_modeling_flax_wav2vec2.py
tests/test_modeling_fnet.py
tests/test_modeling_fsmt.py
tests/test_modeling_funnel.py
tests/test_modeling_gpt2.py
tests/test_modeling_gpt_neo.py
tests/test_modeling_gptj.py
tests/test_modeling_hubert.py
tests/test_modeling_ibert.py
tests/test_modeling_imagegpt.py
tests/test_modeling_layoutlm.py
tests/test_modeling_layoutlmv2.py
tests/test_modeling_led.py
tests/test_modeling_longformer.py
tests/test_modeling_luke.py
tests/test_modeling_lxmert.py
tests/test_modeling_m2m_100.py
tests/test_modeling_marian.py
tests/test_modeling_mbart.py
tests/test_modeling_megatron_bert.py
tests/test_modeling_megatron_gpt2.py
tests/test_modeling_mobilebert.py
tests/test_modeling_mpnet.py
tests/test_modeling_mt5.py
tests/test_modeling_openai.py
tests/test_modeling_pegasus.py
tests/test_modeling_perceiver.py
tests/test_modeling_prophetnet.py
tests/test_modeling_qdqbert.py
tests/test_modeling_rag.py
tests/test_modeling_reformer.py
tests/test_modeling_rembert.py
tests/test_modeling_roberta.py
tests/test_modeling_roformer.py
tests/test_modeling_segformer.py
tests/test_modeling_sew.py
tests/test_modeling_sew_d.py
tests/test_modeling_speech_encoder_decoder.py
tests/test_modeling_speech_to_text.py
tests/test_modeling_speech_to_text_2.py
tests/test_modeling_splinter.py
tests/test_modeling_squeezebert.py
tests/test_modeling_t5.py
tests/test_modeling_tapas.py
tests/test_modeling_tf_albert.py
tests/test_modeling_tf_auto.py
tests/test_modeling_tf_bart.py
tests/test_modeling_tf_bert.py
tests/test_modeling_tf_blenderbot.py
tests/test_modeling_tf_blenderbot_small.py
tests/test_modeling_tf_bort.py
tests/test_modeling_tf_camembert.py
tests/test_modeling_tf_common.py
tests/test_modeling_tf_convbert.py
tests/test_modeling_tf_core.py
tests/test_modeling_tf_ctrl.py
tests/test_modeling_tf_deberta.py
tests/test_modeling_tf_deberta_v2.py
tests/test_modeling_tf_distilbert.py
tests/test_modeling_tf_dpr.py
tests/test_modeling_tf_electra.py
tests/test_modeling_tf_encoder_decoder.py
tests/test_modeling_tf_flaubert.py
tests/test_modeling_tf_funnel.py
tests/test_modeling_tf_gpt2.py
tests/test_modeling_tf_hubert.py
tests/test_modeling_tf_layoutlm.py
tests/test_modeling_tf_led.py
tests/test_modeling_tf_longformer.py
tests/test_modeling_tf_lxmert.py
tests/test_modeling_tf_marian.py
tests/test_modeling_tf_mbart.py
tests/test_modeling_tf_mobilebert.py
tests/test_modeling_tf_mpnet.py
tests/test_modeling_tf_mt5.py
tests/test_modeling_tf_openai.py
tests/test_modeling_tf_pegasus.py
tests/test_modeling_tf_pytorch.py
tests/test_modeling_tf_rag.py
tests/test_modeling_tf_rembert.py
tests/test_modeling_tf_roberta.py
tests/test_modeling_tf_roformer.py
tests/test_modeling_tf_t5.py
tests/test_modeling_tf_tapas.py
tests/test_modeling_tf_transfo_xl.py
tests/test_modeling_tf_vit.py
tests/test_modeling_tf_wav2vec2.py
tests/test_modeling_tf_xlm.py
tests/test_modeling_tf_xlm_roberta.py
tests/test_modeling_tf_xlnet.py
tests/test_modeling_transfo_xl.py
tests/test_modeling_trocr.py
tests/test_modeling_unispeech.py
tests/test_modeling_unispeech_sat.py
tests/test_modeling_vision_encoder_decoder.py
tests/test_modeling_vision_text_dual_encoder.py
tests/test_modeling_visual_bert.py
tests/test_modeling_vit.py
tests/test_modeling_wav2vec2.py
tests/test_modeling_xlm.py
tests/test_modeling_xlm_prophetnet.py
tests/test_modeling_xlm_roberta.py
tests/test_modeling_xlnet.py
tests/test_offline.py
tests/test_onnx.py
tests/test_onnx_v2.py
tests/test_optimization.py
tests/test_optimization_tf.py
tests/test_pipelines_audio_classification.py
tests/test_pipelines_automatic_speech_recognition.py
tests/test_pipelines_common.py
tests/test_pipelines_conversational.py
tests/test_pipelines_feature_extraction.py
tests/test_pipelines_fill_mask.py
tests/test_pipelines_image_classification.py
tests/test_pipelines_image_segmentation.py
tests/test_pipelines_object_detection.py
tests/test_pipelines_question_answering.py
tests/test_pipelines_summarization.py
tests/test_pipelines_table_question_answering.py
tests/test_pipelines_text2text_generation.py
tests/test_pipelines_text_classification.py
tests/test_pipelines_text_generation.py
tests/test_pipelines_token_classification.py
tests/test_pipelines_translation.py
tests/test_pipelines_zero_shot.py
tests/test_processor_auto.py
tests/test_processor_clip.py
tests/test_processor_layoutlmv2.py
tests/test_processor_layoutxlm.py
tests/test_processor_speech_to_text.py
tests/test_processor_vision_text_dual_encoder.py
tests/test_processor_wav2vec2.py
tests/test_processor_wav2vec2_with_lm.py
tests/test_retrieval_rag.py
tests/test_sequence_feature_extraction_common.py
tests/test_skip_decorators.py
tests/test_tokenization_albert.py
tests/test_tokenization_auto.py
tests/test_tokenization_bart.py
tests/test_tokenization_barthez.py
tests/test_tokenization_bartpho.py
tests/test_tokenization_bert.py
tests/test_tokenization_bert_generation.py
tests/test_tokenization_bert_japanese.py
tests/test_tokenization_bertweet.py
tests/test_tokenization_big_bird.py
tests/test_tokenization_blenderbot.py
tests/test_tokenization_byt5.py
tests/test_tokenization_camembert.py
tests/test_tokenization_canine.py
tests/test_tokenization_clip.py
tests/test_tokenization_common.py
tests/test_tokenization_cpm.py
tests/test_tokenization_ctrl.py
tests/test_tokenization_deberta.py
tests/test_tokenization_deberta_v2.py
tests/test_tokenization_distilbert.py
tests/test_tokenization_dpr.py
tests/test_tokenization_fast.py
tests/test_tokenization_fnet.py
tests/test_tokenization_fsmt.py
tests/test_tokenization_funnel.py
tests/test_tokenization_gpt2.py
tests/test_tokenization_herbert.py
tests/test_tokenization_layoutlm.py
tests/test_tokenization_layoutlmv2.py
tests/test_tokenization_layoutxlm.py
tests/test_tokenization_luke.py
tests/test_tokenization_lxmert.py
tests/test_tokenization_m2m_100.py
tests/test_tokenization_marian.py
tests/test_tokenization_mbart.py
tests/test_tokenization_mbart50.py
tests/test_tokenization_mluke.py
tests/test_tokenization_mpnet.py
tests/test_tokenization_openai.py
tests/test_tokenization_pegasus.py
tests/test_tokenization_perceiver.py
tests/test_tokenization_phobert.py
tests/test_tokenization_prophetnet.py
tests/test_tokenization_rag.py
tests/test_tokenization_reformer.py
tests/test_tokenization_roberta.py
tests/test_tokenization_roformer.py
tests/test_tokenization_small_blenderbot.py
tests/test_tokenization_speech_to_text.py
tests/test_tokenization_speech_to_text_2.py
tests/test_tokenization_squeezebert.py
tests/test_tokenization_t5.py
tests/test_tokenization_tapas.py
tests/test_tokenization_transfo_xl.py
tests/test_tokenization_utils.py
tests/test_tokenization_wav2vec2.py
tests/test_tokenization_xlm.py
tests/test_tokenization_xlm_prophetnet.py
tests/test_tokenization_xlm_roberta.py
tests/test_tokenization_xlnet.py
tests/test_trainer.py
tests/test_trainer_callback.py
tests/test_trainer_distributed.py
tests/test_trainer_seq2seq.py
tests/test_trainer_tpu.py
tests/test_trainer_utils.py
tests/test_utils_check_copies.py
tests/test_versions_utils.py
tests/deepspeed/ds_config_zero2.json
tests/deepspeed/ds_config_zero3.json
tests/deepspeed/test_deepspeed.py
tests/deepspeed/test_model_zoo.py
tests/extended/test_trainer_ext.py
tests/fixtures/dummy-config.json
tests/fixtures/dummy_feature_extractor_config.json
tests/fixtures/empty.txt
tests/fixtures/input.txt
tests/fixtures/merges.txt
tests/fixtures/preprocessor_config.json
tests/fixtures/sample_text.txt
tests/fixtures/sample_text_no_unicode.txt
tests/fixtures/spiece.model
tests/fixtures/test_sentencepiece.model
tests/fixtures/test_sentencepiece_bpe.model
tests/fixtures/test_sentencepiece_no_bos.model
tests/fixtures/vocab.json
tests/fixtures/vocab.txt
tests/fixtures/tests_samples/.gitignore
tests/fixtures/tests_samples/COCO/000000039769.png
tests/fixtures/tests_samples/COCO/coco_annotations.txt
tests/fixtures/tests_samples/COCO/coco_panoptic_annotations.txt
tests/fixtures/tests_samples/COCO/coco_panoptic/000000039769.png
tests/fixtures/tests_samples/GermEval/dev.txt
tests/fixtures/tests_samples/GermEval/labels.txt
tests/fixtures/tests_samples/GermEval/train.txt
tests/fixtures/tests_samples/MRPC/dev.csv
tests/fixtures/tests_samples/MRPC/dev.tsv
tests/fixtures/tests_samples/MRPC/train.csv
tests/fixtures/tests_samples/MRPC/train.tsv
tests/fixtures/tests_samples/SQUAD/sample.json
tests/fixtures/tests_samples/STS-B/dev.tsv
tests/fixtures/tests_samples/STS-B/train.tsv
tests/fixtures/tests_samples/conll/sample.json
tests/fixtures/tests_samples/swag/sample.json
tests/fixtures/tests_samples/wiki_text/wiki_00
tests/fixtures/tests_samples/wmt16/sample.json
tests/fixtures/tests_samples/wmt_en_ro/test.json
tests/fixtures/tests_samples/wmt_en_ro/train.json
tests/fixtures/tests_samples/wmt_en_ro/val.json
tests/fixtures/tests_samples/xsum/sample.json
tests/sagemaker/README.md
tests/sagemaker/__init__.py
tests/sagemaker/conftest.py
tests/sagemaker/test_multi_node_data_parallel.py
tests/sagemaker/test_multi_node_model_parallel.py
tests/sagemaker/test_single_node_gpu.py
tests/sagemaker/scripts/pytorch/requirements.txt
tests/sagemaker/scripts/pytorch/run_ddp.py
tests/sagemaker/scripts/pytorch/run_glue_model_parallelism.py
tests/sagemaker/scripts/tensorflow/requirements.txt
tests/sagemaker/scripts/tensorflow/run_tf.py
tests/sagemaker/scripts/tensorflow/run_tf_dist.py
utils/check_copies.py
utils/check_dummies.py
utils/check_inits.py
utils/check_repo.py
utils/check_table.py
utils/check_tf_ops.py
utils/custom_init_isort.py
utils/documentation_tests.txt
utils/download_glue_data.py
utils/get_modified_files.py
utils/notification_service.py
utils/print_env_pt.py
utils/release.py
utils/style_doc.py
utils/tests_fetcher.py
utils/tf_ops/onnx.json