2022-05-16 11:36:41 +00:00
|
|
|
- sections:
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: index
|
|
|
|
|
title: 🤗 Transformers
|
|
|
|
|
- local: quicktour
|
|
|
|
|
title: Quick tour
|
|
|
|
|
- local: installation
|
|
|
|
|
title: Installation
|
|
|
|
|
title: Get started
|
|
|
|
|
- sections:
|
2022-02-02 00:31:35 +00:00
|
|
|
- local: pipeline_tutorial
|
|
|
|
|
title: Pipelines for inference
|
|
|
|
|
- local: autoclass_tutorial
|
|
|
|
|
title: Load pretrained instances with an AutoClass
|
|
|
|
|
- local: preprocessing
|
|
|
|
|
title: Preprocess
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: training
|
2022-03-22 21:14:58 +00:00
|
|
|
title: Fine-tune a pretrained model
|
2022-01-25 19:46:11 +00:00
|
|
|
- local: accelerate
|
|
|
|
|
title: Distributed training with 🤗 Accelerate
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: model_sharing
|
2022-01-29 00:49:26 +00:00
|
|
|
title: Share a model
|
2022-02-02 00:31:35 +00:00
|
|
|
title: Tutorials
|
2021-12-01 19:13:02 +00:00
|
|
|
- sections:
|
2022-03-25 19:51:43 +00:00
|
|
|
- local: fast_tokenizers
|
|
|
|
|
title: "Use tokenizers from 🤗 Tokenizers"
|
2022-02-07 18:34:56 +00:00
|
|
|
- local: create_a_model
|
2022-03-25 19:51:43 +00:00
|
|
|
title: Create a custom architecture
|
|
|
|
|
- local: custom_models
|
|
|
|
|
title: Sharing custom models
|
2022-02-23 19:58:33 +00:00
|
|
|
- sections:
|
|
|
|
|
- local: tasks/sequence_classification
|
|
|
|
|
title: Text classification
|
|
|
|
|
- local: tasks/token_classification
|
|
|
|
|
title: Token classification
|
|
|
|
|
- local: tasks/question_answering
|
|
|
|
|
title: Question answering
|
|
|
|
|
- local: tasks/language_modeling
|
|
|
|
|
title: Language modeling
|
|
|
|
|
- local: tasks/translation
|
|
|
|
|
title: Translation
|
|
|
|
|
- local: tasks/summarization
|
|
|
|
|
title: Summarization
|
|
|
|
|
- local: tasks/multiple_choice
|
|
|
|
|
title: Multiple choice
|
2022-03-11 22:43:49 +00:00
|
|
|
- local: tasks/audio_classification
|
|
|
|
|
title: Audio classification
|
|
|
|
|
- local: tasks/asr
|
|
|
|
|
title: Automatic speech recognition
|
|
|
|
|
- local: tasks/image_classification
|
|
|
|
|
title: Image classification
|
2022-02-23 19:58:33 +00:00
|
|
|
title: Fine-tune for downstream tasks
|
2022-03-07 19:29:14 +00:00
|
|
|
- local: run_scripts
|
|
|
|
|
title: Train with a script
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: sagemaker
|
|
|
|
|
title: Run training on Amazon SageMaker
|
2022-03-25 19:51:43 +00:00
|
|
|
- local: multilingual
|
|
|
|
|
title: Inference for multilingual models
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: converting_tensorflow_models
|
2022-03-25 19:51:43 +00:00
|
|
|
title: Converting TensorFlow Checkpoints
|
|
|
|
|
- local: serialization
|
|
|
|
|
title: Export 🤗 Transformers models
|
|
|
|
|
- local: performance
|
2022-05-16 11:36:41 +00:00
|
|
|
title: Performance and scalability
|
2022-05-03 13:55:10 +00:00
|
|
|
- local: big_models
|
|
|
|
|
title: Instantiating a big model
|
2022-03-25 19:51:43 +00:00
|
|
|
- local: benchmarks
|
|
|
|
|
title: Benchmarks
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: migration
|
|
|
|
|
title: Migrating from previous packages
|
2022-03-25 19:51:43 +00:00
|
|
|
- local: troubleshooting
|
|
|
|
|
title: Troubleshoot
|
|
|
|
|
- local: debugging
|
|
|
|
|
title: Debugging
|
|
|
|
|
- local: notebooks
|
|
|
|
|
title: "🤗 Transformers Notebooks"
|
|
|
|
|
- local: community
|
|
|
|
|
title: Community
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: contributing
|
|
|
|
|
title: How to contribute to transformers?
|
|
|
|
|
- local: add_new_model
|
|
|
|
|
title: "How to add a model to 🤗 Transformers?"
|
|
|
|
|
- local: add_new_pipeline
|
|
|
|
|
title: "How to add a pipeline to 🤗 Transformers?"
|
2022-05-16 11:36:41 +00:00
|
|
|
- local: perf_train_gpu_one
|
|
|
|
|
title: Training on one GPU
|
|
|
|
|
- local: perf_train_gpu_many
|
|
|
|
|
title: Training on many GPUs
|
|
|
|
|
- local: perf_hardware
|
|
|
|
|
title: Custom hardware for training
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: testing
|
|
|
|
|
title: Testing
|
2021-12-13 22:15:19 +00:00
|
|
|
- local: pr_checks
|
|
|
|
|
title: Checks on a Pull Request
|
2022-02-23 19:58:33 +00:00
|
|
|
title: How-to guides
|
2021-12-01 19:13:02 +00:00
|
|
|
- sections:
|
2022-03-25 19:51:43 +00:00
|
|
|
- local: philosophy
|
|
|
|
|
title: Philosophy
|
|
|
|
|
- local: glossary
|
|
|
|
|
title: Glossary
|
|
|
|
|
- local: task_summary
|
|
|
|
|
title: Summary of the tasks
|
|
|
|
|
- local: model_summary
|
|
|
|
|
title: Summary of the models
|
|
|
|
|
- local: tokenizer_summary
|
|
|
|
|
title: Summary of the tokenizers
|
|
|
|
|
- local: pad_truncation
|
|
|
|
|
title: Padding and truncation
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: bertology
|
|
|
|
|
title: BERTology
|
|
|
|
|
- local: perplexity
|
|
|
|
|
title: Perplexity of fixed-length models
|
2022-03-25 19:51:43 +00:00
|
|
|
title: Conceptual guides
|
2021-12-01 19:13:02 +00:00
|
|
|
- sections:
|
|
|
|
|
- sections:
|
|
|
|
|
- local: main_classes/callback
|
|
|
|
|
title: Callbacks
|
|
|
|
|
- local: main_classes/configuration
|
|
|
|
|
title: Configuration
|
|
|
|
|
- local: main_classes/data_collator
|
|
|
|
|
title: Data Collator
|
|
|
|
|
- local: main_classes/keras_callbacks
|
|
|
|
|
title: Keras callbacks
|
|
|
|
|
- local: main_classes/logging
|
|
|
|
|
title: Logging
|
|
|
|
|
- local: main_classes/model
|
|
|
|
|
title: Models
|
2022-03-10 10:54:45 +00:00
|
|
|
- local: main_classes/text_generation
|
|
|
|
|
title: Text Generation
|
2022-01-12 15:33:32 +00:00
|
|
|
- local: main_classes/onnx
|
|
|
|
|
title: ONNX
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: main_classes/optimizer_schedules
|
|
|
|
|
title: Optimization
|
|
|
|
|
- local: main_classes/output
|
|
|
|
|
title: Model outputs
|
|
|
|
|
- local: main_classes/pipelines
|
|
|
|
|
title: Pipelines
|
|
|
|
|
- local: main_classes/processors
|
|
|
|
|
title: Processors
|
|
|
|
|
- local: main_classes/tokenizer
|
|
|
|
|
title: Tokenizer
|
|
|
|
|
- local: main_classes/trainer
|
|
|
|
|
title: Trainer
|
|
|
|
|
- local: main_classes/deepspeed
|
|
|
|
|
title: DeepSpeed Integration
|
|
|
|
|
- local: main_classes/feature_extractor
|
|
|
|
|
title: Feature Extractor
|
|
|
|
|
title: Main Classes
|
|
|
|
|
- sections:
|
|
|
|
|
- local: model_doc/albert
|
|
|
|
|
title: ALBERT
|
|
|
|
|
- local: model_doc/auto
|
|
|
|
|
title: Auto Classes
|
|
|
|
|
- local: model_doc/bart
|
|
|
|
|
title: BART
|
|
|
|
|
- local: model_doc/barthez
|
|
|
|
|
title: BARThez
|
|
|
|
|
- local: model_doc/bartpho
|
|
|
|
|
title: BARTpho
|
|
|
|
|
- local: model_doc/beit
|
|
|
|
|
title: BEiT
|
|
|
|
|
- local: model_doc/bert
|
|
|
|
|
title: BERT
|
|
|
|
|
- local: model_doc/bertweet
|
|
|
|
|
title: Bertweet
|
2022-01-03 10:08:55 +00:00
|
|
|
- local: model_doc/bert-generation
|
2021-12-01 19:13:02 +00:00
|
|
|
title: BertGeneration
|
2022-01-03 10:08:55 +00:00
|
|
|
- local: model_doc/bert-japanese
|
2021-12-01 19:13:02 +00:00
|
|
|
title: BertJapanese
|
2022-01-03 10:08:55 +00:00
|
|
|
- local: model_doc/big_bird
|
2021-12-01 19:13:02 +00:00
|
|
|
title: BigBird
|
|
|
|
|
- local: model_doc/bigbird_pegasus
|
|
|
|
|
title: BigBirdPegasus
|
|
|
|
|
- local: model_doc/blenderbot
|
|
|
|
|
title: Blenderbot
|
2022-01-03 10:08:55 +00:00
|
|
|
- local: model_doc/blenderbot-small
|
2021-12-01 19:13:02 +00:00
|
|
|
title: Blenderbot Small
|
|
|
|
|
- local: model_doc/bort
|
|
|
|
|
title: BORT
|
|
|
|
|
- local: model_doc/byt5
|
|
|
|
|
title: ByT5
|
|
|
|
|
- local: model_doc/camembert
|
|
|
|
|
title: CamemBERT
|
|
|
|
|
- local: model_doc/canine
|
|
|
|
|
title: CANINE
|
2022-02-07 15:11:37 +00:00
|
|
|
- local: model_doc/convnext
|
|
|
|
|
title: ConvNeXT
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: model_doc/clip
|
|
|
|
|
title: CLIP
|
|
|
|
|
- local: model_doc/convbert
|
|
|
|
|
title: ConvBERT
|
|
|
|
|
- local: model_doc/cpm
|
|
|
|
|
title: CPM
|
|
|
|
|
- local: model_doc/ctrl
|
|
|
|
|
title: CTRL
|
2022-03-01 10:09:20 +00:00
|
|
|
- local: model_doc/data2vec
|
|
|
|
|
title: Data2Vec
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: model_doc/deberta
|
|
|
|
|
title: DeBERTa
|
2022-01-03 10:08:55 +00:00
|
|
|
- local: model_doc/deberta-v2
|
2021-12-01 19:13:02 +00:00
|
|
|
title: DeBERTa-v2
|
Decision transformer gym (#15845)
* Created the Decision Transformer Model
* updating tests, copy to other machine
* Added last hidden size to Decision Transformer modelling outputs
* Removed copy of original DT file
* made a temporary change to gpt2 to have it conform with the Decision Transformer version
* Updated tests
* Ignoring a file used to test the DT model
* added comments to config file
* added comments and argument descriptions to decision transformer file
* Updated doc
* Ran "make style"
* Remove old model imports
* Removed unused imports, cleaned up init file
* Update docs/source/model_doc/decision_transformer.mdx
added my username
Co-authored-by: Lysandre Debut <lysandre@huggingface.co>
* Reverted changes made to gpt2
* Removed datasets submodule
* Update the modeling outputs to include gpt2 attentions, hidden states and last hidden states
* Added support for return of hidden states, attentions and return dict of gpt2 model.
* Updated tests to include many of the ModelTesterMixin tests.
The following tests are skipped: test_generate_without_input_ids, test_pruning, test_resize_embeddings, test_head_masking, test_attention_outputs, test_hidden_states_output, test_inputs_embeds, test_model_common_attributes
* Added missing line to the end of gpt2 file
* Added an integration test for the Decision Transformer
Test performs an autoregressive evaluation for two time steps
* Set done and info to _ to fix failing test
* Updated integration test to be deterministic and check expected outputs
* Apply suggestions from code review
Co-authored-by: Sylvain Gugger <35901082+sgugger@users.noreply.github.com>
* Removed unnecessary config options
* Cleaned up commented code and old comments.
* Cleaned up commented code.
* Changed DecisionTransformer to Decision Transformer
* Added Decision Transformer to the main README file
* Added copy of GPT2 called DecisionTransformerGPT2Model
* isorted imports
* isorted imports
* Added model to non-English README files
* Ran make fix-copies and corrected some cases.
* Updated index file to include Decision Transformer
* Added gpt2 model as copy inside the Decision Transformer model file
* Added the unit test file to the list of TEST_FILES_WITH_NO_COMMON_TESTS
* Deleted redundant checkpoint files (I don't know how these got committed)
* Removed testing files. (These should have never been committed)
* Removed accidentally committed files
* Moved the Decision Transformer test to its own directory
* Add type hints for Pegasus (#16324)
* Funnel type hints (#16323)
* add pt funnel type hints
* add tf funnel type hints
* Add type hints for ProphetNet PyTorch (#16272)
* [GLPN] Improve docs (#16331)
* Add link to notebook
* Add link
* Fix bug
Co-authored-by: Niels Rogge <nielsrogge@Nielss-MacBook-Pro.local>
* Added type hints for Pytorch Marian calls (#16200)
* Added type hinting for forward functions in pytorch marian
* typo correction
* Removed type hints on functions from BART per Suraj Patil request
* fix import pb
* fix typo
* corrected tuple call
* ran black
* after fix-copies
Some optional tags on primitives were removed, past_key_values in MarianForCausalLM changed from Tuple of Tuple to List
* Fixing copies to roformer and pegasus
Co-authored-by: Clementine Fourrier <cfourrie@inria.fr>
Co-authored-by: matt <rocketknight1@gmail.com>
* Moved DecisionTransformOutput to modeling_decision_transformer
* Moved the example usage to research project and cleaned comments
* Made tests ignore the copy of gpt2 in Decision Transformer
* Added module output to modelling decision transformer
* removed copied gpt2 model from list of transformers models
* Updated tests and created __init__ file for new test location
* Update README.md
Co-authored-by: Sylvain Gugger <35901082+sgugger@users.noreply.github.com>
* Update src/transformers/models/decision_transformer/configuration_decision_transformer.py
Co-authored-by: Sylvain Gugger <35901082+sgugger@users.noreply.github.com>
* Removed unneeded summary type from config file
* Fixed copies
* Updated pretrained config map to refer to hopper-medium checkpoint
* done (#16340)
* Added Decision transformer to model docs
* Update src/transformers/models/decision_transformer/modeling_decision_transformer.py
Co-authored-by: Sylvain Gugger <35901082+sgugger@users.noreply.github.com>
* Update src/transformers/models/decision_transformer/modeling_decision_transformer.py
Co-authored-by: Sylvain Gugger <35901082+sgugger@users.noreply.github.com>
* Update src/transformers/models/decision_transformer/configuration_decision_transformer.py
Co-authored-by: Sylvain Gugger <35901082+sgugger@users.noreply.github.com>
* Add type annotations for Rembert/Splinter and copies (#16338)
* undo black autoformat
* minor fix to rembert forward with default
* make fix-copies, make quality
* Adding types to template model
* Removing List from the template types
* Remove `Optional` from a couple of types that don't accept `None`
Co-authored-by: matt <rocketknight1@gmail.com>
* [Bug template] Shift responsibilities for long-range (#16344)
* Fix code repetition in serialization guide (#16346)
* Adopt framework-specific blocks for content (#16342)
* ✨ refactor code samples with framework-specific blocks
* ✨ update training.mdx
* 🖍 apply feedback
* Updates the default branch from master to main (#16326)
* Updates the default branch from master to main
* Links from `master` to `main`
* Typo
* Update examples/flax/README.md
Co-authored-by: Sylvain Gugger <35901082+sgugger@users.noreply.github.com>
Co-authored-by: Sylvain Gugger <35901082+sgugger@users.noreply.github.com>
* Updated model with custom docstring example
* Created the Decision Transformer Model
* updating tests, copy to other machine
* Added last hidden size to Decision Transformer modelling outputs
* Removed copy of original DT file
* made a temporary change to gpt2 to have it conform with the Decision Transformer version
* Updated tests
* Ignoring a file used to test the DT model
* added comments to config file
* added comments and argument descriptions to decision transformer file
* Updated doc
* Ran "make style"
* Remove old model imports
* Removed unused imports, cleaned up init file
* Update docs/source/model_doc/decision_transformer.mdx
added my username
Co-authored-by: Lysandre Debut <lysandre@huggingface.co>
* Reverted changes made to gpt2
* Removed datasets submodule
* Update the modeling outputs to include gpt2 attentions, hidden states and last hidden states
* Added support for return of hidden states, attentions and return dict of gpt2 model.
* Updated tests to include many of the ModelTesterMixin tests.
The following tests are skipped: test_generate_without_input_ids, test_pruning, test_resize_embeddings, test_head_masking, test_attention_outputs, test_hidden_states_output, test_inputs_embeds, test_model_common_attributes
* Added missing line to the end of gpt2 file
* Added an integration test for the Decision Transformer
Test performs an autoregressive evaluation for two time steps
* Set done and info to _ to fix failing test
* Updated integration test to be deterministic and check expected outputs
* Apply suggestions from code review
Co-authored-by: Sylvain Gugger <35901082+sgugger@users.noreply.github.com>
* Removed unnecessary config options
* Cleaned up commented code and old comments.
* Cleaned up commented code.
* Changed DecisionTransformer to Decision Transformer
* Added Decision Transformer to the main README file
* Added copy of GPT2 called DecisionTransformerGPT2Model
* isorted imports
* isorted imports
* Added model to non-English README files
* Ran make fix-copies and corrected some cases.
* Updated index file to include Decision Transformer
* Added gpt2 model as copy inside the Decision Transformer model file
* Added the unit test file to the list of TEST_FILES_WITH_NO_COMMON_TESTS
* Deleted redundant checkpoint files (I don't know how these got committed)
* Removed testing files. (These should have never been committed)
* Removed accidentally committed files
* Moved the Decision Transformer test to its own directory
* Moved DecisionTransformOutput to modeling_decision_transformer
* Moved the example usage to research project and cleaned comments
* Made tests ignore the copy of gpt2 in Decision Transformer
* Added module output to modelling decision transformer
* removed copied gpt2 model from list of transformers models
* Updated tests and created __init__ file for new test location
* Update README.md
Co-authored-by: Sylvain Gugger <35901082+sgugger@users.noreply.github.com>
* Update src/transformers/models/decision_transformer/configuration_decision_transformer.py
Co-authored-by: Sylvain Gugger <35901082+sgugger@users.noreply.github.com>
* Removed unneeded summary type from config file
* Fixed copies
* Updated pretrained config map to refer to hopper-medium checkpoint
* Added Decision transformer to model docs
* Update src/transformers/models/decision_transformer/modeling_decision_transformer.py
Co-authored-by: Sylvain Gugger <35901082+sgugger@users.noreply.github.com>
* Update src/transformers/models/decision_transformer/modeling_decision_transformer.py
Co-authored-by: Sylvain Gugger <35901082+sgugger@users.noreply.github.com>
* Update src/transformers/models/decision_transformer/configuration_decision_transformer.py
Co-authored-by: Sylvain Gugger <35901082+sgugger@users.noreply.github.com>
* Updated model with custom docstring example
* Updated copies, config auto, and readme files.
Co-authored-by: Lysandre Debut <lysandre@huggingface.co>
Co-authored-by: Sylvain Gugger <35901082+sgugger@users.noreply.github.com>
Co-authored-by: Dan Tegzes <48134725+Tegzes@users.noreply.github.com>
Co-authored-by: Adam Montgomerie <adam@avanssion.com>
Co-authored-by: NielsRogge <48327001+NielsRogge@users.noreply.github.com>
Co-authored-by: Niels Rogge <nielsrogge@Nielss-MacBook-Pro.local>
Co-authored-by: Clémentine Fourrier <22726840+clefourrier@users.noreply.github.com>
Co-authored-by: Clementine Fourrier <cfourrie@inria.fr>
Co-authored-by: matt <rocketknight1@gmail.com>
Co-authored-by: Francesco Saverio Zuppichini <francesco.zuppichini@gmail.com>
Co-authored-by: Jacob Dineen <54680234+jacobdineen@users.noreply.github.com>
Co-authored-by: Patrick von Platen <patrick.v.platen@gmail.com>
Co-authored-by: Omar Sanseviero <osanseviero@gmail.com>
Co-authored-by: Steven Liu <59462357+stevhliu@users.noreply.github.com>
Co-authored-by: Lysandre Debut <lysandre.debut@reseau.eseo.fr>
2022-03-23 20:18:43 +00:00
|
|
|
- local: model_doc/decision_transformer
|
|
|
|
|
title: Decision Transformer
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: model_doc/deit
|
|
|
|
|
title: DeiT
|
|
|
|
|
- local: model_doc/detr
|
|
|
|
|
title: DETR
|
|
|
|
|
- local: model_doc/dialogpt
|
|
|
|
|
title: DialoGPT
|
|
|
|
|
- local: model_doc/distilbert
|
|
|
|
|
title: DistilBERT
|
2022-03-10 10:34:44 +00:00
|
|
|
- local: model_doc/dit
|
|
|
|
|
title: DiT
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: model_doc/dpr
|
|
|
|
|
title: DPR
|
2022-03-28 14:28:10 +00:00
|
|
|
- local: model_doc/dpt
|
|
|
|
|
title: DPT
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: model_doc/electra
|
|
|
|
|
title: ELECTRA
|
2022-01-03 10:08:55 +00:00
|
|
|
- local: model_doc/encoder-decoder
|
2021-12-01 19:13:02 +00:00
|
|
|
title: Encoder Decoder Models
|
|
|
|
|
- local: model_doc/flaubert
|
|
|
|
|
title: FlauBERT
|
2022-05-11 21:56:48 +00:00
|
|
|
- local: model_doc/flava
|
|
|
|
|
title: FLAVA
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: model_doc/fnet
|
2021-12-09 14:25:31 +00:00
|
|
|
title: FNet
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: model_doc/fsmt
|
|
|
|
|
title: FSMT
|
|
|
|
|
- local: model_doc/funnel
|
|
|
|
|
title: Funnel Transformer
|
2022-03-22 07:51:13 +00:00
|
|
|
- local: model_doc/glpn
|
|
|
|
|
title: GLPN
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: model_doc/herbert
|
2022-01-03 10:08:55 +00:00
|
|
|
title: HerBERT
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: model_doc/ibert
|
|
|
|
|
title: I-BERT
|
|
|
|
|
- local: model_doc/imagegpt
|
|
|
|
|
title: ImageGPT
|
|
|
|
|
- local: model_doc/layoutlm
|
|
|
|
|
title: LayoutLM
|
|
|
|
|
- local: model_doc/layoutlmv2
|
|
|
|
|
title: LayoutLMV2
|
|
|
|
|
- local: model_doc/layoutxlm
|
|
|
|
|
title: LayoutXLM
|
|
|
|
|
- local: model_doc/led
|
|
|
|
|
title: LED
|
|
|
|
|
- local: model_doc/longformer
|
|
|
|
|
title: Longformer
|
|
|
|
|
- local: model_doc/luke
|
|
|
|
|
title: LUKE
|
|
|
|
|
- local: model_doc/lxmert
|
|
|
|
|
title: LXMERT
|
|
|
|
|
- local: model_doc/marian
|
|
|
|
|
title: MarianMT
|
2022-03-02 14:48:20 +00:00
|
|
|
- local: model_doc/maskformer
|
|
|
|
|
title: MaskFormer
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: model_doc/m2m_100
|
|
|
|
|
title: M2M100
|
|
|
|
|
- local: model_doc/mbart
|
|
|
|
|
title: MBart and MBart-50
|
2022-01-03 10:08:55 +00:00
|
|
|
- local: model_doc/megatron-bert
|
2021-12-01 19:13:02 +00:00
|
|
|
title: MegatronBERT
|
|
|
|
|
- local: model_doc/megatron_gpt2
|
|
|
|
|
title: MegatronGPT2
|
2021-12-22 11:35:59 +00:00
|
|
|
- local: model_doc/mluke
|
2022-03-29 15:34:30 +00:00
|
|
|
title: mLUKE
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: model_doc/mobilebert
|
|
|
|
|
title: MobileBERT
|
|
|
|
|
- local: model_doc/mpnet
|
|
|
|
|
title: MPNet
|
|
|
|
|
- local: model_doc/mt5
|
|
|
|
|
title: MT5
|
2022-01-11 13:25:49 +00:00
|
|
|
- local: model_doc/nystromformer
|
|
|
|
|
title: Nyströmformer
|
2022-01-03 10:08:55 +00:00
|
|
|
- local: model_doc/openai-gpt
|
2021-12-01 19:13:02 +00:00
|
|
|
title: OpenAI GPT
|
2022-05-12 10:24:35 +00:00
|
|
|
- local: model_doc/opt
|
|
|
|
|
title: OPT
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: model_doc/gpt2
|
|
|
|
|
title: OpenAI GPT2
|
|
|
|
|
- local: model_doc/gptj
|
|
|
|
|
title: GPT-J
|
|
|
|
|
- local: model_doc/gpt_neo
|
|
|
|
|
title: GPT Neo
|
|
|
|
|
- local: model_doc/hubert
|
|
|
|
|
title: Hubert
|
2021-12-08 18:52:31 +00:00
|
|
|
- local: model_doc/perceiver
|
|
|
|
|
title: Perceiver
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: model_doc/pegasus
|
|
|
|
|
title: Pegasus
|
|
|
|
|
- local: model_doc/phobert
|
|
|
|
|
title: PhoBERT
|
2022-02-18 13:17:09 +00:00
|
|
|
- local: model_doc/plbart
|
|
|
|
|
title: PLBart
|
2022-02-17 12:16:37 +00:00
|
|
|
- local: model_doc/poolformer
|
|
|
|
|
title: PoolFormer
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: model_doc/prophetnet
|
|
|
|
|
title: ProphetNet
|
|
|
|
|
- local: model_doc/qdqbert
|
|
|
|
|
title: QDQBert
|
|
|
|
|
- local: model_doc/rag
|
|
|
|
|
title: RAG
|
2022-01-18 12:24:13 +00:00
|
|
|
- local: model_doc/realm
|
|
|
|
|
title: REALM
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: model_doc/reformer
|
|
|
|
|
title: Reformer
|
|
|
|
|
- local: model_doc/rembert
|
|
|
|
|
title: RemBERT
|
2022-04-07 19:58:00 +00:00
|
|
|
- local: model_doc/regnet
|
|
|
|
|
title: RegNet
|
2022-03-14 18:57:55 +00:00
|
|
|
- local: model_doc/resnet
|
|
|
|
|
title: ResNet
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: model_doc/retribert
|
|
|
|
|
title: RetriBERT
|
|
|
|
|
- local: model_doc/roberta
|
|
|
|
|
title: RoBERTa
|
|
|
|
|
- local: model_doc/roformer
|
|
|
|
|
title: RoFormer
|
|
|
|
|
- local: model_doc/segformer
|
|
|
|
|
title: SegFormer
|
|
|
|
|
- local: model_doc/sew
|
|
|
|
|
title: SEW
|
2022-01-03 10:08:55 +00:00
|
|
|
- local: model_doc/sew-d
|
2021-12-01 19:13:02 +00:00
|
|
|
title: SEW-D
|
2022-01-03 10:08:55 +00:00
|
|
|
- local: model_doc/speech-encoder-decoder
|
2021-12-01 19:13:02 +00:00
|
|
|
title: Speech Encoder Decoder Models
|
|
|
|
|
- local: model_doc/speech_to_text
|
|
|
|
|
title: Speech2Text
|
|
|
|
|
- local: model_doc/speech_to_text_2
|
|
|
|
|
title: Speech2Text2
|
|
|
|
|
- local: model_doc/splinter
|
|
|
|
|
title: Splinter
|
|
|
|
|
- local: model_doc/squeezebert
|
|
|
|
|
title: SqueezeBERT
|
2022-01-21 11:10:41 +00:00
|
|
|
- local: model_doc/swin
|
|
|
|
|
title: Swin Transformer
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: model_doc/t5
|
|
|
|
|
title: T5
|
|
|
|
|
- local: model_doc/t5v1.1
|
|
|
|
|
title: T5v1.1
|
|
|
|
|
- local: model_doc/tapas
|
|
|
|
|
title: TAPAS
|
2022-04-08 08:57:51 +00:00
|
|
|
- local: model_doc/tapex
|
|
|
|
|
title: TAPEX
|
2022-05-17 23:07:43 +00:00
|
|
|
- local: model_doc/trajectory_transformer
|
|
|
|
|
title: Trajectory Transformer
|
2022-01-03 10:08:55 +00:00
|
|
|
- local: model_doc/transfo-xl
|
2021-12-01 19:13:02 +00:00
|
|
|
title: Transformer XL
|
|
|
|
|
- local: model_doc/trocr
|
|
|
|
|
title: TrOCR
|
|
|
|
|
- local: model_doc/unispeech
|
|
|
|
|
title: UniSpeech
|
2022-01-03 10:08:55 +00:00
|
|
|
- local: model_doc/unispeech-sat
|
2021-12-01 19:13:02 +00:00
|
|
|
title: UniSpeech-SAT
|
2022-03-15 07:47:12 +00:00
|
|
|
- local: model_doc/van
|
|
|
|
|
title: VAN
|
2022-01-19 18:51:59 +00:00
|
|
|
- local: model_doc/vilt
|
|
|
|
|
title: ViLT
|
2022-01-03 10:08:55 +00:00
|
|
|
- local: model_doc/vision-encoder-decoder
|
2021-12-01 19:13:02 +00:00
|
|
|
title: Vision Encoder Decoder Models
|
2022-01-03 10:08:55 +00:00
|
|
|
- local: model_doc/vision-text-dual-encoder
|
2021-12-13 22:15:19 +00:00
|
|
|
title: Vision Text Dual Encoder
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: model_doc/vit
|
|
|
|
|
title: Vision Transformer (ViT)
|
2022-01-18 15:21:32 +00:00
|
|
|
- local: model_doc/vit_mae
|
|
|
|
|
title: ViTMAE
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: model_doc/visual_bert
|
|
|
|
|
title: VisualBERT
|
|
|
|
|
- local: model_doc/wav2vec2
|
|
|
|
|
title: Wav2Vec2
|
2022-05-16 22:43:16 +00:00
|
|
|
- local: model_doc/wav2vec2-conformer
|
|
|
|
|
title: Wav2Vec2-Conformer
|
2021-12-17 18:56:44 +00:00
|
|
|
- local: model_doc/wav2vec2_phoneme
|
|
|
|
|
title: Wav2Vec2Phoneme
|
2021-12-16 17:57:05 +00:00
|
|
|
- local: model_doc/wavlm
|
|
|
|
|
title: WavLM
|
2022-01-28 17:55:23 +00:00
|
|
|
- local: model_doc/xglm
|
|
|
|
|
title: XGLM
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: model_doc/xlm
|
|
|
|
|
title: XLM
|
2022-01-03 10:08:55 +00:00
|
|
|
- local: model_doc/xlm-prophetnet
|
2021-12-01 19:13:02 +00:00
|
|
|
title: XLM-ProphetNet
|
2022-01-03 10:08:55 +00:00
|
|
|
- local: model_doc/xlm-roberta
|
2021-12-01 19:13:02 +00:00
|
|
|
title: XLM-RoBERTa
|
2022-01-29 12:42:37 +00:00
|
|
|
- local: model_doc/xlm-roberta-xl
|
|
|
|
|
title: XLM-RoBERTa-XL
|
2021-12-01 19:13:02 +00:00
|
|
|
- local: model_doc/xlnet
|
|
|
|
|
title: XLNet
|
|
|
|
|
- local: model_doc/xlsr_wav2vec2
|
|
|
|
|
title: XLSR-Wav2Vec2
|
2021-12-17 18:56:44 +00:00
|
|
|
- local: model_doc/xls_r
|
|
|
|
|
title: XLS-R
|
2022-05-02 16:30:55 +00:00
|
|
|
- local: model_doc/yolos
|
|
|
|
|
title: YOLOS
|
2022-01-26 18:18:29 +00:00
|
|
|
- local: model_doc/yoso
|
|
|
|
|
title: YOSO
|
2021-12-01 19:13:02 +00:00
|
|
|
title: Models
|
|
|
|
|
- sections:
|
|
|
|
|
- local: internal/modeling_utils
|
|
|
|
|
title: Custom Layers and Utilities
|
|
|
|
|
- local: internal/pipelines_utils
|
|
|
|
|
title: Utilities for pipelines
|
|
|
|
|
- local: internal/tokenization_utils
|
|
|
|
|
title: Utilities for Tokenizers
|
|
|
|
|
- local: internal/trainer_utils
|
|
|
|
|
title: Utilities for Trainer
|
|
|
|
|
- local: internal/generation_utils
|
|
|
|
|
title: Utilities for Generation
|
|
|
|
|
- local: internal/file_utils
|
|
|
|
|
title: General Utilities
|
|
|
|
|
title: Internal Helpers
|
|
|
|
|
title: API
|