- __config
- __redirects
- __toctree
- _accelerate
- _add_new_model
- _add_new_pipeline
- _add_tensorflow_model
- _attention
- _autoclass_tutorial
- _benchmarks
- _bertology
- _big_models
- _chat_templating
- _community
- _contributing
- _create_a_model
- _custom_models
- _custom_tools
- _debugging
- _deepspeed
- _fast_tokenizers
- _fsdp
- _generation_strategies
- _glossary
- _hf_quantizer
- _hpo_train
- _installation
- _llm_tutorial
- _llm_tutorial_optimization
- _model_memory_anatomy
- _model_sharing
- _model_summary
- _multilingual
- _notebooks
- _pad_truncation
- _perf_hardware
- _perf_infer_cpu
- _perf_infer_gpu_one
- _perf_torch_compile
- _perf_train_cpu
- _perf_train_cpu_many
- _perf_train_gpu_many
- _perf_train_gpu_one
- _perf_train_special
- _perf_train_tpu_tf
- _performance
- _perplexity
- _philosophy
- _pipeline_tutorial
- _pipeline_webserver
- _pr_checks
- _preprocessing
- _quantization
- _quicktour
- _run_scripts
- _sagemaker
- _serialization
- _task_summary
- _tasks_explained
- _testing
- _tf_xla
- _tflite
- _tokenizer_summary
- _torchscript
- _trainer
- _training
- _transformers_agents
- _troubleshooting
- internal_audio_utils
- internal_file_utils
- internal_generation_utils
- internal_image_processing_utils
- internal_modeling_utils
- internal_pipelines_utils
- internal_time_series_utils
- internal_tokenization_utils
- internal_trainer_utils
- main_classes_agent
- main_classes_backbones
- main_classes_callback
- main_classes_configuration
- main_classes_data_collator
- main_classes_deepspeed
- main_classes_feature_extractor
- main_classes_image_processor
- main_classes_keras_callbacks
- main_classes_logging
- main_classes_model
- main_classes_onnx
- main_classes_optimizer_schedules
- main_classes_output
- main_classes_pipelines
- main_classes_processors
- main_classes_quantization
- main_classes_text_generation
- main_classes_tokenizer
- main_classes_trainer
- model_doc_albert
- model_doc_align
- model_doc_altclip
- model_doc_audio-spectrogram-transformer
- model_doc_auto
- model_doc_autoformer
- model_doc_bark
- model_doc_bart
- model_doc_barthez
- model_doc_bartpho
- model_doc_beit
- model_doc_bert-generation
- model_doc_bert-japanese
- model_doc_bert
- model_doc_bertweet
- model_doc_big_bird
- model_doc_bigbird_pegasus
- model_doc_biogpt
- model_doc_bit
- model_doc_blenderbot-small
- model_doc_blenderbot
- model_doc_blip-2
- model_doc_blip
- model_doc_bloom
- model_doc_bort
- model_doc_bridgetower
- model_doc_bros
- model_doc_byt5
- model_doc_camembert
- model_doc_canine
- model_doc_chinese_clip
- model_doc_clap
- model_doc_clip
- model_doc_clipseg
- model_doc_clvp
- model_doc_code_llama
- model_doc_codegen
- model_doc_conditional_detr
- model_doc_convbert
- model_doc_convnext
- model_doc_convnextv2
- model_doc_cpm
- model_doc_cpmant
- model_doc_ctrl
- model_doc_cvt
- model_doc_data2vec
- model_doc_deberta-v2
- model_doc_deberta
- model_doc_decision_transformer
- model_doc_deformable_detr
- model_doc_deit
- model_doc_deplot
- model_doc_depth_anything
- model_doc_deta
- model_doc_detr
- model_doc_dialogpt
- model_doc_dinat
- model_doc_dinov2
- model_doc_distilbert
- model_doc_dit
- model_doc_donut
- model_doc_dpr
- model_doc_dpt
- model_doc_efficientformer
- model_doc_efficientnet
- model_doc_electra
- model_doc_encodec
- model_doc_encoder-decoder
- model_doc_ernie
- model_doc_ernie_m
- model_doc_esm
- model_doc_falcon
- model_doc_fastspeech2_conformer
- model_doc_flan-t5
- model_doc_flan-ul2
- model_doc_flaubert
- model_doc_flava
- model_doc_fnet
- model_doc_focalnet
- model_doc_fsmt
- model_doc_funnel
- model_doc_fuyu
- model_doc_git
- model_doc_glpn
- model_doc_gpt-sw3
- model_doc_gpt2
- model_doc_gpt_bigcode
- model_doc_gpt_neo
- model_doc_gpt_neox
- model_doc_gpt_neox_japanese
- model_doc_gptj
- model_doc_gptsan-japanese
- model_doc_graphormer
- model_doc_groupvit
- model_doc_herbert
- model_doc_hubert
- model_doc_ibert
- model_doc_idefics
- model_doc_imagegpt
- model_doc_informer
- model_doc_instructblip
- model_doc_jukebox
- model_doc_kosmos-2
- model_doc_layoutlm
- model_doc_layoutlmv2
- model_doc_layoutlmv3
- model_doc_layoutxlm
- model_doc_led
- model_doc_levit
- model_doc_lilt
- model_doc_llama
- model_doc_llama2
- model_doc_llava
- model_doc_longformer
- model_doc_longt5
- model_doc_luke
- model_doc_lxmert
- model_doc_m2m_100
- model_doc_madlad-400
- model_doc_marian
- model_doc_markuplm
- model_doc_mask2former
- model_doc_maskformer
- model_doc_matcha
- model_doc_mbart
- model_doc_mctct
- model_doc_mega
- model_doc_megatron-bert
- model_doc_megatron_gpt2
- model_doc_mgp-str
- model_doc_mistral
- model_doc_mixtral
- model_doc_mluke
- model_doc_mms
- model_doc_mobilebert
- model_doc_mobilenet_v1
- model_doc_mobilenet_v2
- model_doc_mobilevit
- model_doc_mobilevitv2
- model_doc_mpnet
- model_doc_mpt
- model_doc_mra
- model_doc_mt5
- model_doc_musicgen
- model_doc_mvp
- model_doc_nat
- model_doc_nezha
- model_doc_nllb-moe
- model_doc_nllb
- model_doc_nougat
- model_doc_nystromformer
- model_doc_oneformer
- model_doc_open-llama
- model_doc_openai-gpt
- model_doc_opt
- model_doc_owlv2
- model_doc_owlvit
- model_doc_patchtsmixer
- model_doc_patchtst
- model_doc_pegasus
- model_doc_pegasus_x
- model_doc_perceiver
- model_doc_persimmon
- model_doc_phi
- model_doc_phobert
- model_doc_pix2struct
- model_doc_plbart
- model_doc_poolformer
- model_doc_pop2piano
- model_doc_prophetnet
- model_doc_pvt
- model_doc_qdqbert
- model_doc_qwen2
- model_doc_rag
- model_doc_realm
- model_doc_reformer
- model_doc_regnet
- model_doc_rembert
- model_doc_resnet
- model_doc_retribert
- model_doc_roberta-prelayernorm
- model_doc_roberta
- model_doc_roc_bert
- model_doc_roformer
- model_doc_rwkv
- model_doc_sam
- model_doc_seamless_m4t
- model_doc_seamless_m4t_v2
- model_doc_segformer
- model_doc_sew-d
- model_doc_sew
- model_doc_siglip
- model_doc_speech-encoder-decoder
- model_doc_speech_to_text
- model_doc_speech_to_text_2
- model_doc_speecht5
- model_doc_splinter
- model_doc_squeezebert
- model_doc_stablelm
- model_doc_swiftformer
- model_doc_swin
- model_doc_swin2sr
- model_doc_swinv2
- model_doc_switch_transformers
- model_doc_t5
- model_doc_t5v1.1
- model_doc_table-transformer
- model_doc_tapas
- model_doc_tapex
- model_doc_time_series_transformer
- model_doc_timesformer
- model_doc_trajectory_transformer
- model_doc_transfo-xl
- model_doc_trocr
- model_doc_tvlt
- model_doc_tvp
- model_doc_ul2
- model_doc_umt5
- model_doc_unispeech-sat
- model_doc_unispeech
- model_doc_univnet
- model_doc_upernet
- model_doc_van
- model_doc_videomae
- model_doc_vilt
- model_doc_vipllava
- model_doc_vision-encoder-decoder
- model_doc_vision-text-dual-encoder
- model_doc_visual_bert
- model_doc_vit
- model_doc_vit_hybrid
- model_doc_vit_mae
- model_doc_vit_msn
- model_doc_vitdet
- model_doc_vitmatte
- model_doc_vits
- model_doc_vivit
- model_doc_wav2vec2-bert
- model_doc_wav2vec2-conformer
- model_doc_wav2vec2
- model_doc_wav2vec2_phoneme
- model_doc_wavlm
- model_doc_whisper
- model_doc_xclip
- model_doc_xglm
- model_doc_xlm-prophetnet
- model_doc_xlm-roberta-xl
- model_doc_xlm-roberta
- model_doc_xlm-v
- model_doc_xlm
- model_doc_xlnet
- model_doc_xls_r
- model_doc_xlsr_wav2vec2
- model_doc_xmod
- model_doc_yolos
- model_doc_yoso
- tasks_asr
- tasks_audio_classification
- tasks_document_question_answering
- tasks_idefics
- tasks_image_captioning
- tasks_image_classification
- tasks_image_to_image
- tasks_knowledge_distillation_for_image_classification
- tasks_language_modeling
- tasks_mask_generation
- tasks_masked_language_modeling
- tasks_monocular_depth_estimation
- tasks_multiple_choice
- tasks_object_detection
- tasks_prompting
- tasks_question_answering
- tasks_semantic_segmentation
- tasks_sequence_classification
- tasks_summarization
- tasks_text-to-speech
- tasks_token_classification
- tasks_translation
- tasks_video_classification
- tasks_visual_question_answering
- tasks_zero_shot_image_classification
- tasks_zero_shot_object_detection