| _app | | | 1,412 items |
| community_integrations | | | 26 items |
| internal | | | 24 items |
| kernel_doc | | | 4 items |
| main_classes | | | 42 items |
| model_doc | | | 884 items |
| _redirects.yml | 128 Bytes | | 03cac062 |
| _toctree.yml | 40.4 kB | | 7190e7de |
| accelerate.html | 30.3 kB | | 3fff0e83 |
| accelerate.md | 6.6 kB | | 1d6de2b4 |
| accelerator_selection.html | 21.1 kB | | ee9fb2c2 |
| accelerator_selection.md | 3.29 kB | | be47a576 |
| add_new_model.html | 136 kB | | 3abd5a82 |
| add_new_model.md | 41.1 kB | | dbbc7724 |
| add_new_pipeline.html | 47.5 kB | | fe79ef8c |
| add_new_pipeline.md | 11 kB | | c8f57afe |
| assisted_decoding.html | 29.6 kB | | cbad63f6 |
| assisted_decoding.md | 7.55 kB | | ec437e5a |
| attention_interface.html | 45.1 kB | | 5d23ddb0 |
| attention_interface.md | 10 kB | | a73a5c69 |
| auto_docstring.html | 44.2 kB | | 9b5a6119 |
| auto_docstring.md | 14.8 kB | | ff25a569 |
| backbones.html | 27.1 kB | | c33570fd |
| backbones.md | 6.15 kB | | 5c87db11 |
| cache_explanation.html | 58.3 kB | | ff345ecb |
| cache_explanation.md | 10 kB | | 01d12136 |
| chat_content_patterns.html | 43.6 kB | | d8ca3705 |
| chat_content_patterns.md | 6.22 kB | | d5f78ca6 |
| chat_extras.html | 42.6 kB | | 94b3470b |
| chat_extras.md | 9.1 kB | | 067f07d0 |
| chat_templating.html | 45.8 kB | | 6c11b85d |
| chat_templating.md | 11.2 kB | | 186deecb |
| chat_templating_multimodal.html | 42.7 kB | | 01ec388c |
| chat_templating_multimodal.md | 10.9 kB | | 8c5c5981 |
| chat_templating_writing.html | 64.6 kB | | cd317b54 |
| chat_templating_writing.md | 13.4 kB | | b596ada3 |
| community.html | 44.5 kB | | 2850cfd4 |
| community.md | 25.9 kB | | 8842cb09 |
| continuous_batching.html | 37.4 kB | | ebf70b27 |
| continuous_batching.md | 8.28 kB | | bae45a3f |
| contributing.html | 89.3 kB | | 0fd5f746 |
| contributing.md | 23.9 kB | | 8654ad23 |
| conversations.html | 28.9 kB | | cbbf9162 |
| conversations.md | 6.74 kB | | 8d5ee927 |
| custom_models.html | 47.7 kB | | 01417292 |
| custom_models.md | 13.6 kB | | 1a41b908 |
| custom_tokenizers.html | 29.9 kB | | b903aada |
| custom_tokenizers.md | 5.86 kB | | 088dad5d |
| data_collators.html | 22.6 kB | | a8475d08 |
| data_collators.md | 4.45 kB | | 6cc9432a |
| debugging.html | 67.4 kB | | 7c2e63fa |
| debugging.md | 15.5 kB | | b4ad91ed |
| deepspeed.html | 159 kB | | dcfa4fcc |
| deepspeed.md | 54.8 kB | | c518e8f7 |
| expert_parallelism.html | 12.9 kB | | 85bb233a |
| expert_parallelism.md | 1.8 kB | | 6b126396 |
| experts_interface.html | 26.1 kB | | e586d139 |
| experts_interface.md | 6.56 kB | | b1ce7e66 |
| fast_tokenizers.html | 58.6 kB | | d940923e |
| fast_tokenizers.md | 12.5 kB | | ab99fd92 |
| favicon.png | 1.57 kB | | 6e06dd7b |
| feature_extractors.html | 41.6 kB | | 6dd6b11f |
| feature_extractors.md | 9.21 kB | | 0c12ede0 |
| fsdp.html | 37.1 kB | | a0ab7420 |
| fsdp.md | 6.77 kB | | 10c24317 |
| generation_features.html | 19.9 kB | | 6522cf2e |
| generation_features.md | 5.17 kB | | dac040fa |
| generation_strategies.html | 67.3 kB | | 60043ab0 |
| generation_strategies.md | 14.5 kB | | 09734b03 |
| gguf.html | 11.9 kB | | e030fd94 |
| gguf.md | 2.08 kB | | 59e79fad |
| glossary.html | 154 kB | | 23c9bfd3 |
| glossary.md | 27.1 kB | | d97c45fc |
| how_to_hack_models.html | 30.9 kB | | 5b1bb7fb |
| how_to_hack_models.md | 7.25 kB | | 0e6c0a7a |
| hpo_train.html | 20.2 kB | | ff1f2aaa |
| hpo_train.md | 6.14 kB | | 7753695d |
| image_processors.html | 43.2 kB | | 8afb194c |
| image_processors.md | 11.9 kB | | ba6c2d06 |
| index.html | 15 kB | | 61ee31d0 |
| index.md | 3.53 kB | | 080f46aa |
| installation.html | 41.7 kB | | 985e2dfe |
| installation.md | 6.31 kB | | f5df8fd6 |
| kv_cache.html | 56.6 kB | | a855a1a1 |
| kv_cache.md | 19.6 kB | | 2773d9de |
| llm_tutorial.html | 63.1 kB | | 4afd141a |
| llm_tutorial.md | 15.8 kB | | c626a487 |
| llm_tutorial_optimization.html | 211 kB | | 23bb3fa3 |
| llm_tutorial_optimization.md | 43.2 kB | | a00e827c |
| llms-full.txt | 24.6 MB | | 1f426557 |
| llms.txt | 57.4 kB | | 743dfc87 |
| model_memory_anatomy.html | 42 kB | | d92075cc |
| model_memory_anatomy.md | 11 kB | | f5dadc84 |
| model_sharing.html | 31.4 kB | | 79033e6a |
| model_sharing.md | 5.86 kB | | 1ff54958 |
| models.html | 48.8 kB | | 2e7fe96f |
| models.md | 12.3 kB | | 66a44b73 |
| models_timeline.html | 7.24 kB | | 944003b4 |
| models_timeline.md | 502 Bytes | | 59a02ee8 |
| modular_transformers.html | 108 kB | | 53b4debd |
|