| _app | | | 3,630 items |
| internal | | | 9 items |
| main_classes | | | 21 items |
| model_doc | | | 302 items |
| quantization | | | 13 items |
| tasks | | | 30 items |
| _redirects.yml | 128 Bytes | | 03cac062 |
| _toctree.yml | 28.4 kB | | 38e4f6ea |
| accelerate.html | 28.1 kB | | 00454a67 |
| add_new_model.html | 140 kB | | 6ecc9348 |
| add_new_pipeline.html | 38.3 kB | | e3e91322 |
| agents.html | 74.1 kB | | ab8eb1ff |
| agents_advanced.html | 41.5 kB | | 77c4de32 |
| attention.html | 24.1 kB | | 29da05e3 |
| autoclass_tutorial.html | 46.1 kB | | a326087d |
| benchmarks.html | 65.9 kB | | e81fc645 |
| bertology.html | 5.97 kB | | 8c8a8fc0 |
| big_models.html | 43.6 kB | | 3242dc92 |
| chat_templating.html | 161 kB | | 7d9f82d6 |
| community.html | 43.3 kB | | a5d60ff6 |
| contributing.html | 72.8 kB | | 215a12e4 |
| conversations.html | 48.5 kB | | 3b41c890 |
| create_a_model.html | 98.9 kB | | a0f0a8a9 |
| custom_models.html | 58.6 kB | | e9b44f23 |
| debugging.html | 84.1 kB | | 36b919e8 |
| deepspeed.html | 150 kB | | 0ac665c9 |
| fast_tokenizers.html | 15.9 kB | | ffd20b35 |
| favicon.png | 1.57 kB | | 6e06dd7b |
| fsdp.html | 34.7 kB | | 3e1edbe1 |
| generation_strategies.html | 90 kB | | d308cdcf |
| gguf.html | 16.6 kB | | 28f315a4 |
| glossary.html | 152 kB | | 567c2077 |
| hpo_train.html | 31.5 kB | | e4222d81 |
| index.html | 60.4 kB | | 10c84dd1 |
| installation.html | 56.5 kB | | c4580e83 |
| kv_cache.html | 86.7 kB | | 254d55c2 |
| llm_optims.html | 44.3 kB | | 11426579 |
| llm_tutorial.html | 56.7 kB | | 34cdcde8 |
| llm_tutorial_optimization.html | 246 kB | | e55a1102 |
| model_memory_anatomy.html | 39.6 kB | | 8839193c |
| model_sharing.html | 65 kB | | fcc16450 |
| model_summary.html | 43.8 kB | | b25e7bd0 |
| modular_transformers.html | 21.2 kB | | ad4eda8e |
| multilingual.html | 39.4 kB | | 2fd2c894 |
| notebooks.html | 71.9 kB | | 61e5f302 |
| objects.inv | 40 kB | | b9f8a304 |
| pad_truncation.html | 10.6 kB | | d693b6ec |
| peft.html | 106 kB | | 4b0e7aaa |
| perf_hardware.html | 25.2 kB | | 3c5b909d |
| perf_infer_cpu.html | 24.9 kB | | fa95ee98 |
| perf_infer_gpu_one.html | 79.6 kB | | d0159c5e |
| perf_torch_compile.html | 67.8 kB | | bb05a9b6 |
| perf_train_cpu.html | 16.2 kB | | e2ceae46 |
| perf_train_cpu_many.html | 53.7 kB | | 3bdb835f |
| perf_train_gpu_many.html | 87.2 kB | | c240f7a5 |
| perf_train_gpu_one.html | 91.4 kB | | c531ad3c |
| perf_train_special.html | 10.2 kB | | 6df4768a |
| perf_train_tpu_tf.html | 40.8 kB | | 4977c99a |
| performance.html | 12.9 kB | | 58a004b5 |
| perplexity.html | 38.2 kB | | 74725432 |
| philosophy.html | 11.6 kB | | 2541762d |
| pipeline_tutorial.html | 75.4 kB | | 21651698 |
| pipeline_webserver.html | 25.2 kB | | 945089e5 |
| pr_checks.html | 44 kB | | ecddd170 |
| preprocessing.html | 129 kB | | 7f514ca1 |
| quicktour.html | 156 kB | | cbf948ee |
| run_scripts.html | 68.7 kB | | b6bcd718 |
| sagemaker.html | 5.86 kB | | 5502f3ac |
| serialization.html | 42.4 kB | | efb5f8e4 |
| task_summary.html | 83.6 kB | | b467eb2d |
| tasks_explained.html | 60.3 kB | | c454f5b2 |
| testing.html | 250 kB | | 0a59f3c5 |
| tf_xla.html | 34.7 kB | | 8b5c3a92 |
| tflite.html | 11.8 kB | | b26313b8 |
| tiktoken.html | 9.44 kB | | 102d241d |
| tokenizer_summary.html | 65.9 kB | | aa15daec |
| torchscript.html | 37.8 kB | | 0e1e5679 |
| trainer.html | 93 kB | | bf3b0240 |
| training.html | 98.3 kB | | 69de1a31 |
| troubleshooting.html | 47 kB | | f55aaf74 |