| _app | | | 498 items |
| internal | | | 9 items |
| main_classes | | | 21 items |
| model_doc | | | 326 items |
| quantization | | | 16 items |
| tasks | | | 30 items |
| _redirects.yml | 128 Bytes | | 03cac062 |
| _toctree.yml | 30.1 kB | | 73e8ada5 |
| accelerate.html | 28.1 kB | | 450ec3b2 |
| add_new_model.html | 140 kB | | 6b456415 |
| add_new_pipeline.html | 41.2 kB | | 2b0ae5c8 |
| agents.html | 74.1 kB | | f42a02b7 |
| agents_advanced.html | 45.7 kB | | 90ff5ec1 |
| attention.html | 24.1 kB | | 264b293e |
| autoclass_tutorial.html | 46.9 kB | | 591b4bb4 |
| bertology.html | 5.97 kB | | d8ac1b3d |
| big_models.html | 43.6 kB | | 502e3417 |
| chat_templating.html | 197 kB | | 9c6169ff |
| community.html | 43.3 kB | | 72e38a53 |
| contributing.html | 72.8 kB | | 9b266f4e |
| conversations.html | 48.5 kB | | 896d0878 |
| create_a_model.html | 98.9 kB | | c97a0fb5 |
| custom_models.html | 58.6 kB | | b0738e7a |
| debugging.html | 84.1 kB | | 11d9c876 |
| deepspeed.html | 154 kB | | 9cfe1942 |
| fast_tokenizers.html | 15.9 kB | | a7892d7f |
| favicon.png | 1.57 kB | | 6e06dd7b |
| fsdp.html | 34.7 kB | | 11b77a69 |
| generation_strategies.html | 106 kB | | a55bdc7b |
| gguf.html | 16.7 kB | | 479adac4 |
| glossary.html | 152 kB | | 3842b778 |
| how_to_hack_models.html | 36.1 kB | | dc34a93b |
| hpo_train.html | 31.5 kB | | 2e85bebe |
| index.html | 64.6 kB | | 777e9676 |
| installation.html | 66.4 kB | | 0930e2f7 |
| kv_cache.html | 88.1 kB | | 61b7a4d7 |
| llm_optims.html | 52 kB | | b8709258 |
| llm_tutorial.html | 57.4 kB | | ba991738 |
| llm_tutorial_optimization.html | 246 kB | | c30e4601 |
| model_memory_anatomy.html | 39.6 kB | | 124f0ce9 |
| model_sharing.html | 65 kB | | bedaa429 |
| model_summary.html | 43.8 kB | | 0cd12770 |
| modular_transformers.html | 124 kB | | 3a5d1600 |
| multilingual.html | 39.4 kB | | 2b9e2833 |
| notebooks.html | 70.2 kB | | 6ad53fb4 |
| objects.inv | 41.6 kB | | 1c671500 |
| pad_truncation.html | 10.6 kB | | 71a7e822 |
| peft.html | 110 kB | | adf18fa6 |
| perf_hardware.html | 25.2 kB | | 984b1d01 |
| perf_infer_cpu.html | 25 kB | | 8b7e2699 |
| perf_infer_gpu_multi.html | 10.9 kB | | 8409b757 |
| perf_infer_gpu_one.html | 86.8 kB | | a15b4695 |
| perf_torch_compile.html | 68.4 kB | | dca47a18 |
| perf_train_cpu.html | 16.4 kB | | 061f77ae |
| perf_train_cpu_many.html | 51.5 kB | | c506524b |
| perf_train_gpu_many.html | 87.2 kB | | c001c934 |
| perf_train_gpu_one.html | 91.4 kB | | 15c6a3bd |
| perf_train_special.html | 10.2 kB | | 1a95c144 |
| perf_train_tpu_tf.html | 40.8 kB | | 4ea9c1d5 |
| performance.html | 12.9 kB | | 3783ce63 |
| perplexity.html | 39.2 kB | | baa8c345 |
| philosophy.html | 11.6 kB | | 61aa0612 |
| pipeline_tutorial.html | 75.6 kB | | 02e8089e |
| pipeline_webserver.html | 25.2 kB | | e3fe4714 |
| pr_checks.html | 44 kB | | fb3aa3b6 |
| preprocessing.html | 129 kB | | 859cd3fc |
| quicktour.html | 162 kB | | 90213f57 |
| run_scripts.html | 68.7 kB | | df2abac4 |
| sagemaker.html | 5.86 kB | | 5d649a44 |
| serialization.html | 42.4 kB | | 0934a889 |
| task_summary.html | 83.6 kB | | cd53e1d2 |
| tasks_explained.html | 60.3 kB | | ee7639e8 |
| testing.html | 250 kB | | ebd57de8 |
| tf_xla.html | 34.7 kB | | f7e2f8a7 |
| tflite.html | 11.8 kB | | 4878e318 |
| tiktoken.html | 14.9 kB | | 67da4187 |
| tokenizer_summary.html | 65.9 kB | | 76cf7717 |
| torchscript.html | 37.8 kB | | 5fd6a9b8 |
| trainer.html | 97.8 kB | | 007e53c9 |
| training.html | 99 kB | | a85cec54 |
| troubleshooting.html | 47 kB | | c66d7538 |