| _app | | | 480 items |
| internal | | | 9 items |
| main_classes | | | 21 items |
| model_doc | | | 309 items |
| quantization | | | 14 items |
| tasks | | | 30 items |
| _redirects.yml | 128 Bytes | | 03cac062 |
| _toctree.yml | 29.1 kB | | 56b18d60 |
| accelerate.html | 28.1 kB | | 23cf7d09 |
| add_new_model.html | 140 kB | | 7c4e363e |
| add_new_pipeline.html | 38.3 kB | | 15ab204f |
| agents.html | 74.1 kB | | c7d648a6 |
| agents_advanced.html | 45.8 kB | | a4bf9ace |
| attention.html | 24.1 kB | | 863a59b7 |
| autoclass_tutorial.html | 46.9 kB | | ccd89214 |
| benchmarks.html | 65.9 kB | | 30c5c471 |
| bertology.html | 5.97 kB | | b401baff |
| big_models.html | 43.6 kB | | 265d5c71 |
| chat_templating.html | 188 kB | | 3ff1e44e |
| community.html | 43.3 kB | | 1a2e8a26 |
| contributing.html | 72.8 kB | | 91475c93 |
| conversations.html | 48.5 kB | | e35a8faa |
| create_a_model.html | 98.9 kB | | 53b54053 |
| custom_models.html | 58.6 kB | | 3fa3a53a |
| debugging.html | 84.1 kB | | a4ce66dc |
| deepspeed.html | 150 kB | | 8423fd6d |
| fast_tokenizers.html | 15.9 kB | | 8764098a |
| favicon.png | 1.57 kB | | 6e06dd7b |
| fsdp.html | 34.7 kB | | 2f3b2842 |
| generation_strategies.html | 102 kB | | 02aaf98c |
| gguf.html | 16.7 kB | | bd891800 |
| glossary.html | 152 kB | | aab8875c |
| how_to_hack_models.html | 36.1 kB | | 868a72f2 |
| hpo_train.html | 31.5 kB | | 829c0f3b |
| index.html | 61.8 kB | | 67970a55 |
| installation.html | 56.5 kB | | 7b3e9093 |
| kv_cache.html | 86.8 kB | | cf7ef96f |
| llm_optims.html | 52.1 kB | | 3d3638ef |
| llm_tutorial.html | 56.7 kB | | 81a7068d |
| llm_tutorial_optimization.html | 246 kB | | a3532880 |
| model_memory_anatomy.html | 39.6 kB | | 78d26f2f |
| model_sharing.html | 65 kB | | b1896a0e |
| model_summary.html | 43.8 kB | | fab4b9ff |
| modular_transformers.html | 40.5 kB | | f7d35292 |
| multilingual.html | 39.4 kB | | d7cac79a |
| notebooks.html | 71.9 kB | | 105112c5 |
| objects.inv | 40.8 kB | | 6f20491c |
| pad_truncation.html | 10.6 kB | | 90480d7d |
| peft.html | 110 kB | | 2850d838 |
| perf_hardware.html | 25.2 kB | | 31a10cf4 |
| perf_infer_cpu.html | 25 kB | | 267207da |
| perf_infer_gpu_multi.html | 10.9 kB | | 16c2b093 |
| perf_infer_gpu_one.html | 84.1 kB | | 90b87a92 |
| perf_torch_compile.html | 68.4 kB | | 0980d086 |
| perf_train_cpu.html | 16.4 kB | | 4f1a55ff |
| perf_train_cpu_many.html | 51.5 kB | | 151c671a |
| perf_train_gpu_many.html | 87.2 kB | | 3a12e2d6 |
| perf_train_gpu_one.html | 91.4 kB | | 3e9e15fb |
| perf_train_special.html | 10.2 kB | | d9911236 |
| perf_train_tpu_tf.html | 40.8 kB | | de586d9f |
| performance.html | 12.9 kB | | fb8acd97 |
| perplexity.html | 39.2 kB | | f20881c1 |
| philosophy.html | 11.6 kB | | 3d936a3b |
| pipeline_tutorial.html | 75.6 kB | | 75d903bd |
| pipeline_webserver.html | 25.2 kB | | 7be75287 |
| pr_checks.html | 44 kB | | 2aa621db |
| preprocessing.html | 129 kB | | 97b680fb |
| quicktour.html | 157 kB | | 3785f44b |
| run_scripts.html | 68.7 kB | | 0fc4d8d6 |
| sagemaker.html | 5.86 kB | | a33b1d78 |
| serialization.html | 42.4 kB | | c5eb3f95 |
| task_summary.html | 83.6 kB | | e07d0186 |
| tasks_explained.html | 60.3 kB | | f87080e2 |
| testing.html | 250 kB | | b70ac159 |
| tf_xla.html | 34.7 kB | | 31b513bd |
| tflite.html | 11.8 kB | | a94f6346 |
| tiktoken.html | 14.9 kB | | 80c6ec38 |
| tokenizer_summary.html | 65.9 kB | | 1fbb6d73 |
| torchscript.html | 37.8 kB | | f5a0631a |
| trainer.html | 97.8 kB | | dd2ffea6 |
| training.html | 99 kB | | 5f03d438 |
| troubleshooting.html | 47 kB | | 26b14f1d |