Buckets:
| import{s as Lo,o as Do,n as H}from"../chunks/scheduler.3a17fb72.js";import{S as zo,i as Eo,e as d,s as l,c as _,h as Wo,a as p,d as i,b as a,f as D,g as h,j as y,k as z,l as r,m,n as u,t as v,o as M,p as b}from"../chunks/index.093f8863.js";import{C as Po,H as R,E as Ao}from"../chunks/MermaidChart.svelte_svelte_type_style_lang.45526a62.js";import{D as X}from"../chunks/Docstring.38455f04.js";import{C as O}from"../chunks/CodeBlock.36d3c07b.js";import{E as Y}from"../chunks/ExampleCodeBlock.ee705a6f.js";function Zo(C){let n,x="Example:",c,o,g;return o=new O({props:{code:"JTIzJTIwTG9hZCUyMGZyb20lMjBZQU1MJTIwZmlsZSUwQWNvbmZpZyUyMCUzRCUyME1vZGVsQ29uZmlnLmZyb21fcGF0aCglMjJtb2RlbF9jb25maWcueWFtbCUyMiklMEElMEElMjMlMjBMb2FkJTIwZnJvbSUyMGNvbW1hbmQlMjBsaW5lJTIwYXJndW1lbnRzJTBBY29uZmlnJTIwJTNEJTIwTW9kZWxDb25maWcuZnJvbV9hcmdzKCUyMm1vZGVsX25hbWUlM0RtZXRhLWxsYW1hJTJGTGxhbWEtMy4xLThCLUluc3RydWN0JTJDc3lzdGVtX3Byb21wdCUzRCdZb3UlMjBhcmUlMjBhJTIwaGVscGZ1bCUyMGFzc2lzdGFudC4nJTJDZ2VuZXJhdGlvbl9wYXJhbWV0ZXJzJTNEJTdCdGVtcGVyYXR1cmUlM0QwLjclN0QlMjIpJTBBJTBBJTIzJTIwRGlyZWN0JTIwaW5zdGFudGlhdGlvbiUwQWNvbmZpZyUyMCUzRCUyME1vZGVsQ29uZmlnKCUwQSUyMCUyMCUyMCUyMG1vZGVsX25hbWUlM0QlMjJtZXRhLWxsYW1hJTJGTGxhbWEtMy4xLThCLUluc3RydWN0JTIyJTJDJTBBJTIwJTIwJTIwJTIwZ2VuZXJhdGlvbl9wYXJhbWV0ZXJzJTNER2VuZXJhdGlvblBhcmFtZXRlcnModGVtcGVyYXR1cmUlM0QwLjcpJTJDJTBBJTIwJTIwJTIwJTIwc3lzdGVtX3Byb21wdCUzRCUyMllvdSUyMGFyZSUyMGElMjBoZWxwZnVsJTIwYXNzaXN0YW50LiUyMiUwQSk=",highlighted:`<span class="hljs-comment"># Load from YAML file</span> | |
| config = ModelConfig.from_path(<span class="hljs-string">"model_config.yaml"</span>) | |
| <span class="hljs-comment"># Load from command line arguments</span> | |
| config = ModelConfig.from_args(<span class="hljs-string">"model_name=meta-llama/Llama-3.1-8B-Instruct,system_prompt='You are a helpful assistant.',generation_parameters={temperature=0.7}"</span>) | |
| <span class="hljs-comment"># Direct instantiation</span> | |
| config = ModelConfig( | |
| model_name=<span class="hljs-string">"meta-llama/Llama-3.1-8B-Instruct"</span>, | |
| generation_parameters=GenerationParameters(temperature=<span class="hljs-number">0.7</span>), | |
| system_prompt=<span class="hljs-string">"You are a helpful assistant."</span> | |
| )`,wrap:!1}}),{c(){n=d("p"),n.textContent=x,c=l(),_(o.$$.fragment)},l(t){n=p(t,"P",{"data-svelte-h":!0}),y(n)!=="svelte-11lpom8"&&(n.textContent=x),c=a(t),h(o.$$.fragment,t)},m(t,f){m(t,n,f),m(t,c,f),u(o,t,f),g=!0},p:H,i(t){g||(v(o.$$.fragment,t),g=!0)},o(t){M(o.$$.fragment,t),g=!1},d(t){t&&(i(n),i(c)),b(o,t)}}}function Vo(C){let n,x="Example:",c,o,g;return o=new O({props:{code:"Y29uZmlnJTIwJTNEJTIwVHJhbnNmb3JtZXJzTW9kZWxDb25maWcoJTBBJTIwJTIwJTIwJTIwbW9kZWxfbmFtZSUzRCUyMm1ldGEtbGxhbWElMkZMbGFtYS0zLjEtOEItSW5zdHJ1Y3QlMjIlMkMlMEElMjAlMjAlMjAlMjBiYXRjaF9zaXplJTNENCUyQyUwQSUyMCUyMCUyMCUyMGR0eXBlJTNEJTIyZmxvYXQxNiUyMiUyQyUwQSUyMCUyMCUyMCUyMGdlbmVyYXRpb25fcGFyYW1ldGVycyUzREdlbmVyYXRpb25QYXJhbWV0ZXJzKCUwQSUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMHRlbXBlcmF0dXJlJTNEMC43JTJDJTBBJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwbWF4X25ld190b2tlbnMlM0QxMDAlMEElMjAlMjAlMjAlMjApJTBBKQ==",highlighted:`config = TransformersModelConfig( | |
| model_name=<span class="hljs-string">"meta-llama/Llama-3.1-8B-Instruct"</span>, | |
| batch_size=<span class="hljs-number">4</span>, | |
| dtype=<span class="hljs-string">"float16"</span>, | |
| generation_parameters=GenerationParameters( | |
| temperature=<span class="hljs-number">0.7</span>, | |
| max_new_tokens=<span class="hljs-number">100</span> | |
| ) | |
| )`,wrap:!1}}),{c(){n=d("p"),n.textContent=x,c=l(),_(o.$$.fragment)},l(t){n=p(t,"P",{"data-svelte-h":!0}),y(n)!=="svelte-11lpom8"&&(n.textContent=x),c=a(t),h(o.$$.fragment,t)},m(t,f){m(t,n,f),m(t,c,f),u(o,t,f),g=!0},p:H,i(t){g||(v(o.$$.fragment,t),g=!0)},o(t){M(o.$$.fragment,t),g=!1},d(t){t&&(i(n),i(c)),b(o,t)}}}function Bo(C){let n,x="Example:",c,o,g;return o=new O({props:{code:"Y29uZmlnJTIwJTNEJTIwVkxMTU1vZGVsQ29uZmlnKCUwQSUyMCUyMCUyMCUyMG1vZGVsX25hbWUlM0QlMjJtZXRhLWxsYW1hJTJGTGxhbWEtMy4xLThCLUluc3RydWN0JTIyJTJDJTBBJTIwJTIwJTIwJTIwdGVuc29yX3BhcmFsbGVsX3NpemUlM0QyJTJDJTBBJTIwJTIwJTIwJTIwZ3B1X21lbW9yeV91dGlsaXphdGlvbiUzRDAuOCUyQyUwQSUyMCUyMCUyMCUyMG1heF9tb2RlbF9sZW5ndGglM0Q0MDk2JTJDJTBBJTIwJTIwJTIwJTIwZ2VuZXJhdGlvbl9wYXJhbWV0ZXJzJTNER2VuZXJhdGlvblBhcmFtZXRlcnMoJTBBJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwdGVtcGVyYXR1cmUlM0QwLjclMkMlMEElMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjBtYXhfbmV3X3Rva2VucyUzRDEwMCUwQSUyMCUyMCUyMCUyMCklMEEp",highlighted:`config = VLLMModelConfig( | |
| model_name=<span class="hljs-string">"meta-llama/Llama-3.1-8B-Instruct"</span>, | |
| tensor_parallel_size=<span class="hljs-number">2</span>, | |
| gpu_memory_utilization=<span class="hljs-number">0.8</span>, | |
| max_model_length=<span class="hljs-number">4096</span>, | |
| generation_parameters=GenerationParameters( | |
| temperature=<span class="hljs-number">0.7</span>, | |
| max_new_tokens=<span class="hljs-number">100</span> | |
| ) | |
| )`,wrap:!1}}),{c(){n=d("p"),n.textContent=x,c=l(),_(o.$$.fragment)},l(t){n=p(t,"P",{"data-svelte-h":!0}),y(n)!=="svelte-11lpom8"&&(n.textContent=x),c=a(t),h(o.$$.fragment,t)},m(t,f){m(t,n,f),m(t,c,f),u(o,t,f),g=!0},p:H,i(t){g||(v(o.$$.fragment,t),g=!0)},o(t){M(o.$$.fragment,t),g=!1},d(t){t&&(i(n),i(c)),b(o,t)}}}function Ro(C){let n,x="Example:",c,o,g;return o=new O({props:{code:"Y29uZmlnJTIwJTNEJTIwU0dMYW5nTW9kZWxDb25maWcoJTBBJTIwJTIwJTIwJTIwbW9kZWxfbmFtZSUzRCUyMm1ldGEtbGxhbWElMkZMbGFtYS0zLjEtOEItSW5zdHJ1Y3QlMjIlMkMlMEElMjAlMjAlMjAlMjB0cF9zaXplJTNEMiUyQyUwQSUyMCUyMCUyMCUyMGNvbnRleHRfbGVuZ3RoJTNEODE5MiUyQyUwQSUyMCUyMCUyMCUyMGdlbmVyYXRpb25fcGFyYW1ldGVycyUzREdlbmVyYXRpb25QYXJhbWV0ZXJzKCUwQSUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMHRlbXBlcmF0dXJlJTNEMC43JTJDJTBBJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwbWF4X25ld190b2tlbnMlM0QxMDAlMEElMjAlMjAlMjAlMjApJTBBKQ==",highlighted:`config = SGLangModelConfig( | |
| model_name=<span class="hljs-string">"meta-llama/Llama-3.1-8B-Instruct"</span>, | |
| tp_size=<span class="hljs-number">2</span>, | |
| context_length=<span class="hljs-number">8192</span>, | |
| generation_parameters=GenerationParameters( | |
| temperature=<span class="hljs-number">0.7</span>, | |
| max_new_tokens=<span class="hljs-number">100</span> | |
| ) | |
| )`,wrap:!1}}),{c(){n=d("p"),n.textContent=x,c=l(),_(o.$$.fragment)},l(t){n=p(t,"P",{"data-svelte-h":!0}),y(n)!=="svelte-11lpom8"&&(n.textContent=x),c=a(t),h(o.$$.fragment,t)},m(t,f){m(t,n,f),m(t,c,f),u(o,t,f),g=!0},p:H,i(t){g||(v(o.$$.fragment,t),g=!0)},o(t){M(o.$$.fragment,t),g=!1},d(t){t&&(i(n),i(c)),b(o,t)}}}function Xo(C){let n,x="Example:",c,o,g;return o=new O({props:{code:"Y29uZmlnJTIwJTNEJTIwRHVtbXlNb2RlbENvbmZpZyglMEElMjAlMjAlMjAlMjBtb2RlbF9uYW1lJTNEJTIybXlfZHVtbXklMjIlMkMlMEElMjAlMjAlMjAlMjBzZWVkJTNEMTIzJTJDJTBBKQ==",highlighted:`config = DummyModelConfig( | |
| model_name=<span class="hljs-string">"my_dummy"</span>, | |
| seed=<span class="hljs-number">123</span>, | |
| )`,wrap:!1}}),{c(){n=d("p"),n.textContent=x,c=l(),_(o.$$.fragment)},l(t){n=p(t,"P",{"data-svelte-h":!0}),y(n)!=="svelte-11lpom8"&&(n.textContent=x),c=a(t),h(o.$$.fragment,t)},m(t,f){m(t,n,f),m(t,c,f),u(o,t,f),g=!0},p:H,i(t){g||(v(o.$$.fragment,t),g=!0)},o(t){M(o.$$.fragment,t),g=!1},d(t){t&&(i(n),i(c)),b(o,t)}}}function Fo(C){let n,x="Example:",c,o,g;return o=new O({props:{code:"Y29uZmlnJTIwJTNEJTIwSW5mZXJlbmNlUHJvdmlkZXJzTW9kZWxDb25maWcoJTBBJTIwJTIwJTIwJTIwbW9kZWxfbmFtZSUzRCUyMmRlZXBzZWVrLWFpJTJGRGVlcFNlZWstUjEtMDUyOCUyMiUyQyUwQSUyMCUyMCUyMCUyMHByb3ZpZGVyJTNEJTIydG9nZXRoZXIlMjIlMkMlMEElMjAlMjAlMjAlMjBwYXJhbGxlbF9jYWxsc19jb3VudCUzRDUlMkMlMEElMjAlMjAlMjAlMjBnZW5lcmF0aW9uX3BhcmFtZXRlcnMlM0RHZW5lcmF0aW9uUGFyYW1ldGVycyglMEElMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjB0ZW1wZXJhdHVyZSUzRDAuNyUyQyUwQSUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMG1heF9uZXdfdG9rZW5zJTNEMTAwJTBBJTIwJTIwJTIwJTIwKSUwQSk=",highlighted:`config = InferenceProvidersModelConfig( | |
| model_name=<span class="hljs-string">"deepseek-ai/DeepSeek-R1-0528"</span>, | |
| provider=<span class="hljs-string">"together"</span>, | |
| parallel_calls_count=<span class="hljs-number">5</span>, | |
| generation_parameters=GenerationParameters( | |
| temperature=<span class="hljs-number">0.7</span>, | |
| max_new_tokens=<span class="hljs-number">100</span> | |
| ) | |
| )`,wrap:!1}}),{c(){n=d("p"),n.textContent=x,c=l(),_(o.$$.fragment)},l(t){n=p(t,"P",{"data-svelte-h":!0}),y(n)!=="svelte-11lpom8"&&(n.textContent=x),c=a(t),h(o.$$.fragment,t)},m(t,f){m(t,n,f),m(t,c,f),u(o,t,f),g=!0},p:H,i(t){g||(v(o.$$.fragment,t),g=!0)},o(t){M(o.$$.fragment,t),g=!1},d(t){t&&(i(n),i(c)),b(o,t)}}}function So(C){let n,x="Example:",c,o,g;return o=new O({props:{code:"Y29uZmlnJTIwJTNEJTIwSW5mZXJlbmNlRW5kcG9pbnRNb2RlbENvbmZpZyglMEElMjAlMjAlMjAlMjBtb2RlbF9uYW1lJTNEJTIybWljcm9zb2Z0JTJGRGlhbG9HUFQtbWVkaXVtJTIyJTJDJTBBJTIwJTIwJTIwJTIwaW5zdGFuY2VfdHlwZSUzRCUyMm52aWRpYS1hMTAwJTIyJTJDJTBBJTIwJTIwJTIwJTIwaW5zdGFuY2Vfc2l6ZSUzRCUyMngxJTIyJTJDJTBBJTIwJTIwJTIwJTIwdmVuZG9yJTNEJTIyYXdzJTIyJTJDJTBBJTIwJTIwJTIwJTIwcmVnaW9uJTNEJTIydXMtZWFzdC0xJTIyJTJDJTBBJTIwJTIwJTIwJTIwZHR5cGUlM0QlMjJmbG9hdDE2JTIyJTJDJTBBJTIwJTIwJTIwJTIwZ2VuZXJhdGlvbl9wYXJhbWV0ZXJzJTNER2VuZXJhdGlvblBhcmFtZXRlcnMoJTBBJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwdGVtcGVyYXR1cmUlM0QwLjclMkMlMEElMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjBtYXhfbmV3X3Rva2VucyUzRDEwMCUwQSUyMCUyMCUyMCUyMCklMEEp",highlighted:`config = InferenceEndpointModelConfig( | |
| model_name=<span class="hljs-string">"microsoft/DialoGPT-medium"</span>, | |
| instance_type=<span class="hljs-string">"nvidia-a100"</span>, | |
| instance_size=<span class="hljs-string">"x1"</span>, | |
| vendor=<span class="hljs-string">"aws"</span>, | |
| region=<span class="hljs-string">"us-east-1"</span>, | |
| dtype=<span class="hljs-string">"float16"</span>, | |
| generation_parameters=GenerationParameters( | |
| temperature=<span class="hljs-number">0.7</span>, | |
| max_new_tokens=<span class="hljs-number">100</span> | |
| ) | |
| )`,wrap:!1}}),{c(){n=d("p"),n.textContent=x,c=l(),_(o.$$.fragment)},l(t){n=p(t,"P",{"data-svelte-h":!0}),y(n)!=="svelte-11lpom8"&&(n.textContent=x),c=a(t),h(o.$$.fragment,t)},m(t,f){m(t,n,f),m(t,c,f),u(o,t,f),g=!0},p:H,i(t){g||(v(o.$$.fragment,t),g=!0)},o(t){M(o.$$.fragment,t),g=!1},d(t){t&&(i(n),i(c)),b(o,t)}}}function qo(C){let n,x="Example:",c,o,g;return o=new O({props:{code:"Y29uZmlnJTIwJTNEJTIwU2VydmVybGVzc0VuZHBvaW50TW9kZWxDb25maWcoJTBBJTIwJTIwJTIwJTIwbW9kZWxfbmFtZSUzRCUyMm1ldGEtbGxhbWElMkZMbGFtYS0zLjEtOEItSW5zdHJ1Y3QlMjIlMkMlMEElMjAlMjAlMjAlMjBnZW5lcmF0aW9uX3BhcmFtZXRlcnMlM0RHZW5lcmF0aW9uUGFyYW1ldGVycyglMEElMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjB0ZW1wZXJhdHVyZSUzRDAuNyUyQyUwQSUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMG1heF9uZXdfdG9rZW5zJTNEMTAwJTBBJTIwJTIwJTIwJTIwKSUwQSk=",highlighted:`config = ServerlessEndpointModelConfig( | |
| model_name=<span class="hljs-string">"meta-llama/Llama-3.1-8B-Instruct"</span>, | |
| generation_parameters=GenerationParameters( | |
| temperature=<span class="hljs-number">0.7</span>, | |
| max_new_tokens=<span class="hljs-number">100</span> | |
| ) | |
| )`,wrap:!1}}),{c(){n=d("p"),n.textContent=x,c=l(),_(o.$$.fragment)},l(t){n=p(t,"P",{"data-svelte-h":!0}),y(n)!=="svelte-11lpom8"&&(n.textContent=x),c=a(t),h(o.$$.fragment,t)},m(t,f){m(t,n,f),m(t,c,f),u(o,t,f),g=!0},p:H,i(t){g||(v(o.$$.fragment,t),g=!0)},o(t){M(o.$$.fragment,t),g=!1},d(t){t&&(i(n),i(c)),b(o,t)}}}function Qo(C){let n,x="Example:",c,o,g;return o=new O({props:{code:"Y29uZmlnJTIwJTNEJTIwVEdJTW9kZWxDb25maWcoJTBBJTIwJTIwJTIwJTIwaW5mZXJlbmNlX3NlcnZlcl9hZGRyZXNzJTNEJTIyaHR0cCUzQSUyRiUyRmxvY2FsaG9zdCUzQTgwODAlMjIlMkMlMEElMjAlMjAlMjAlMjBpbmZlcmVuY2Vfc2VydmVyX2F1dGglM0QlMjJ5b3VyLWF1dGgtdG9rZW4lMjIlMkMlMEElMjAlMjAlMjAlMjBtb2RlbF9uYW1lJTNEJTIybWV0YS1sbGFtYSUyRkxsYW1hLTMuMS04Qi1JbnN0cnVjdCUyMiUyQyUwQSUyMCUyMCUyMCUyMGdlbmVyYXRpb25fcGFyYW1ldGVycyUzREdlbmVyYXRpb25QYXJhbWV0ZXJzKCUwQSUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMHRlbXBlcmF0dXJlJTNEMC43JTJDJTBBJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwbWF4X25ld190b2tlbnMlM0QxMDAlMEElMjAlMjAlMjAlMjApJTBBKQ==",highlighted:`config = TGIModelConfig( | |
| inference_server_address=<span class="hljs-string">"http://localhost:8080"</span>, | |
| inference_server_auth=<span class="hljs-string">"your-auth-token"</span>, | |
| model_name=<span class="hljs-string">"meta-llama/Llama-3.1-8B-Instruct"</span>, | |
| generation_parameters=GenerationParameters( | |
| temperature=<span class="hljs-number">0.7</span>, | |
| max_new_tokens=<span class="hljs-number">100</span> | |
| ) | |
| )`,wrap:!1}}),{c(){n=d("p"),n.textContent=x,c=l(),_(o.$$.fragment)},l(t){n=p(t,"P",{"data-svelte-h":!0}),y(n)!=="svelte-11lpom8"&&(n.textContent=x),c=a(t),h(o.$$.fragment,t)},m(t,f){m(t,n,f),m(t,c,f),u(o,t,f),g=!0},p:H,i(t){g||(v(o.$$.fragment,t),g=!0)},o(t){M(o.$$.fragment,t),g=!1},d(t){t&&(i(n),i(c)),b(o,t)}}}function Yo(C){let n,x="Example:",c,o,g;return o=new O({props:{code:"Y29uZmlnJTIwJTNEJTIwTGl0ZUxMTU1vZGVsQ29uZmlnKCUwQSUyMCUyMCUyMCUyMG1vZGVsX25hbWUlM0QlMjJncHQtNCUyMiUyQyUwQSUyMCUyMCUyMCUyMHByb3ZpZGVyJTNEJTIyb3BlbmFpJTIyJTJDJTBBJTIwJTIwJTIwJTIwYmFzZV91cmwlM0QlMjJodHRwcyUzQSUyRiUyRmFwaS5vcGVuYWkuY29tJTJGdjElMjIlMkMlMEElMjAlMjAlMjAlMjBjb25jdXJyZW50X3JlcXVlc3RzJTNENSUyQyUwQSUyMCUyMCUyMCUyMGdlbmVyYXRpb25fcGFyYW1ldGVycyUzREdlbmVyYXRpb25QYXJhbWV0ZXJzKCUwQSUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMHRlbXBlcmF0dXJlJTNEMC43JTJDJTBBJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwbWF4X25ld190b2tlbnMlM0QxMDAlMEElMjAlMjAlMjAlMjApJTBBKQ==",highlighted:`config = LiteLLMModelConfig( | |
| model_name=<span class="hljs-string">"gpt-4"</span>, | |
| provider=<span class="hljs-string">"openai"</span>, | |
| base_url=<span class="hljs-string">"https://api.openai.com/v1"</span>, | |
| concurrent_requests=<span class="hljs-number">5</span>, | |
| generation_parameters=GenerationParameters( | |
| temperature=<span class="hljs-number">0.7</span>, | |
| max_new_tokens=<span class="hljs-number">100</span> | |
| ) | |
| )`,wrap:!1}}),{c(){n=d("p"),n.textContent=x,c=l(),_(o.$$.fragment)},l(t){n=p(t,"P",{"data-svelte-h":!0}),y(n)!=="svelte-11lpom8"&&(n.textContent=x),c=a(t),h(o.$$.fragment,t)},m(t,f){m(t,n,f),m(t,c,f),u(o,t,f),g=!0},p:H,i(t){g||(v(o.$$.fragment,t),g=!0)},o(t){M(o.$$.fragment,t),g=!1},d(t){t&&(i(n),i(c)),b(o,t)}}}function Ho(C){let n,x="Example usage:",c,o,g;return o=new O({props:{code:"JTIzJTIwRGVmaW5lJTIwY29uZmlnJTBBY29uZmlnJTIwJTNEJTIwQ3VzdG9tTW9kZWxDb25maWcoJTBBJTIwJTIwJTIwJTIwbW9kZWwlM0QlMjJteS1jdXN0b20tbW9kZWwlMjIlMkMlMEElMjAlMjAlMjAlMjBtb2RlbF9kZWZpbml0aW9uX2ZpbGVfcGF0aCUzRCUyMnBhdGglMkZ0byUyRm15X21vZGVsLnB5JTIyJTBBKSUwQSUwQSUyMyUyMEV4YW1wbGUlMjBjdXN0b20lMjBtb2RlbCUyMGZpbGUlMjAobXlfbW9kZWwucHkpJTNBJTBBZnJvbSUyMGxpZ2h0ZXZhbC5tb2RlbHMuYWJzdHJhY3RfbW9kZWwlMjBpbXBvcnQlMjBMaWdodGV2YWxNb2RlbCUwQSUwQWNsYXNzJTIwTXlDdXN0b21Nb2RlbChMaWdodGV2YWxNb2RlbCklM0ElMEElMjAlMjAlMjAlMjBkZWYlMjBfX2luaXRfXyhzZWxmJTJDJTIwY29uZmlnJTJDJTIwZW52X2NvbmZpZyklM0ElMEElMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjBzdXBlcigpLl9faW5pdF9fKGNvbmZpZyUyQyUyMGVudl9jb25maWcpJTBBJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIzJTIwQ3VzdG9tJTIwaW5pdGlhbGl6YXRpb24uLi4lMEElMEElMjAlMjAlMjAlMjBkZWYlMjBncmVlZHlfdW50aWwoc2VsZiUyQyUyMGRvY3MlM0ElMjBsaXN0JTVCRG9jJTVEKSUyMC0lM0UlMjBsaXN0JTVCTW9kZWxSZXNwb25zZSU1RCUzQSUwQSUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMyUyMEN1c3RvbSUyMGdlbmVyYXRpb24lMjBsb2dpYy4uLiUwQSUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMHBhc3MlMEElMEElMjAlMjAlMjAlMjBkZWYlMjBsb2dsaWtlbGlob29kKHNlbGYlMkMlMjBkb2NzJTNBJTIwbGlzdCU1QkRvYyU1RCklMjAtJTNFJTIwbGlzdCU1Qk1vZGVsUmVzcG9uc2UlNUQlM0ElMEElMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjBwYXNz",highlighted:`<span class="hljs-comment"># Define config</span> | |
| config = CustomModelConfig( | |
| model=<span class="hljs-string">"my-custom-model"</span>, | |
| model_definition_file_path=<span class="hljs-string">"path/to/my_model.py"</span> | |
| ) | |
| <span class="hljs-comment"># Example custom model file (my_model.py):</span> | |
| <span class="hljs-keyword">from</span> lighteval.models.abstract_model <span class="hljs-keyword">import</span> LightevalModel | |
| <span class="hljs-keyword">class</span> <span class="hljs-title class_">MyCustomModel</span>(<span class="hljs-title class_ inherited__">LightevalModel</span>): | |
| <span class="hljs-keyword">def</span> <span class="hljs-title function_">__init__</span>(<span class="hljs-params">self, config, env_config</span>): | |
| <span class="hljs-built_in">super</span>().__init__(config, env_config) | |
| <span class="hljs-comment"># Custom initialization...</span> | |
| <span class="hljs-keyword">def</span> <span class="hljs-title function_">greedy_until</span>(<span class="hljs-params">self, docs: <span class="hljs-built_in">list</span>[Doc]</span>) -> <span class="hljs-built_in">list</span>[ModelResponse]: | |
| <span class="hljs-comment"># Custom generation logic...</span> | |
| <span class="hljs-keyword">pass</span> | |
| <span class="hljs-keyword">def</span> <span class="hljs-title function_">loglikelihood</span>(<span class="hljs-params">self, docs: <span class="hljs-built_in">list</span>[Doc]</span>) -> <span class="hljs-built_in">list</span>[ModelResponse]: | |
| <span class="hljs-keyword">pass</span>`,wrap:!1}}),{c(){n=d("p"),n.textContent=x,c=l(),_(o.$$.fragment)},l(t){n=p(t,"P",{"data-svelte-h":!0}),y(n)!=="svelte-1ni337v"&&(n.textContent=x),c=a(t),h(o.$$.fragment,t)},m(t,f){m(t,n,f),m(t,c,f),u(o,t,f),g=!0},p:H,i(t){g||(v(o.$$.fragment,t),g=!0)},o(t){M(o.$$.fragment,t),g=!1},d(t){t&&(i(n),i(c)),b(o,t)}}}function Oo(C){let n,x,c,o,g,t,f,$t,ge,Qn=`The model configs are used to define the model and its parameters. All the parameters can be | |
| set in the <code>model-args</code> or in the model yaml file (see example | |
| <a href="https://github.com/huggingface/lighteval/blob/main/examples/model_configs/vllm_model_config.yaml" rel="nofollow">here</a>).`,Tt,ce,wt,J,fe,en,Ae,Yn="Base configuration class for all model types in Lighteval.",tn,Ze,Hn=`This is the foundation class that all specific model configurations inherit from. | |
| It provides common functionality for parsing configuration from files and command-line arguments, | |
| as well as shared attributes that are used by all models like generation parameters and system prompts.`,nn,Ve,On=`Methods: | |
| from_path(path: str): | |
| Load configuration from a YAML file. | |
| from_args(args: str): | |
| Parse configuration from a command-line argument string. | |
| _parse_args(args: str): | |
| Static method to parse argument strings into configuration dictionaries.`,on,te,Jt,_e,It,he,kt,I,ue,ln,Be,Kn="Configuration class for HuggingFace Transformers models.",an,Re,eo="This configuration is used to load and configure models from the HuggingFace Transformers library.",sn,ne,rn,Xe,to=`Note: | |
| This configuration supports quantization (4-bit and 8-bit) through the dtype parameter. | |
| When using quantization, ensure you have the required dependencies installed | |
| (bitsandbytes for 4-bit/8-bit quantization).`,Ut,ve,Me,Gt,S,be,mn,Fe,no="Configuration class for delta models (weight difference models).",dn,Se,oo=`This configuration is used to load models that represent the difference between a | |
| fine-tuned model and its base model. The delta weights are added to the base model | |
| during loading to reconstruct the full fine-tuned model.`,jt,ye,Lt,k,xe,pn,qe,lo="Configuration class for VLLM inference engine.",gn,Qe,ao=`This configuration is used to load and configure models using the VLLM inference engine, | |
| which provides high-performance inference for large language models with features like | |
| PagedAttention, continuous batching, and efficient memory management.`,cn,Ye,so='vllm doc: <a href="https://docs.vllm.ai/en/v0.7.1/serving/engine_args.html" rel="nofollow">https://docs.vllm.ai/en/v0.7.1/serving/engine_args.html</a>',fn,oe,Dt,Ce,zt,U,Ne,_n,He,ro="Configuration class for SGLang inference engine.",hn,Oe,io=`This configuration is used to load and configure models using the SGLang inference engine, | |
| which provides high-performance inference.`,un,Ke,mo='sglang doc: <a href="https://docs.sglang.ai/index.html#" rel="nofollow">https://docs.sglang.ai/index.html#</a>',vn,le,Et,$e,Wt,E,Te,Mn,et,po="Configuration class for dummy models used for testing and baselines.",bn,tt,go=`This configuration is used to create dummy models that generate random responses | |
| or baselines for evaluation purposes. Useful for testing evaluation pipelines | |
| without requiring actual model inference.`,yn,ae,Pt,we,At,Je,Zt,$,Ie,xn,nt,co="Configuration class for HuggingFace’s inference providers (like Together AI, Anyscale, etc.).",Cn,ot,fo='inference providers doc: <a href="https://huggingface.co/docs/inference-providers/en/index" rel="nofollow">https://huggingface.co/docs/inference-providers/en/index</a>',Nn,se,$n,lt,_o="Note:",Tn,at,ho="<li>Requires HF API keys to be set in environment variable</li> <li>Different providers have different rate limits and pricing</li>",Vt,ke,Bt,N,Ue,wn,st,uo="Configuration class for HuggingFace Inference Endpoints (dedicated infrastructure).",Jn,rt,vo=`This configuration is used to create and manage dedicated inference endpoints | |
| on HuggingFace’s infrastructure. These endpoints provide dedicated compute | |
| resources and can handle larger batch sizes and higher throughput.`,In,it,Mo=`Methods: | |
| model_post_init(): | |
| Validates configuration and ensures proper parameter combinations. | |
| get_dtype_args(): | |
| Returns environment variables for dtype configuration. | |
| get_custom_env_vars(): | |
| Returns custom environment variables for the endpoint.`,kn,re,Un,mt,bo="Note:",Gn,dt,yo="<li>Creates dedicated infrastructure for model inference</li> <li>Supports various quantization methods and hardware configurations</li> <li>Auto-scaling available for optimal resource utilization</li> <li>Requires HuggingFace Pro subscription for most features</li> <li>Endpoints can take several minutes to start up</li> <li>Billed based on compute usage and duration</li>",Rt,W,Ge,jn,pt,xo="Configuration class for HuggingFace Inference API (inference endpoints).",Ln,gt,Co='<a href="https://huggingface.co/inference-endpoints/dedicated" rel="nofollow">https://huggingface.co/inference-endpoints/dedicated</a>',Dn,ie,Xt,je,Ft,G,Le,zn,ct,No="Configuration class for Text Generation Inference (TGI) backend.",En,ft,$o='doc: <a href="https://huggingface.co/docs/text-generation-inference/en/index" rel="nofollow">https://huggingface.co/docs/text-generation-inference/en/index</a>',Wn,_t,To=`This configuration is used to connect to TGI servers that serve HuggingFace models | |
| using the text-generation-inference library. TGI provides high-performance inference | |
| with features like continuous batching and efficient memory management.`,Pn,me,St,De,qt,j,ze,An,ht,wo="Configuration class for LiteLLM unified API client.",Zn,ut,Jo=`This configuration is used to connect to various LLM providers through the LiteLLM | |
| unified API. LiteLLM provides a consistent interface to multiple providers including | |
| OpenAI, Anthropic, Google, and many others.`,Vn,vt,Io='litellm doc: <a href="https://docs.litellm.ai/docs/" rel="nofollow">https://docs.litellm.ai/docs/</a>',Bn,de,Qt,Ee,Yt,T,We,Rn,Mt,ko="Configuration class for loading custom model implementations in Lighteval.",Xn,bt,Uo=`This config allows users to define and load their own model implementations by specifying | |
| a Python file containing a custom model class that inherits from LightevalModel.`,Fn,yt,Go=`The custom model file should contain exactly one class that inherits from LightevalModel. | |
| This class will be automatically detected and instantiated when loading the model.`,Sn,pe,qn,xt,jo="An example of a custom model can be found in <code>examples/custom_models/google_translate_model.py</code>.",Ht,Pe,Ot,Ct,Kt;return g=new Po({props:{containerStyle:"float: right; margin-left: 10px; display: inline-flex; position: relative; z-index: 10;"}}),f=new R({props:{title:"Model Configs",local:"model-configs",headingTag:"h1"}}),ce=new R({props:{title:"Base model config",local:"lighteval.models.abstract_model.ModelConfig",headingTag:"h3"}}),fe=new X({props:{name:"class lighteval.models.abstract_model.ModelConfig",anchor:"lighteval.models.abstract_model.ModelConfig",parameters:[{name:"model_name",val:": str = None"},{name:"generation_parameters",val:": GenerationParameters = GenerationParameters(num_blocks=None, block_size=None, early_stopping=None, repetition_penalty=None, frequency_penalty=None, length_penalty=None, presence_penalty=None, max_new_tokens=None, min_new_tokens=None, seed=None, stop_tokens=None, temperature=0, top_k=None, min_p=None, top_p=None, truncate_prompt=None, cache_implementation=None, response_format=None)"},{name:"system_prompt",val:": str | None = None"},{name:"cache_dir",val:": str = '~/.cache/huggingface/lighteval'"}],parametersDescription:[{anchor:"lighteval.models.abstract_model.ModelConfig.model_name",description:`<strong>model_name</strong> (str) — | |
| The model name or unique id`,name:"model_name"},{anchor:"lighteval.models.abstract_model.ModelConfig.generation_parameters",description:`<strong>generation_parameters</strong> (GenerationParameters) — | |
| Configuration parameters that control text generation behavior, including | |
| temperature, top_p, max_new_tokens, etc. Defaults to empty GenerationParameters.`,name:"generation_parameters"},{anchor:"lighteval.models.abstract_model.ModelConfig.system_prompt",description:`<strong>system_prompt</strong> (str | None) — | |
| Optional system prompt to be used with chat models. This prompt sets the | |
| behavior and context for the model during evaluation.`,name:"system_prompt"},{anchor:"lighteval.models.abstract_model.ModelConfig.cache_dir",description:`<strong>cache_dir</strong> (str) — | |
| Directory to cache the model. Defaults to ”~/.cache/huggingface/lighteval”.`,name:"cache_dir"}],source:"https://github.com/huggingface/lighteval/blob/vr_1027/src/lighteval/models/abstract_model.py#L41"}}),te=new Y({props:{anchor:"lighteval.models.abstract_model.ModelConfig.example",$$slots:{default:[Zo]},$$scope:{ctx:C}}}),_e=new R({props:{title:"Local Models",local:"local-models",headingTag:"h2"}}),he=new R({props:{title:"Transformers Model",local:"lighteval.models.transformers.transformers_model.TransformersModelConfig",headingTag:"h3"}}),ue=new X({props:{name:"class lighteval.models.transformers.transformers_model.TransformersModelConfig",anchor:"lighteval.models.transformers.transformers_model.TransformersModelConfig",parameters:[{name:"model_name",val:": str"},{name:"generation_parameters",val:": GenerationParameters = GenerationParameters(num_blocks=None, block_size=None, early_stopping=None, repetition_penalty=None, frequency_penalty=None, length_penalty=None, presence_penalty=None, max_new_tokens=None, min_new_tokens=None, seed=None, stop_tokens=None, temperature=0, top_k=None, min_p=None, top_p=None, truncate_prompt=None, cache_implementation=None, response_format=None)"},{name:"system_prompt",val:": str | None = None"},{name:"cache_dir",val:": str = '~/.cache/huggingface/lighteval'"},{name:"tokenizer",val:": str | None = None"},{name:"subfolder",val:": str | None = None"},{name:"revision",val:": str = 'main'"},{name:"batch_size",val:": typing.Optional[typing.Annotated[int, Gt(gt=0)]] = None"},{name:"max_length",val:": typing.Optional[typing.Annotated[int, Gt(gt=0)]] = None"},{name:"model_loading_kwargs",val:": dict = <factory>"},{name:"add_special_tokens",val:": bool = True"},{name:"skip_special_tokens",val:": bool = True"},{name:"model_parallel",val:": bool | None = None"},{name:"dtype",val:": str | None = None"},{name:"device",val:": typing.Union[int, str] = 'cuda'"},{name:"trust_remote_code",val:": bool = False"},{name:"compile",val:": bool = False"},{name:"multichoice_continuations_start_space",val:": bool | None = None"},{name:"pairwise_tokenization",val:": bool = False"},{name:"continuous_batching",val:": bool = False"},{name:"override_chat_template",val:": bool = None"}],parametersDescription:[{anchor:"lighteval.models.transformers.transformers_model.TransformersModelConfig.model_name",description:`<strong>model_name</strong> (str) — | |
| HuggingFace Hub model ID or path to a pre-trained model. This corresponds to the | |
| <code>pretrained_model_name_or_path</code> argument in HuggingFace’s <code>from_pretrained</code> method.`,name:"model_name"},{anchor:"lighteval.models.transformers.transformers_model.TransformersModelConfig.tokenizer",description:`<strong>tokenizer</strong> (str | None) — | |
| Optional HuggingFace Hub tokenizer ID. If not specified, uses the same ID as model_name. | |
| Useful when the tokenizer is different from the model (e.g., for multilingual models).`,name:"tokenizer"},{anchor:"lighteval.models.transformers.transformers_model.TransformersModelConfig.subfolder",description:`<strong>subfolder</strong> (str | None) — | |
| Subfolder within the model repository. Used when models are stored in subdirectories.`,name:"subfolder"},{anchor:"lighteval.models.transformers.transformers_model.TransformersModelConfig.revision",description:`<strong>revision</strong> (str) — | |
| Git revision of the model to load. Defaults to “main”.`,name:"revision"},{anchor:"lighteval.models.transformers.transformers_model.TransformersModelConfig.batch_size",description:`<strong>batch_size</strong> (PositiveInt | None) — | |
| Batch size for model inference. If None, will be automatically determined.`,name:"batch_size"},{anchor:"lighteval.models.transformers.transformers_model.TransformersModelConfig.max_length",description:`<strong>max_length</strong> (PositiveInt | None) — | |
| Maximum sequence length for the model. If None, uses model’s default.`,name:"max_length"},{anchor:"lighteval.models.transformers.transformers_model.TransformersModelConfig.model_loading_kwargs",description:`<strong>model_loading_kwargs</strong> (dict) — | |
| Additional keyword arguments passed to <code>from_pretrained</code>. Defaults to empty dict.`,name:"model_loading_kwargs"},{anchor:"lighteval.models.transformers.transformers_model.TransformersModelConfig.add_special_tokens",description:`<strong>add_special_tokens</strong> (bool) — | |
| Whether to add special tokens during tokenization. Defaults to True.`,name:"add_special_tokens"},{anchor:"lighteval.models.transformers.transformers_model.TransformersModelConfig.skip_special_tokens",description:`<strong>skip_special_tokens</strong> (bool) — | |
| Whether the tokenizer should output special tokens back during generation. Needed for reasoning models. Defaults to True`,name:"skip_special_tokens"},{anchor:"lighteval.models.transformers.transformers_model.TransformersModelConfig.model_parallel",description:`<strong>model_parallel</strong> (bool | None) — | |
| Whether to use model parallelism across multiple GPUs. If None, automatically | |
| determined based on available GPUs and model size.`,name:"model_parallel"},{anchor:"lighteval.models.transformers.transformers_model.TransformersModelConfig.dtype",description:`<strong>dtype</strong> (str | None) — | |
| Data type for model weights. Can be “float16”, “bfloat16”, “float32”, “auto”, “4bit”, “8bit”. | |
| If “auto”, uses the model’s default dtype.`,name:"dtype"},{anchor:"lighteval.models.transformers.transformers_model.TransformersModelConfig.device",description:`<strong>device</strong> (Union[int, str]) — | |
| Device to load the model on. Can be “cuda”, “cpu”, or GPU index. Defaults to “cuda”.`,name:"device"},{anchor:"lighteval.models.transformers.transformers_model.TransformersModelConfig.trust_remote_code",description:`<strong>trust_remote_code</strong> (bool) — | |
| Whether to trust remote code when loading models. Defaults to False.`,name:"trust_remote_code"},{anchor:"lighteval.models.transformers.transformers_model.TransformersModelConfig.compile",description:`<strong>compile</strong> (bool) — | |
| Whether to compile the model using torch.compile for optimization. Defaults to False.`,name:"compile"},{anchor:"lighteval.models.transformers.transformers_model.TransformersModelConfig.multichoice_continuations_start_space",description:`<strong>multichoice_continuations_start_space</strong> (bool | None) — | |
| Whether to add a space before multiple choice continuations. If None, uses model default. | |
| True forces adding space, False removes leading space if present.`,name:"multichoice_continuations_start_space"},{anchor:"lighteval.models.transformers.transformers_model.TransformersModelConfig.pairwise_tokenization",description:`<strong>pairwise_tokenization</strong> (bool) — | |
| Whether to tokenize context and continuation separately or together. Defaults to False.`,name:"pairwise_tokenization"},{anchor:"lighteval.models.transformers.transformers_model.TransformersModelConfig.continuous_batching",description:`<strong>continuous_batching</strong> (bool) — | |
| Whether to use continuous batching for generation. Defaults to False.`,name:"continuous_batching"},{anchor:"lighteval.models.transformers.transformers_model.TransformersModelConfig.override_chat_template",description:`<strong>override_chat_template</strong> (bool) — | |
| If True, we force the model to use a chat template. If alse, we prevent the model from using | |
| a chat template. If None, we use the default (true if present in the tokenizer, false otherwise)`,name:"override_chat_template"},{anchor:"lighteval.models.transformers.transformers_model.TransformersModelConfig.generation_parameters",description:`<strong>generation_parameters</strong> (GenerationParameters, optional, defaults to empty GenerationParameters) — | |
| Configuration parameters that control text generation behavior, including | |
| temperature, top_p, max_new_tokens, etc.`,name:"generation_parameters"},{anchor:"lighteval.models.transformers.transformers_model.TransformersModelConfig.system_prompt",description:`<strong>system_prompt</strong> (str | None, optional, defaults to None) — Optional system prompt to be used with chat models. | |
| This prompt sets the behavior and context for the model during evaluation.`,name:"system_prompt"},{anchor:"lighteval.models.transformers.transformers_model.TransformersModelConfig.cache_dir",description:"<strong>cache_dir</strong> (str, optional, defaults to ”~/.cache/huggingface/lighteval”) — Directory to cache the model.",name:"cache_dir"}],source:"https://github.com/huggingface/lighteval/blob/vr_1027/src/lighteval/models/transformers/transformers_model.py#L73"}}),ne=new Y({props:{anchor:"lighteval.models.transformers.transformers_model.TransformersModelConfig.example",$$slots:{default:[Vo]},$$scope:{ctx:C}}}),Me=new X({props:{name:"class lighteval.models.transformers.adapter_model.requires.<locals>.inner_fn.<locals>.Placeholder",anchor:"lighteval.models.transformers.adapter_model.requires.<locals>.inner_fn.<locals>.Placeholder",parameters:[{name:"*args",val:""},{name:"**kwargs",val:""}],source:"https://github.com/huggingface/lighteval/blob/vr_1027/src/lighteval/models/transformers/adapter_model.py#L43"}}),be=new X({props:{name:"class lighteval.models.transformers.delta_model.DeltaModelConfig",anchor:"lighteval.models.transformers.delta_model.DeltaModelConfig",parameters:[{name:"model_name",val:": str"},{name:"generation_parameters",val:": GenerationParameters = GenerationParameters(num_blocks=None, block_size=None, early_stopping=None, repetition_penalty=None, frequency_penalty=None, length_penalty=None, presence_penalty=None, max_new_tokens=None, min_new_tokens=None, seed=None, stop_tokens=None, temperature=0, top_k=None, min_p=None, top_p=None, truncate_prompt=None, cache_implementation=None, response_format=None)"},{name:"system_prompt",val:": str | None = None"},{name:"cache_dir",val:": str = '~/.cache/huggingface/lighteval'"},{name:"tokenizer",val:": str | None = None"},{name:"subfolder",val:": str | None = None"},{name:"revision",val:": str = 'main'"},{name:"batch_size",val:": typing.Optional[typing.Annotated[int, Gt(gt=0)]] = None"},{name:"max_length",val:": typing.Optional[typing.Annotated[int, Gt(gt=0)]] = None"},{name:"model_loading_kwargs",val:": dict = <factory>"},{name:"add_special_tokens",val:": bool = True"},{name:"skip_special_tokens",val:": bool = True"},{name:"model_parallel",val:": bool | None = None"},{name:"dtype",val:": str | None = None"},{name:"device",val:": typing.Union[int, str] = 'cuda'"},{name:"trust_remote_code",val:": bool = False"},{name:"compile",val:": bool = False"},{name:"multichoice_continuations_start_space",val:": bool | None = None"},{name:"pairwise_tokenization",val:": bool = False"},{name:"continuous_batching",val:": bool = False"},{name:"override_chat_template",val:": bool = None"},{name:"base_model",val:": str"}],parametersDescription:[{anchor:"lighteval.models.transformers.delta_model.DeltaModelConfig.base_model",description:`<strong>base_model</strong> (str) — | |
| HuggingFace Hub model ID or path to the base model. This is the original | |
| pre-trained model that the delta was computed from.`,name:"base_model"}],source:"https://github.com/huggingface/lighteval/blob/vr_1027/src/lighteval/models/transformers/delta_model.py#L38"}}),ye=new R({props:{title:"VLLM Model",local:"lighteval.models.vllm.vllm_model.VLLMModelConfig",headingTag:"h3"}}),xe=new X({props:{name:"class lighteval.models.vllm.vllm_model.VLLMModelConfig",anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig",parameters:[{name:"model_name",val:": str"},{name:"generation_parameters",val:": GenerationParameters = GenerationParameters(num_blocks=None, block_size=None, early_stopping=None, repetition_penalty=None, frequency_penalty=None, length_penalty=None, presence_penalty=None, max_new_tokens=None, min_new_tokens=None, seed=None, stop_tokens=None, temperature=0, top_k=None, min_p=None, top_p=None, truncate_prompt=None, cache_implementation=None, response_format=None)"},{name:"system_prompt",val:": str | None = None"},{name:"cache_dir",val:": str = '~/.cache/huggingface/lighteval'"},{name:"tokenizer",val:": str | None = None"},{name:"revision",val:": str = 'main'"},{name:"dtype",val:": str = 'bfloat16'"},{name:"tensor_parallel_size",val:": typing.Annotated[int, Gt(gt=0)] = 1"},{name:"data_parallel_size",val:": typing.Annotated[int, Gt(gt=0)] = 1"},{name:"pipeline_parallel_size",val:": typing.Annotated[int, Gt(gt=0)] = 1"},{name:"gpu_memory_utilization",val:": typing.Annotated[float, Ge(ge=0)] = 0.9"},{name:"enable_prefix_caching",val:": bool = None"},{name:"max_model_length",val:": typing.Optional[typing.Annotated[int, Gt(gt=0)]] = None"},{name:"quantization",val:": str | None = None"},{name:"load_format",val:": str | None = None"},{name:"swap_space",val:": typing.Annotated[int, Gt(gt=0)] = 4"},{name:"seed",val:": typing.Annotated[int, Ge(ge=0)] = 1234"},{name:"trust_remote_code",val:": bool = False"},{name:"add_special_tokens",val:": bool = True"},{name:"multichoice_continuations_start_space",val:": bool = True"},{name:"pairwise_tokenization",val:": bool = False"},{name:"max_num_seqs",val:": typing.Annotated[int, Gt(gt=0)] = 128"},{name:"max_num_batched_tokens",val:": typing.Annotated[int, Gt(gt=0)] = 2048"},{name:"subfolder",val:": str | None = None"},{name:"is_async",val:": bool = False"},{name:"override_chat_template",val:": bool = None"}],parametersDescription:[{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.model_name",description:`<strong>model_name</strong> (str) — | |
| HuggingFace Hub model ID or path to the model to load.`,name:"model_name"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.tokenizer",description:`<strong>tokenizer</strong> (str | None) — | |
| HuggingFace Hub model ID or path to the tokenizer to load.`,name:"tokenizer"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.revision",description:`<strong>revision</strong> (str) — | |
| Git revision of the model. Defaults to “main”.`,name:"revision"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.dtype",description:`<strong>dtype</strong> (str) — | |
| Data type for model weights. Defaults to “bfloat16”. Options: “float16”, “bfloat16”, “float32”.`,name:"dtype"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.tensor_parallel_size",description:`<strong>tensor_parallel_size</strong> (PositiveInt) — | |
| Number of GPUs to use for tensor parallelism. Defaults to 1.`,name:"tensor_parallel_size"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.data_parallel_size",description:`<strong>data_parallel_size</strong> (PositiveInt) — | |
| Number of GPUs to use for data parallelism. Defaults to 1.`,name:"data_parallel_size"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.pipeline_parallel_size",description:`<strong>pipeline_parallel_size</strong> (PositiveInt) — | |
| Number of GPUs to use for pipeline parallelism. Defaults to 1.`,name:"pipeline_parallel_size"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.gpu_memory_utilization",description:`<strong>gpu_memory_utilization</strong> (NonNegativeFloat) — | |
| Fraction of GPU memory to use. Lower this if running out of memory. Defaults to 0.9.`,name:"gpu_memory_utilization"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.enable_prefix_caching",description:`<strong>enable_prefix_caching</strong> (bool) — | |
| Whether to enable prefix caching to speed up generation. May use more memory. Should be disabled for LFM2. Defaults to True.`,name:"enable_prefix_caching"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.max_model_length",description:`<strong>max_model_length</strong> (PositiveInt | None) — | |
| Maximum sequence length for the model. If None, automatically inferred. | |
| Reduce this if encountering OOM issues (4096 is usually sufficient).`,name:"max_model_length"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.quantization",description:`<strong>quantization</strong> (str | None) — | |
| Quantization method.`,name:"quantization"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.load_format",description:`<strong>load_format</strong> (str | None) — | |
| The format of the model weights to load. choices: auto, pt, safetensors, npcache, dummy, tensorizer, sharded_state, gguf, bitsandbytes, mistral, runai_streamer.`,name:"load_format"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.swap_space",description:`<strong>swap_space</strong> (PositiveInt) — | |
| CPU swap space size in GiB per GPU. Defaults to 4.`,name:"swap_space"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.seed",description:`<strong>seed</strong> (NonNegativeInt) — | |
| Random seed for reproducibility. Defaults to 1234.`,name:"seed"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.trust_remote_code",description:`<strong>trust_remote_code</strong> (bool) — | |
| Whether to trust remote code when loading models. Defaults to False.`,name:"trust_remote_code"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.add_special_tokens",description:`<strong>add_special_tokens</strong> (bool) — | |
| Whether to add special tokens during tokenization. Defaults to True.`,name:"add_special_tokens"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.multichoice_continuations_start_space",description:`<strong>multichoice_continuations_start_space</strong> (bool) — | |
| Whether to add a space before multiple choice continuations. Defaults to True.`,name:"multichoice_continuations_start_space"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.pairwise_tokenization",description:`<strong>pairwise_tokenization</strong> (bool) — | |
| Whether to tokenize context and continuation separately for loglikelihood evals. Defaults to False.`,name:"pairwise_tokenization"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.max_num_seqs",description:`<strong>max_num_seqs</strong> (PositiveInt) — | |
| Maximum number of sequences per iteration. Controls batch size at prefill stage. Defaults to 128.`,name:"max_num_seqs"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.max_num_batched_tokens",description:`<strong>max_num_batched_tokens</strong> (PositiveInt) — | |
| Maximum number of tokens per batch. Defaults to 2048.`,name:"max_num_batched_tokens"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.subfolder",description:`<strong>subfolder</strong> (str | None) — | |
| Subfolder within the model repository. Defaults to None.`,name:"subfolder"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.is_async",description:`<strong>is_async</strong> (bool) — | |
| Whether to use the async version of VLLM. Defaults to False.`,name:"is_async"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.override_chat_template",description:`<strong>override_chat_template</strong> (bool) — | |
| If True, we force the model to use a chat template. If alse, we prevent the model from using | |
| a chat template. If None, we use the default (true if present in the tokenizer, false otherwise)`,name:"override_chat_template"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.generation_parameters",description:`<strong>generation_parameters</strong> (GenerationParameters, optional, defaults to empty GenerationParameters) — | |
| Configuration parameters that control text generation behavior, including | |
| temperature, top_p, max_new_tokens, etc.`,name:"generation_parameters"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.system_prompt",description:`<strong>system_prompt</strong> (str | None, optional, defaults to None) — Optional system prompt to be used with chat models. | |
| This prompt sets the behavior and context for the model during evaluation.`,name:"system_prompt"},{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.cache_dir",description:"<strong>cache_dir</strong> (str, optional, defaults to ”~/.cache/huggingface/lighteval”) — Directory to cache the model.",name:"cache_dir"}],source:"https://github.com/huggingface/lighteval/blob/vr_1027/src/lighteval/models/vllm/vllm_model.py#L76"}}),oe=new Y({props:{anchor:"lighteval.models.vllm.vllm_model.VLLMModelConfig.example",$$slots:{default:[Bo]},$$scope:{ctx:C}}}),Ce=new R({props:{title:"SGLang Model",local:"lighteval.models.sglang.sglang_model.SGLangModelConfig",headingTag:"h3"}}),Ne=new X({props:{name:"class lighteval.models.sglang.sglang_model.SGLangModelConfig",anchor:"lighteval.models.sglang.sglang_model.SGLangModelConfig",parameters:[{name:"model_name",val:": str"},{name:"generation_parameters",val:": GenerationParameters = GenerationParameters(num_blocks=None, block_size=None, early_stopping=None, repetition_penalty=None, frequency_penalty=None, length_penalty=None, presence_penalty=None, max_new_tokens=None, min_new_tokens=None, seed=None, stop_tokens=None, temperature=0, top_k=None, min_p=None, top_p=None, truncate_prompt=None, cache_implementation=None, response_format=None)"},{name:"system_prompt",val:": str | None = None"},{name:"cache_dir",val:": str = '~/.cache/huggingface/lighteval'"},{name:"load_format",val:": str = 'auto'"},{name:"dtype",val:": str = 'auto'"},{name:"tp_size",val:": typing.Annotated[int, Gt(gt=0)] = 1"},{name:"dp_size",val:": typing.Annotated[int, Gt(gt=0)] = 1"},{name:"context_length",val:": typing.Optional[typing.Annotated[int, Gt(gt=0)]] = None"},{name:"random_seed",val:": typing.Optional[typing.Annotated[int, Gt(gt=0)]] = 1234"},{name:"trust_remote_code",val:": bool = False"},{name:"device",val:": str = 'cuda'"},{name:"skip_tokenizer_init",val:": bool = False"},{name:"kv_cache_dtype",val:": str = 'auto'"},{name:"add_special_tokens",val:": bool = True"},{name:"pairwise_tokenization",val:": bool = False"},{name:"sampling_backend",val:": str | None = None"},{name:"attention_backend",val:": str | None = None"},{name:"mem_fraction_static",val:": typing.Annotated[float, Gt(gt=0)] = 0.8"},{name:"chunked_prefill_size",val:": typing.Annotated[int, Gt(gt=0)] = 4096"},{name:"override_chat_template",val:": bool = None"}],parametersDescription:[{anchor:"lighteval.models.sglang.sglang_model.SGLangModelConfig.model_name",description:`<strong>model_name</strong> (str) — | |
| HuggingFace Hub model ID or path to the model to load.`,name:"model_name"},{anchor:"lighteval.models.sglang.sglang_model.SGLangModelConfig.load_format",description:`<strong>load_format</strong> (str) — | |
| The format of the model weights to load. choices: auto, pt, safetensors, npcache, dummy, tensorizer, sharded_state, gguf, bitsandbytes, mistral, runai_streamer.`,name:"load_format"},{anchor:"lighteval.models.sglang.sglang_model.SGLangModelConfig.dtype",description:`<strong>dtype</strong> (str) — | |
| Data type for model weights. Defaults to “auto”. Options: “auto”, “float16”, “bfloat16”, “float32”.`,name:"dtype"},{anchor:"lighteval.models.sglang.sglang_model.SGLangModelConfig.tp_size",description:`<strong>tp_size</strong> (PositiveInt) — | |
| Number of GPUs to use for tensor parallelism. Defaults to 1.`,name:"tp_size"},{anchor:"lighteval.models.sglang.sglang_model.SGLangModelConfig.dp_size",description:`<strong>dp_size</strong> (PositiveInt) — | |
| Number of GPUs to use for data parallelism. Defaults to 1.`,name:"dp_size"},{anchor:"lighteval.models.sglang.sglang_model.SGLangModelConfig.context_length",description:`<strong>context_length</strong> (PositiveInt | None) — | |
| Maximum context length for the model.`,name:"context_length"},{anchor:"lighteval.models.sglang.sglang_model.SGLangModelConfig.random_seed",description:`<strong>random_seed</strong> (PositiveInt | None) — | |
| Random seed for reproducibility. Defaults to 1234.`,name:"random_seed"},{anchor:"lighteval.models.sglang.sglang_model.SGLangModelConfig.trust_remote_code",description:`<strong>trust_remote_code</strong> (bool) — | |
| Whether to trust remote code when loading models. Defaults to False.`,name:"trust_remote_code"},{anchor:"lighteval.models.sglang.sglang_model.SGLangModelConfig.device",description:`<strong>device</strong> (str) — | |
| Device to load the model on. Defaults to “cuda”.`,name:"device"},{anchor:"lighteval.models.sglang.sglang_model.SGLangModelConfig.skip_tokenizer_init",description:`<strong>skip_tokenizer_init</strong> (bool) — | |
| Whether to skip tokenizer initialization. Defaults to False.`,name:"skip_tokenizer_init"},{anchor:"lighteval.models.sglang.sglang_model.SGLangModelConfig.kv_cache_dtype",description:`<strong>kv_cache_dtype</strong> (str) — | |
| Data type for key-value cache. Defaults to “auto”.`,name:"kv_cache_dtype"},{anchor:"lighteval.models.sglang.sglang_model.SGLangModelConfig.add_special_tokens",description:`<strong>add_special_tokens</strong> (bool) — | |
| Whether to add special tokens during tokenization. Defaults to True.`,name:"add_special_tokens"},{anchor:"lighteval.models.sglang.sglang_model.SGLangModelConfig.pairwise_tokenization",description:`<strong>pairwise_tokenization</strong> (bool) — | |
| Whether to tokenize context and continuation separately for loglikelihood evals. Defaults to False.`,name:"pairwise_tokenization"},{anchor:"lighteval.models.sglang.sglang_model.SGLangModelConfig.sampling_backend",description:`<strong>sampling_backend</strong> (str | None) — | |
| Sampling backend to use. If None, uses default.`,name:"sampling_backend"},{anchor:"lighteval.models.sglang.sglang_model.SGLangModelConfig.attention_backend",description:`<strong>attention_backend</strong> (str | None) — | |
| Attention backend to use. If None, uses default.`,name:"attention_backend"},{anchor:"lighteval.models.sglang.sglang_model.SGLangModelConfig.mem_fraction_static",description:`<strong>mem_fraction_static</strong> (PositiveFloat) — | |
| Fraction of GPU memory to use for static allocation. Defaults to 0.8.`,name:"mem_fraction_static"},{anchor:"lighteval.models.sglang.sglang_model.SGLangModelConfig.chunked_prefill_size",description:`<strong>chunked_prefill_size</strong> (PositiveInt) — | |
| Size of chunks for prefill operations. Defaults to 4096.`,name:"chunked_prefill_size"},{anchor:"lighteval.models.sglang.sglang_model.SGLangModelConfig.override_chat_template",description:`<strong>override_chat_template</strong> (bool) — | |
| If True, we force the model to use a chat template. If alse, we prevent the model from using | |
| a chat template. If None, we use the default (true if present in the tokenizer, false otherwise)`,name:"override_chat_template"},{anchor:"lighteval.models.sglang.sglang_model.SGLangModelConfig.generation_parameters",description:`<strong>generation_parameters</strong> (GenerationParameters, optional, defaults to empty GenerationParameters) — | |
| Configuration parameters that control text generation behavior, including | |
| temperature, top_p, max_new_tokens, etc.`,name:"generation_parameters"},{anchor:"lighteval.models.sglang.sglang_model.SGLangModelConfig.system_prompt",description:`<strong>system_prompt</strong> (str | None, optional, defaults to None) — Optional system prompt to be used with chat models. | |
| This prompt sets the behavior and context for the model during evaluation.`,name:"system_prompt"},{anchor:"lighteval.models.sglang.sglang_model.SGLangModelConfig.cache_dir",description:"<strong>cache_dir</strong> (str, optional, defaults to ”~/.cache/huggingface/lighteval”) — Directory to cache the model.",name:"cache_dir"}],source:"https://github.com/huggingface/lighteval/blob/vr_1027/src/lighteval/models/sglang/sglang_model.py#L54"}}),le=new Y({props:{anchor:"lighteval.models.sglang.sglang_model.SGLangModelConfig.example",$$slots:{default:[Ro]},$$scope:{ctx:C}}}),$e=new R({props:{title:"Dummy Model",local:"lighteval.models.dummy.dummy_model.DummyModelConfig",headingTag:"h3"}}),Te=new X({props:{name:"class lighteval.models.dummy.dummy_model.DummyModelConfig",anchor:"lighteval.models.dummy.dummy_model.DummyModelConfig",parameters:[{name:"model_name",val:": str = 'dummy'"},{name:"generation_parameters",val:": GenerationParameters = GenerationParameters(num_blocks=None, block_size=None, early_stopping=None, repetition_penalty=None, frequency_penalty=None, length_penalty=None, presence_penalty=None, max_new_tokens=None, min_new_tokens=None, seed=None, stop_tokens=None, temperature=0, top_k=None, min_p=None, top_p=None, truncate_prompt=None, cache_implementation=None, response_format=None)"},{name:"system_prompt",val:": str | None = None"},{name:"cache_dir",val:": str = '~/.cache/huggingface/lighteval'"},{name:"seed",val:": int = 42"}],parametersDescription:[{anchor:"lighteval.models.dummy.dummy_model.DummyModelConfig.model_name",description:`<strong>model_name</strong> (str) — | |
| Name of your choice - “dummy” by default`,name:"model_name"},{anchor:"lighteval.models.dummy.dummy_model.DummyModelConfig.seed",description:`<strong>seed</strong> (int) — | |
| Random seed for reproducible dummy responses. Defaults to 42. | |
| This seed controls the randomness of the generated responses and log probabilities.`,name:"seed"}],source:"https://github.com/huggingface/lighteval/blob/vr_1027/src/lighteval/models/dummy/dummy_model.py#L35"}}),ae=new Y({props:{anchor:"lighteval.models.dummy.dummy_model.DummyModelConfig.example",$$slots:{default:[Xo]},$$scope:{ctx:C}}}),we=new R({props:{title:"Endpoints-based Models",local:"endpoints-based-models",headingTag:"h2"}}),Je=new R({props:{title:"Inference Providers Model",local:"lighteval.models.endpoints.inference_providers_model.InferenceProvidersModelConfig",headingTag:"h3"}}),Ie=new X({props:{name:"class lighteval.models.endpoints.inference_providers_model.InferenceProvidersModelConfig",anchor:"lighteval.models.endpoints.inference_providers_model.InferenceProvidersModelConfig",parameters:[{name:"model_name",val:": str"},{name:"generation_parameters",val:": GenerationParameters = GenerationParameters(num_blocks=None, block_size=None, early_stopping=None, repetition_penalty=None, frequency_penalty=None, length_penalty=None, presence_penalty=None, max_new_tokens=None, min_new_tokens=None, seed=None, stop_tokens=None, temperature=0, top_k=None, min_p=None, top_p=None, truncate_prompt=None, cache_implementation=None, response_format=None)"},{name:"system_prompt",val:": str | None = None"},{name:"cache_dir",val:": str = '~/.cache/huggingface/lighteval'"},{name:"provider",val:": str"},{name:"timeout",val:": int | None = None"},{name:"proxies",val:": typing.Optional[typing.Any] = None"},{name:"org_to_bill",val:": str | None = None"},{name:"parallel_calls_count",val:": typing.Annotated[int, Ge(ge=0)] = 10"}],parametersDescription:[{anchor:"lighteval.models.endpoints.inference_providers_model.InferenceProvidersModelConfig.model_name",description:`<strong>model_name</strong> (str) — | |
| Name or identifier of the model to use.`,name:"model_name"},{anchor:"lighteval.models.endpoints.inference_providers_model.InferenceProvidersModelConfig.provider",description:`<strong>provider</strong> (str) — | |
| Name of the inference provider. Examples: “together”, “anyscale”, “runpod”, etc.`,name:"provider"},{anchor:"lighteval.models.endpoints.inference_providers_model.InferenceProvidersModelConfig.timeout",description:`<strong>timeout</strong> (int | None) — | |
| Request timeout in seconds. If None, uses provider default.`,name:"timeout"},{anchor:"lighteval.models.endpoints.inference_providers_model.InferenceProvidersModelConfig.proxies",description:`<strong>proxies</strong> (Any | None) — | |
| Proxy configuration for requests. Can be a dict or proxy URL string.`,name:"proxies"},{anchor:"lighteval.models.endpoints.inference_providers_model.InferenceProvidersModelConfig.org_to_bill",description:`<strong>org_to_bill</strong> (str | None) — | |
| Organization to bill for API usage. If None, bills the user’s account.`,name:"org_to_bill"},{anchor:"lighteval.models.endpoints.inference_providers_model.InferenceProvidersModelConfig.parallel_calls_count",description:`<strong>parallel_calls_count</strong> (NonNegativeInt) — | |
| Number of parallel API calls to make. Defaults to 10. | |
| Higher values increase throughput but may hit rate limits.`,name:"parallel_calls_count"},{anchor:"lighteval.models.endpoints.inference_providers_model.InferenceProvidersModelConfig.generation_parameters",description:`<strong>generation_parameters</strong> (GenerationParameters, optional, defaults to empty GenerationParameters) — | |
| Configuration parameters that control text generation behavior, including | |
| temperature, top_p, max_new_tokens, etc.`,name:"generation_parameters"},{anchor:"lighteval.models.endpoints.inference_providers_model.InferenceProvidersModelConfig.system_prompt",description:`<strong>system_prompt</strong> (str | None, optional, defaults to None) — Optional system prompt to be used with chat models. | |
| This prompt sets the behavior and context for the model during evaluation.`,name:"system_prompt"},{anchor:"lighteval.models.endpoints.inference_providers_model.InferenceProvidersModelConfig.cache_dir",description:"<strong>cache_dir</strong> (str, optional, defaults to ”~/.cache/huggingface/lighteval”) — Directory to cache the model.",name:"cache_dir"}],source:"https://github.com/huggingface/lighteval/blob/vr_1027/src/lighteval/models/endpoints/inference_providers_model.py#L45"}}),se=new Y({props:{anchor:"lighteval.models.endpoints.inference_providers_model.InferenceProvidersModelConfig.example",$$slots:{default:[Fo]},$$scope:{ctx:C}}}),ke=new R({props:{title:"InferenceEndpointModel",local:"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig",headingTag:"h3"}}),Ue=new X({props:{name:"class lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig",anchor:"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig",parameters:[{name:"model_name",val:": str | None = None"},{name:"generation_parameters",val:": GenerationParameters = GenerationParameters(num_blocks=None, block_size=None, early_stopping=None, repetition_penalty=None, frequency_penalty=None, length_penalty=None, presence_penalty=None, max_new_tokens=None, min_new_tokens=None, seed=None, stop_tokens=None, temperature=0, top_k=None, min_p=None, top_p=None, truncate_prompt=None, cache_implementation=None, response_format=None)"},{name:"system_prompt",val:": str | None = None"},{name:"cache_dir",val:": str = '~/.cache/huggingface/lighteval'"},{name:"endpoint_name",val:": str | None = None"},{name:"reuse_existing",val:": bool = False"},{name:"accelerator",val:": str = 'gpu'"},{name:"dtype",val:": str | None = None"},{name:"vendor",val:": str = 'aws'"},{name:"region",val:": str = 'us-east-1'"},{name:"instance_size",val:": str | None = None"},{name:"instance_type",val:": str | None = None"},{name:"framework",val:": str = 'pytorch'"},{name:"endpoint_type",val:": str = 'protected'"},{name:"add_special_tokens",val:": bool = True"},{name:"revision",val:": str = 'main'"},{name:"namespace",val:": str | None = None"},{name:"image_url",val:": str | None = None"},{name:"env_vars",val:": dict | None = None"},{name:"batch_size",val:": int = 1"}],parametersDescription:[{anchor:"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig.endpoint_name",description:`<strong>endpoint_name</strong> (str | None) — | |
| Name for the inference endpoint. If None, auto-generated from model_name.`,name:"endpoint_name"},{anchor:"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig.model_name",description:`<strong>model_name</strong> (str | None) — | |
| HuggingFace Hub model ID to deploy. Required if endpoint_name is None.`,name:"model_name"},{anchor:"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig.reuse_existing",description:`<strong>reuse_existing</strong> (bool) — | |
| Whether to reuse an existing endpoint with the same name. Defaults to False.`,name:"reuse_existing"},{anchor:"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig.accelerator",description:`<strong>accelerator</strong> (str) — | |
| Type of accelerator to use. Defaults to “gpu”. Options: “gpu”, “cpu”.`,name:"accelerator"},{anchor:"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig.dtype",description:`<strong>dtype</strong> (str | None) — | |
| Model data type. If None, uses model default. Options: “float16”, “bfloat16”, “awq”, “gptq”, “8bit”, “4bit”.`,name:"dtype"},{anchor:"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig.vendor",description:`<strong>vendor</strong> (str) — | |
| Cloud vendor for the endpoint. Defaults to “aws”. Options: “aws”, “azure”, “gcp”.`,name:"vendor"},{anchor:"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig.region",description:`<strong>region</strong> (str) — | |
| Cloud region for the endpoint. Defaults to “us-east-1”.`,name:"region"},{anchor:"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig.instance_size",description:`<strong>instance_size</strong> (str | None) — | |
| Instance size for the endpoint. If None, auto-scaled.`,name:"instance_size"},{anchor:"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig.instance_type",description:`<strong>instance_type</strong> (str | None) — | |
| Instance type for the endpoint. If None, auto-scaled.`,name:"instance_type"},{anchor:"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig.framework",description:`<strong>framework</strong> (str) — | |
| ML framework to use. Defaults to “pytorch”.`,name:"framework"},{anchor:"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig.endpoint_type",description:`<strong>endpoint_type</strong> (str) — | |
| Type of endpoint. Defaults to “protected”. Options: “protected”, “public”.`,name:"endpoint_type"},{anchor:"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig.add_special_tokens",description:`<strong>add_special_tokens</strong> (bool) — | |
| Whether to add special tokens during tokenization. Defaults to True.`,name:"add_special_tokens"},{anchor:"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig.revision",description:`<strong>revision</strong> (str) — | |
| Git revision of the model. Defaults to “main”.`,name:"revision"},{anchor:"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig.namespace",description:`<strong>namespace</strong> (str | None) — | |
| Namespace for the endpoint. If None, uses current user’s namespace.`,name:"namespace"},{anchor:"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig.image_url",description:`<strong>image_url</strong> (str | None) — | |
| Custom Docker image URL. If None, uses default TGI image.`,name:"image_url"},{anchor:"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig.env_vars",description:`<strong>env_vars</strong> (dict | None) — | |
| Additional environment variables for the endpoint.`,name:"env_vars"},{anchor:"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig.batch_size",description:`<strong>batch_size</strong> (int) — | |
| Batch size for requests. Defaults to 1.`,name:"batch_size"},{anchor:"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig.generation_parameters",description:`<strong>generation_parameters</strong> (GenerationParameters, optional, defaults to empty GenerationParameters) — | |
| Configuration parameters that control text generation behavior, including | |
| temperature, top_p, max_new_tokens, etc.`,name:"generation_parameters"},{anchor:"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig.system_prompt",description:`<strong>system_prompt</strong> (str | None, optional, defaults to None) — Optional system prompt to be used with chat models. | |
| This prompt sets the behavior and context for the model during evaluation.`,name:"system_prompt"},{anchor:"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig.cache_dir",description:"<strong>cache_dir</strong> (str, optional, defaults to ”~/.cache/huggingface/lighteval”) — Directory to cache the model.",name:"cache_dir"}],source:"https://github.com/huggingface/lighteval/blob/vr_1027/src/lighteval/models/endpoints/endpoint_model.py#L108"}}),re=new Y({props:{anchor:"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig.example",$$slots:{default:[So]},$$scope:{ctx:C}}}),Ge=new X({props:{name:"class lighteval.models.endpoints.endpoint_model.ServerlessEndpointModelConfig",anchor:"lighteval.models.endpoints.endpoint_model.ServerlessEndpointModelConfig",parameters:[{name:"model_name",val:": str"},{name:"generation_parameters",val:": GenerationParameters = GenerationParameters(num_blocks=None, block_size=None, early_stopping=None, repetition_penalty=None, frequency_penalty=None, length_penalty=None, presence_penalty=None, max_new_tokens=None, min_new_tokens=None, seed=None, stop_tokens=None, temperature=0, top_k=None, min_p=None, top_p=None, truncate_prompt=None, cache_implementation=None, response_format=None)"},{name:"system_prompt",val:": str | None = None"},{name:"cache_dir",val:": str = '~/.cache/huggingface/lighteval'"},{name:"add_special_tokens",val:": bool = True"},{name:"batch_size",val:": int = 1"}],parametersDescription:[{anchor:"lighteval.models.endpoints.endpoint_model.ServerlessEndpointModelConfig.model_name",description:`<strong>model_name</strong> (str) — | |
| HuggingFace Hub model ID to use with the Inference API. | |
| Example: “meta-llama/Llama-3.1-8B-Instruct”`,name:"model_name"},{anchor:"lighteval.models.endpoints.endpoint_model.ServerlessEndpointModelConfig.add_special_tokens",description:`<strong>add_special_tokens</strong> (bool) — | |
| Whether to add special tokens during tokenization. Defaults to True.`,name:"add_special_tokens"},{anchor:"lighteval.models.endpoints.endpoint_model.ServerlessEndpointModelConfig.batch_size",description:`<strong>batch_size</strong> (int) — | |
| Batch size for requests. Defaults to 1 (serverless API limitation).`,name:"batch_size"},{anchor:"lighteval.models.endpoints.endpoint_model.ServerlessEndpointModelConfig.generation_parameters",description:`<strong>generation_parameters</strong> (GenerationParameters, optional, defaults to empty GenerationParameters) — | |
| Configuration parameters that control text generation behavior, including | |
| temperature, top_p, max_new_tokens, etc.`,name:"generation_parameters"},{anchor:"lighteval.models.endpoints.endpoint_model.ServerlessEndpointModelConfig.system_prompt",description:`<strong>system_prompt</strong> (str | None, optional, defaults to None) — Optional system prompt to be used with chat models. | |
| This prompt sets the behavior and context for the model during evaluation.`,name:"system_prompt"},{anchor:"lighteval.models.endpoints.endpoint_model.ServerlessEndpointModelConfig.cache_dir",description:"<strong>cache_dir</strong> (str, optional, defaults to ”~/.cache/huggingface/lighteval”) — Directory to cache the model.",name:"cache_dir"}],source:"https://github.com/huggingface/lighteval/blob/vr_1027/src/lighteval/models/endpoints/endpoint_model.py#L71"}}),ie=new Y({props:{anchor:"lighteval.models.endpoints.endpoint_model.ServerlessEndpointModelConfig.example",$$slots:{default:[qo]},$$scope:{ctx:C}}}),je=new R({props:{title:"TGI ModelClient",local:"lighteval.models.endpoints.tgi_model.TGIModelConfig",headingTag:"h3"}}),Le=new X({props:{name:"class lighteval.models.endpoints.tgi_model.TGIModelConfig",anchor:"lighteval.models.endpoints.tgi_model.TGIModelConfig",parameters:[{name:"model_name",val:": str | None"},{name:"generation_parameters",val:": GenerationParameters = GenerationParameters(num_blocks=None, block_size=None, early_stopping=None, repetition_penalty=None, frequency_penalty=None, length_penalty=None, presence_penalty=None, max_new_tokens=None, min_new_tokens=None, seed=None, stop_tokens=None, temperature=0, top_k=None, min_p=None, top_p=None, truncate_prompt=None, cache_implementation=None, response_format=None)"},{name:"system_prompt",val:": str | None = None"},{name:"cache_dir",val:": str = '~/.cache/huggingface/lighteval'"},{name:"inference_server_address",val:": str | None = None"},{name:"inference_server_auth",val:": str | None = None"},{name:"model_info",val:": dict | None = None"},{name:"batch_size",val:": int = 1"}],parametersDescription:[{anchor:"lighteval.models.endpoints.tgi_model.TGIModelConfig.inference_server_address",description:`<strong>inference_server_address</strong> (str | None) — | |
| Address of the TGI server. Format: “http://host:port” or “https://host:port”. | |
| Example: “http://localhost:8080”`,name:"inference_server_address"},{anchor:"lighteval.models.endpoints.tgi_model.TGIModelConfig.inference_server_auth",description:`<strong>inference_server_auth</strong> (str | None) — | |
| Authentication token for the TGI server. If None, no authentication is used.`,name:"inference_server_auth"},{anchor:"lighteval.models.endpoints.tgi_model.TGIModelConfig.model_name",description:`<strong>model_name</strong> (str | None) — | |
| Optional model name override. If None, uses the model name from server info.`,name:"model_name"},{anchor:"lighteval.models.endpoints.tgi_model.TGIModelConfig.generation_parameters",description:`<strong>generation_parameters</strong> (GenerationParameters, optional, defaults to empty GenerationParameters) — | |
| Configuration parameters that control text generation behavior, including | |
| temperature, top_p, max_new_tokens, etc.`,name:"generation_parameters"},{anchor:"lighteval.models.endpoints.tgi_model.TGIModelConfig.system_prompt",description:`<strong>system_prompt</strong> (str | None, optional, defaults to None) — Optional system prompt to be used with chat models. | |
| This prompt sets the behavior and context for the model during evaluation.`,name:"system_prompt"},{anchor:"lighteval.models.endpoints.tgi_model.TGIModelConfig.cache_dir",description:"<strong>cache_dir</strong> (str, optional, defaults to ”~/.cache/huggingface/lighteval”) — Directory to cache the model.",name:"cache_dir"}],source:"https://github.com/huggingface/lighteval/blob/vr_1027/src/lighteval/models/endpoints/tgi_model.py#L55"}}),me=new Y({props:{anchor:"lighteval.models.endpoints.tgi_model.TGIModelConfig.example",$$slots:{default:[Qo]},$$scope:{ctx:C}}}),De=new R({props:{title:"Litellm Model",local:"lighteval.models.endpoints.litellm_model.LiteLLMModelConfig",headingTag:"h3"}}),ze=new X({props:{name:"class lighteval.models.endpoints.litellm_model.LiteLLMModelConfig",anchor:"lighteval.models.endpoints.litellm_model.LiteLLMModelConfig",parameters:[{name:"model_name",val:": str"},{name:"generation_parameters",val:": GenerationParameters = GenerationParameters(num_blocks=None, block_size=None, early_stopping=None, repetition_penalty=None, frequency_penalty=None, length_penalty=None, presence_penalty=None, max_new_tokens=None, min_new_tokens=None, seed=None, stop_tokens=None, temperature=0, top_k=None, min_p=None, top_p=None, truncate_prompt=None, cache_implementation=None, response_format=None)"},{name:"system_prompt",val:": str | None = None"},{name:"cache_dir",val:": str = '~/.cache/huggingface/lighteval'"},{name:"provider",val:": str | None = None"},{name:"base_url",val:": str | None = None"},{name:"api_key",val:": str | None = None"},{name:"concurrent_requests",val:": int = 10"},{name:"verbose",val:": bool = False"},{name:"max_model_length",val:": int | None = None"},{name:"api_max_retry",val:": int = 8"},{name:"api_retry_sleep",val:": float = 1.0"},{name:"api_retry_multiplier",val:": float = 2.0"},{name:"timeout",val:": float | None = None"}],parametersDescription:[{anchor:"lighteval.models.endpoints.litellm_model.LiteLLMModelConfig.model_name",description:`<strong>model_name</strong> (str) — | |
| Model identifier. Can include provider prefix (e.g., “gpt-4”, “claude-3-sonnet”) | |
| or use provider/model format (e.g., “openai/gpt-4”, “anthropic/claude-3-sonnet”).`,name:"model_name"},{anchor:"lighteval.models.endpoints.litellm_model.LiteLLMModelConfig.provider",description:`<strong>provider</strong> (str | None) — | |
| Optional provider name override. If None, inferred from model_name. | |
| Examples: “openai”, “anthropic”, “google”, “cohere”, etc.`,name:"provider"},{anchor:"lighteval.models.endpoints.litellm_model.LiteLLMModelConfig.base_url",description:`<strong>base_url</strong> (str | None) — | |
| Custom base URL for the API. If None, uses provider’s default URL. | |
| Useful for using custom endpoints or local deployments.`,name:"base_url"},{anchor:"lighteval.models.endpoints.litellm_model.LiteLLMModelConfig.api_key",description:`<strong>api_key</strong> (str | None) — | |
| API key for authentication. If None, reads from environment variables. | |
| Environment variable names are provider-specific (e.g., OPENAI_API_KEY).`,name:"api_key"},{anchor:"lighteval.models.endpoints.litellm_model.LiteLLMModelConfig.concurrent_requests",description:`<strong>concurrent_requests</strong> (int) — | |
| Maximum number of concurrent API requests to execute in parallel. | |
| Higher values can improve throughput for batch processing but may hit rate limits | |
| or exhaust API quotas faster. Default is 10.`,name:"concurrent_requests"},{anchor:"lighteval.models.endpoints.litellm_model.LiteLLMModelConfig.verbose",description:`<strong>verbose</strong> (bool) — | |
| Whether to enable verbose logging. Default is False.`,name:"verbose"},{anchor:"lighteval.models.endpoints.litellm_model.LiteLLMModelConfig.max_model_length",description:`<strong>max_model_length</strong> (int | None) — | |
| Maximum context length for the model. If None, infers the model’s default max length.`,name:"max_model_length"},{anchor:"lighteval.models.endpoints.litellm_model.LiteLLMModelConfig.api_max_retry",description:`<strong>api_max_retry</strong> (int) — | |
| Maximum number of retries for API requests. Default is 8.`,name:"api_max_retry"},{anchor:"lighteval.models.endpoints.litellm_model.LiteLLMModelConfig.api_retry_sleep",description:`<strong>api_retry_sleep</strong> (float) — | |
| Initial sleep time (in seconds) between retries. Default is 1.0.`,name:"api_retry_sleep"},{anchor:"lighteval.models.endpoints.litellm_model.LiteLLMModelConfig.api_retry_multiplier",description:`<strong>api_retry_multiplier</strong> (float) — | |
| Multiplier for increasing sleep time between retries. Default is 2.0.`,name:"api_retry_multiplier"},{anchor:"lighteval.models.endpoints.litellm_model.LiteLLMModelConfig.timeout",description:`<strong>timeout</strong> (float) — | |
| Request timeout in seconds. Default is None (no timeout).`,name:"timeout"},{anchor:"lighteval.models.endpoints.litellm_model.LiteLLMModelConfig.generation_parameters",description:`<strong>generation_parameters</strong> (GenerationParameters, optional, defaults to empty GenerationParameters) — | |
| Configuration parameters that control text generation behavior, including | |
| temperature, top_p, max_new_tokens, etc.`,name:"generation_parameters"},{anchor:"lighteval.models.endpoints.litellm_model.LiteLLMModelConfig.system_prompt",description:`<strong>system_prompt</strong> (str | None, optional, defaults to None) — Optional system prompt to be used with chat models. | |
| This prompt sets the behavior and context for the model during evaluation.`,name:"system_prompt"},{anchor:"lighteval.models.endpoints.litellm_model.LiteLLMModelConfig.cache_dir",description:"<strong>cache_dir</strong> (str, optional, defaults to ”~/.cache/huggingface/lighteval”) — Directory to cache the model.",name:"cache_dir"}],source:"https://github.com/huggingface/lighteval/blob/vr_1027/src/lighteval/models/endpoints/litellm_model.py#L61"}}),de=new Y({props:{anchor:"lighteval.models.endpoints.litellm_model.LiteLLMModelConfig.example",$$slots:{default:[Yo]},$$scope:{ctx:C}}}),Ee=new R({props:{title:"Custom Model",local:"lighteval.models.custom.custom_model.CustomModelConfig",headingTag:"h2"}}),We=new X({props:{name:"class lighteval.models.custom.custom_model.CustomModelConfig",anchor:"lighteval.models.custom.custom_model.CustomModelConfig",parameters:[{name:"model_name",val:": str"},{name:"generation_parameters",val:": GenerationParameters = GenerationParameters(num_blocks=None, block_size=None, early_stopping=None, repetition_penalty=None, frequency_penalty=None, length_penalty=None, presence_penalty=None, max_new_tokens=None, min_new_tokens=None, seed=None, stop_tokens=None, temperature=0, top_k=None, min_p=None, top_p=None, truncate_prompt=None, cache_implementation=None, response_format=None)"},{name:"system_prompt",val:": str | None = None"},{name:"cache_dir",val:": str = '~/.cache/huggingface/lighteval'"},{name:"model_definition_file_path",val:": str"}],parametersDescription:[{anchor:"lighteval.models.custom.custom_model.CustomModelConfig.model",description:`<strong>model</strong> (str) — | |
| An identifier for the model. This can be used to track which model was evaluated | |
| in the results and logs.`,name:"model"},{anchor:"lighteval.models.custom.custom_model.CustomModelConfig.model_definition_file_path",description:`<strong>model_definition_file_path</strong> (str) — | |
| Path to a Python file containing the custom model implementation. This file must | |
| define exactly one class that inherits from LightevalModel. The class should | |
| implement all required methods from the LightevalModel interface.`,name:"model_definition_file_path"}],source:"https://github.com/huggingface/lighteval/blob/vr_1027/src/lighteval/models/custom/custom_model.py#L26"}}),pe=new Y({props:{anchor:"lighteval.models.custom.custom_model.CustomModelConfig.example",$$slots:{default:[Ho]},$$scope:{ctx:C}}}),Pe=new Ao({props:{source:"https://github.com/huggingface/lighteval/blob/main/docs/source/package_reference/models.mdx"}}),{c(){n=d("meta"),x=l(),c=d("p"),o=l(),_(g.$$.fragment),t=l(),_(f.$$.fragment),$t=l(),ge=d("p"),ge.innerHTML=Qn,Tt=l(),_(ce.$$.fragment),wt=l(),J=d("div"),_(fe.$$.fragment),en=l(),Ae=d("p"),Ae.textContent=Yn,tn=l(),Ze=d("p"),Ze.textContent=Hn,nn=l(),Ve=d("p"),Ve.textContent=On,on=l(),_(te.$$.fragment),Jt=l(),_(_e.$$.fragment),It=l(),_(he.$$.fragment),kt=l(),I=d("div"),_(ue.$$.fragment),ln=l(),Be=d("p"),Be.textContent=Kn,an=l(),Re=d("p"),Re.textContent=eo,sn=l(),_(ne.$$.fragment),rn=l(),Xe=d("p"),Xe.textContent=to,Ut=l(),ve=d("div"),_(Me.$$.fragment),Gt=l(),S=d("div"),_(be.$$.fragment),mn=l(),Fe=d("p"),Fe.textContent=no,dn=l(),Se=d("p"),Se.textContent=oo,jt=l(),_(ye.$$.fragment),Lt=l(),k=d("div"),_(xe.$$.fragment),pn=l(),qe=d("p"),qe.textContent=lo,gn=l(),Qe=d("p"),Qe.textContent=ao,cn=l(),Ye=d("p"),Ye.innerHTML=so,fn=l(),_(oe.$$.fragment),Dt=l(),_(Ce.$$.fragment),zt=l(),U=d("div"),_(Ne.$$.fragment),_n=l(),He=d("p"),He.textContent=ro,hn=l(),Oe=d("p"),Oe.textContent=io,un=l(),Ke=d("p"),Ke.innerHTML=mo,vn=l(),_(le.$$.fragment),Et=l(),_($e.$$.fragment),Wt=l(),E=d("div"),_(Te.$$.fragment),Mn=l(),et=d("p"),et.textContent=po,bn=l(),tt=d("p"),tt.textContent=go,yn=l(),_(ae.$$.fragment),Pt=l(),_(we.$$.fragment),At=l(),_(Je.$$.fragment),Zt=l(),$=d("div"),_(Ie.$$.fragment),xn=l(),nt=d("p"),nt.textContent=co,Cn=l(),ot=d("p"),ot.innerHTML=fo,Nn=l(),_(se.$$.fragment),$n=l(),lt=d("p"),lt.textContent=_o,Tn=l(),at=d("ul"),at.innerHTML=ho,Vt=l(),_(ke.$$.fragment),Bt=l(),N=d("div"),_(Ue.$$.fragment),wn=l(),st=d("p"),st.textContent=uo,Jn=l(),rt=d("p"),rt.textContent=vo,In=l(),it=d("p"),it.textContent=Mo,kn=l(),_(re.$$.fragment),Un=l(),mt=d("p"),mt.textContent=bo,Gn=l(),dt=d("ul"),dt.innerHTML=yo,Rt=l(),W=d("div"),_(Ge.$$.fragment),jn=l(),pt=d("p"),pt.textContent=xo,Ln=l(),gt=d("p"),gt.innerHTML=Co,Dn=l(),_(ie.$$.fragment),Xt=l(),_(je.$$.fragment),Ft=l(),G=d("div"),_(Le.$$.fragment),zn=l(),ct=d("p"),ct.textContent=No,En=l(),ft=d("p"),ft.innerHTML=$o,Wn=l(),_t=d("p"),_t.textContent=To,Pn=l(),_(me.$$.fragment),St=l(),_(De.$$.fragment),qt=l(),j=d("div"),_(ze.$$.fragment),An=l(),ht=d("p"),ht.textContent=wo,Zn=l(),ut=d("p"),ut.textContent=Jo,Vn=l(),vt=d("p"),vt.innerHTML=Io,Bn=l(),_(de.$$.fragment),Qt=l(),_(Ee.$$.fragment),Yt=l(),T=d("div"),_(We.$$.fragment),Rn=l(),Mt=d("p"),Mt.textContent=ko,Xn=l(),bt=d("p"),bt.textContent=Uo,Fn=l(),yt=d("p"),yt.textContent=Go,Sn=l(),_(pe.$$.fragment),qn=l(),xt=d("p"),xt.innerHTML=jo,Ht=l(),_(Pe.$$.fragment),Ot=l(),Ct=d("p"),this.h()},l(e){const s=Wo("svelte-u9bgzb",document.head);n=p(s,"META",{name:!0,content:!0}),s.forEach(i),x=a(e),c=p(e,"P",{}),D(c).forEach(i),o=a(e),h(g.$$.fragment,e),t=a(e),h(f.$$.fragment,e),$t=a(e),ge=p(e,"P",{"data-svelte-h":!0}),y(ge)!=="svelte-y8a0ub"&&(ge.innerHTML=Qn),Tt=a(e),h(ce.$$.fragment,e),wt=a(e),J=p(e,"DIV",{class:!0});var P=D(J);h(fe.$$.fragment,P),en=a(P),Ae=p(P,"P",{"data-svelte-h":!0}),y(Ae)!=="svelte-13egyki"&&(Ae.textContent=Yn),tn=a(P),Ze=p(P,"P",{"data-svelte-h":!0}),y(Ze)!=="svelte-kze4a9"&&(Ze.textContent=Hn),nn=a(P),Ve=p(P,"P",{"data-svelte-h":!0}),y(Ve)!=="svelte-1pezkfn"&&(Ve.textContent=On),on=a(P),h(te.$$.fragment,P),P.forEach(i),Jt=a(e),h(_e.$$.fragment,e),It=a(e),h(he.$$.fragment,e),kt=a(e),I=p(e,"DIV",{class:!0});var A=D(I);h(ue.$$.fragment,A),ln=a(A),Be=p(A,"P",{"data-svelte-h":!0}),y(Be)!=="svelte-jfdmvv"&&(Be.textContent=Kn),an=a(A),Re=p(A,"P",{"data-svelte-h":!0}),y(Re)!=="svelte-1p0fyj7"&&(Re.textContent=eo),sn=a(A),h(ne.$$.fragment,A),rn=a(A),Xe=p(A,"P",{"data-svelte-h":!0}),y(Xe)!=="svelte-5e5uz9"&&(Xe.textContent=to),A.forEach(i),Ut=a(e),ve=p(e,"DIV",{class:!0});var Nt=D(ve);h(Me.$$.fragment,Nt),Nt.forEach(i),Gt=a(e),S=p(e,"DIV",{class:!0});var ee=D(S);h(be.$$.fragment,ee),mn=a(ee),Fe=p(ee,"P",{"data-svelte-h":!0}),y(Fe)!=="svelte-1qnf2gp"&&(Fe.textContent=no),dn=a(ee),Se=p(ee,"P",{"data-svelte-h":!0}),y(Se)!=="svelte-upaa77"&&(Se.textContent=oo),ee.forEach(i),jt=a(e),h(ye.$$.fragment,e),Lt=a(e),k=p(e,"DIV",{class:!0});var Z=D(k);h(xe.$$.fragment,Z),pn=a(Z),qe=p(Z,"P",{"data-svelte-h":!0}),y(qe)!=="svelte-n349gz"&&(qe.textContent=lo),gn=a(Z),Qe=p(Z,"P",{"data-svelte-h":!0}),y(Qe)!=="svelte-1r03hj9"&&(Qe.textContent=ao),cn=a(Z),Ye=p(Z,"P",{"data-svelte-h":!0}),y(Ye)!=="svelte-1etqvmy"&&(Ye.innerHTML=so),fn=a(Z),h(oe.$$.fragment,Z),Z.forEach(i),Dt=a(e),h(Ce.$$.fragment,e),zt=a(e),U=p(e,"DIV",{class:!0});var V=D(U);h(Ne.$$.fragment,V),_n=a(V),He=p(V,"P",{"data-svelte-h":!0}),y(He)!=="svelte-i5i6i"&&(He.textContent=ro),hn=a(V),Oe=p(V,"P",{"data-svelte-h":!0}),y(Oe)!=="svelte-dxxmje"&&(Oe.textContent=io),un=a(V),Ke=p(V,"P",{"data-svelte-h":!0}),y(Ke)!=="svelte-1n8isjp"&&(Ke.innerHTML=mo),vn=a(V),h(le.$$.fragment,V),V.forEach(i),Et=a(e),h($e.$$.fragment,e),Wt=a(e),E=p(e,"DIV",{class:!0});var q=D(E);h(Te.$$.fragment,q),Mn=a(q),et=p(q,"P",{"data-svelte-h":!0}),y(et)!=="svelte-1vba8l6"&&(et.textContent=po),bn=a(q),tt=p(q,"P",{"data-svelte-h":!0}),y(tt)!=="svelte-1rsrr3u"&&(tt.textContent=go),yn=a(q),h(ae.$$.fragment,q),q.forEach(i),Pt=a(e),h(we.$$.fragment,e),At=a(e),h(Je.$$.fragment,e),Zt=a(e),$=p(e,"DIV",{class:!0});var L=D($);h(Ie.$$.fragment,L),xn=a(L),nt=p(L,"P",{"data-svelte-h":!0}),y(nt)!=="svelte-gecoou"&&(nt.textContent=co),Cn=a(L),ot=p(L,"P",{"data-svelte-h":!0}),y(ot)!=="svelte-18hwmzg"&&(ot.innerHTML=fo),Nn=a(L),h(se.$$.fragment,L),$n=a(L),lt=p(L,"P",{"data-svelte-h":!0}),y(lt)!=="svelte-fovr4a"&&(lt.textContent=_o),Tn=a(L),at=p(L,"UL",{"data-svelte-h":!0}),y(at)!=="svelte-1r9m7vj"&&(at.innerHTML=ho),L.forEach(i),Vt=a(e),h(ke.$$.fragment,e),Bt=a(e),N=p(e,"DIV",{class:!0});var w=D(N);h(Ue.$$.fragment,w),wn=a(w),st=p(w,"P",{"data-svelte-h":!0}),y(st)!=="svelte-1klsw5l"&&(st.textContent=uo),Jn=a(w),rt=p(w,"P",{"data-svelte-h":!0}),y(rt)!=="svelte-wo0tsj"&&(rt.textContent=vo),In=a(w),it=p(w,"P",{"data-svelte-h":!0}),y(it)!=="svelte-15132n7"&&(it.textContent=Mo),kn=a(w),h(re.$$.fragment,w),Un=a(w),mt=p(w,"P",{"data-svelte-h":!0}),y(mt)!=="svelte-fovr4a"&&(mt.textContent=bo),Gn=a(w),dt=p(w,"UL",{"data-svelte-h":!0}),y(dt)!=="svelte-1qs4d43"&&(dt.innerHTML=yo),w.forEach(i),Rt=a(e),W=p(e,"DIV",{class:!0});var Q=D(W);h(Ge.$$.fragment,Q),jn=a(Q),pt=p(Q,"P",{"data-svelte-h":!0}),y(pt)!=="svelte-z3ujua"&&(pt.textContent=xo),Ln=a(Q),gt=p(Q,"P",{"data-svelte-h":!0}),y(gt)!=="svelte-5jbc87"&&(gt.innerHTML=Co),Dn=a(Q),h(ie.$$.fragment,Q),Q.forEach(i),Xt=a(e),h(je.$$.fragment,e),Ft=a(e),G=p(e,"DIV",{class:!0});var B=D(G);h(Le.$$.fragment,B),zn=a(B),ct=p(B,"P",{"data-svelte-h":!0}),y(ct)!=="svelte-1ot4eb4"&&(ct.textContent=No),En=a(B),ft=p(B,"P",{"data-svelte-h":!0}),y(ft)!=="svelte-6bmr55"&&(ft.innerHTML=$o),Wn=a(B),_t=p(B,"P",{"data-svelte-h":!0}),y(_t)!=="svelte-cmee8i"&&(_t.textContent=To),Pn=a(B),h(me.$$.fragment,B),B.forEach(i),St=a(e),h(De.$$.fragment,e),qt=a(e),j=p(e,"DIV",{class:!0});var K=D(j);h(ze.$$.fragment,K),An=a(K),ht=p(K,"P",{"data-svelte-h":!0}),y(ht)!=="svelte-1ic97p7"&&(ht.textContent=wo),Zn=a(K),ut=p(K,"P",{"data-svelte-h":!0}),y(ut)!=="svelte-cuvhk5"&&(ut.textContent=Jo),Vn=a(K),vt=p(K,"P",{"data-svelte-h":!0}),y(vt)!=="svelte-6ax2ai"&&(vt.innerHTML=Io),Bn=a(K),h(de.$$.fragment,K),K.forEach(i),Qt=a(e),h(Ee.$$.fragment,e),Yt=a(e),T=p(e,"DIV",{class:!0});var F=D(T);h(We.$$.fragment,F),Rn=a(F),Mt=p(F,"P",{"data-svelte-h":!0}),y(Mt)!=="svelte-1bspzi1"&&(Mt.textContent=ko),Xn=a(F),bt=p(F,"P",{"data-svelte-h":!0}),y(bt)!=="svelte-12bfx7b"&&(bt.textContent=Uo),Fn=a(F),yt=p(F,"P",{"data-svelte-h":!0}),y(yt)!=="svelte-3nnpa5"&&(yt.textContent=Go),Sn=a(F),h(pe.$$.fragment,F),qn=a(F),xt=p(F,"P",{"data-svelte-h":!0}),y(xt)!=="svelte-1w0ij7s"&&(xt.innerHTML=jo),F.forEach(i),Ht=a(e),h(Pe.$$.fragment,e),Ot=a(e),Ct=p(e,"P",{}),D(Ct).forEach(i),this.h()},h(){z(n,"name","hf:doc:metadata"),z(n,"content",Ko),z(J,"class","docstring border-l-2 border-t-2 pl-4 pt-3.5 border-gray-100 rounded-tl-xl mb-6 mt-8"),z(I,"class","docstring border-l-2 border-t-2 pl-4 pt-3.5 border-gray-100 rounded-tl-xl mb-6 mt-8"),z(ve,"class","docstring border-l-2 border-t-2 pl-4 pt-3.5 border-gray-100 rounded-tl-xl mb-6 mt-8"),z(S,"class","docstring border-l-2 border-t-2 pl-4 pt-3.5 border-gray-100 rounded-tl-xl mb-6 mt-8"),z(k,"class","docstring border-l-2 border-t-2 pl-4 pt-3.5 border-gray-100 rounded-tl-xl mb-6 mt-8"),z(U,"class","docstring border-l-2 border-t-2 pl-4 pt-3.5 border-gray-100 rounded-tl-xl mb-6 mt-8"),z(E,"class","docstring border-l-2 border-t-2 pl-4 pt-3.5 border-gray-100 rounded-tl-xl mb-6 mt-8"),z($,"class","docstring border-l-2 border-t-2 pl-4 pt-3.5 border-gray-100 rounded-tl-xl mb-6 mt-8"),z(N,"class","docstring border-l-2 border-t-2 pl-4 pt-3.5 border-gray-100 rounded-tl-xl mb-6 mt-8"),z(W,"class","docstring border-l-2 border-t-2 pl-4 pt-3.5 border-gray-100 rounded-tl-xl mb-6 mt-8"),z(G,"class","docstring border-l-2 border-t-2 pl-4 pt-3.5 border-gray-100 rounded-tl-xl mb-6 mt-8"),z(j,"class","docstring border-l-2 border-t-2 pl-4 pt-3.5 border-gray-100 rounded-tl-xl mb-6 mt-8"),z(T,"class","docstring border-l-2 border-t-2 pl-4 pt-3.5 border-gray-100 rounded-tl-xl mb-6 mt-8")},m(e,s){r(document.head,n),m(e,x,s),m(e,c,s),m(e,o,s),u(g,e,s),m(e,t,s),u(f,e,s),m(e,$t,s),m(e,ge,s),m(e,Tt,s),u(ce,e,s),m(e,wt,s),m(e,J,s),u(fe,J,null),r(J,en),r(J,Ae),r(J,tn),r(J,Ze),r(J,nn),r(J,Ve),r(J,on),u(te,J,null),m(e,Jt,s),u(_e,e,s),m(e,It,s),u(he,e,s),m(e,kt,s),m(e,I,s),u(ue,I,null),r(I,ln),r(I,Be),r(I,an),r(I,Re),r(I,sn),u(ne,I,null),r(I,rn),r(I,Xe),m(e,Ut,s),m(e,ve,s),u(Me,ve,null),m(e,Gt,s),m(e,S,s),u(be,S,null),r(S,mn),r(S,Fe),r(S,dn),r(S,Se),m(e,jt,s),u(ye,e,s),m(e,Lt,s),m(e,k,s),u(xe,k,null),r(k,pn),r(k,qe),r(k,gn),r(k,Qe),r(k,cn),r(k,Ye),r(k,fn),u(oe,k,null),m(e,Dt,s),u(Ce,e,s),m(e,zt,s),m(e,U,s),u(Ne,U,null),r(U,_n),r(U,He),r(U,hn),r(U,Oe),r(U,un),r(U,Ke),r(U,vn),u(le,U,null),m(e,Et,s),u($e,e,s),m(e,Wt,s),m(e,E,s),u(Te,E,null),r(E,Mn),r(E,et),r(E,bn),r(E,tt),r(E,yn),u(ae,E,null),m(e,Pt,s),u(we,e,s),m(e,At,s),u(Je,e,s),m(e,Zt,s),m(e,$,s),u(Ie,$,null),r($,xn),r($,nt),r($,Cn),r($,ot),r($,Nn),u(se,$,null),r($,$n),r($,lt),r($,Tn),r($,at),m(e,Vt,s),u(ke,e,s),m(e,Bt,s),m(e,N,s),u(Ue,N,null),r(N,wn),r(N,st),r(N,Jn),r(N,rt),r(N,In),r(N,it),r(N,kn),u(re,N,null),r(N,Un),r(N,mt),r(N,Gn),r(N,dt),m(e,Rt,s),m(e,W,s),u(Ge,W,null),r(W,jn),r(W,pt),r(W,Ln),r(W,gt),r(W,Dn),u(ie,W,null),m(e,Xt,s),u(je,e,s),m(e,Ft,s),m(e,G,s),u(Le,G,null),r(G,zn),r(G,ct),r(G,En),r(G,ft),r(G,Wn),r(G,_t),r(G,Pn),u(me,G,null),m(e,St,s),u(De,e,s),m(e,qt,s),m(e,j,s),u(ze,j,null),r(j,An),r(j,ht),r(j,Zn),r(j,ut),r(j,Vn),r(j,vt),r(j,Bn),u(de,j,null),m(e,Qt,s),u(Ee,e,s),m(e,Yt,s),m(e,T,s),u(We,T,null),r(T,Rn),r(T,Mt),r(T,Xn),r(T,bt),r(T,Fn),r(T,yt),r(T,Sn),u(pe,T,null),r(T,qn),r(T,xt),m(e,Ht,s),u(Pe,e,s),m(e,Ot,s),m(e,Ct,s),Kt=!0},p(e,[s]){const P={};s&2&&(P.$$scope={dirty:s,ctx:e}),te.$set(P);const A={};s&2&&(A.$$scope={dirty:s,ctx:e}),ne.$set(A);const Nt={};s&2&&(Nt.$$scope={dirty:s,ctx:e}),oe.$set(Nt);const ee={};s&2&&(ee.$$scope={dirty:s,ctx:e}),le.$set(ee);const Z={};s&2&&(Z.$$scope={dirty:s,ctx:e}),ae.$set(Z);const V={};s&2&&(V.$$scope={dirty:s,ctx:e}),se.$set(V);const q={};s&2&&(q.$$scope={dirty:s,ctx:e}),re.$set(q);const L={};s&2&&(L.$$scope={dirty:s,ctx:e}),ie.$set(L);const w={};s&2&&(w.$$scope={dirty:s,ctx:e}),me.$set(w);const Q={};s&2&&(Q.$$scope={dirty:s,ctx:e}),de.$set(Q);const B={};s&2&&(B.$$scope={dirty:s,ctx:e}),pe.$set(B)},i(e){Kt||(v(g.$$.fragment,e),v(f.$$.fragment,e),v(ce.$$.fragment,e),v(fe.$$.fragment,e),v(te.$$.fragment,e),v(_e.$$.fragment,e),v(he.$$.fragment,e),v(ue.$$.fragment,e),v(ne.$$.fragment,e),v(Me.$$.fragment,e),v(be.$$.fragment,e),v(ye.$$.fragment,e),v(xe.$$.fragment,e),v(oe.$$.fragment,e),v(Ce.$$.fragment,e),v(Ne.$$.fragment,e),v(le.$$.fragment,e),v($e.$$.fragment,e),v(Te.$$.fragment,e),v(ae.$$.fragment,e),v(we.$$.fragment,e),v(Je.$$.fragment,e),v(Ie.$$.fragment,e),v(se.$$.fragment,e),v(ke.$$.fragment,e),v(Ue.$$.fragment,e),v(re.$$.fragment,e),v(Ge.$$.fragment,e),v(ie.$$.fragment,e),v(je.$$.fragment,e),v(Le.$$.fragment,e),v(me.$$.fragment,e),v(De.$$.fragment,e),v(ze.$$.fragment,e),v(de.$$.fragment,e),v(Ee.$$.fragment,e),v(We.$$.fragment,e),v(pe.$$.fragment,e),v(Pe.$$.fragment,e),Kt=!0)},o(e){M(g.$$.fragment,e),M(f.$$.fragment,e),M(ce.$$.fragment,e),M(fe.$$.fragment,e),M(te.$$.fragment,e),M(_e.$$.fragment,e),M(he.$$.fragment,e),M(ue.$$.fragment,e),M(ne.$$.fragment,e),M(Me.$$.fragment,e),M(be.$$.fragment,e),M(ye.$$.fragment,e),M(xe.$$.fragment,e),M(oe.$$.fragment,e),M(Ce.$$.fragment,e),M(Ne.$$.fragment,e),M(le.$$.fragment,e),M($e.$$.fragment,e),M(Te.$$.fragment,e),M(ae.$$.fragment,e),M(we.$$.fragment,e),M(Je.$$.fragment,e),M(Ie.$$.fragment,e),M(se.$$.fragment,e),M(ke.$$.fragment,e),M(Ue.$$.fragment,e),M(re.$$.fragment,e),M(Ge.$$.fragment,e),M(ie.$$.fragment,e),M(je.$$.fragment,e),M(Le.$$.fragment,e),M(me.$$.fragment,e),M(De.$$.fragment,e),M(ze.$$.fragment,e),M(de.$$.fragment,e),M(Ee.$$.fragment,e),M(We.$$.fragment,e),M(pe.$$.fragment,e),M(Pe.$$.fragment,e),Kt=!1},d(e){e&&(i(x),i(c),i(o),i(t),i($t),i(ge),i(Tt),i(wt),i(J),i(Jt),i(It),i(kt),i(I),i(Ut),i(ve),i(Gt),i(S),i(jt),i(Lt),i(k),i(Dt),i(zt),i(U),i(Et),i(Wt),i(E),i(Pt),i(At),i(Zt),i($),i(Vt),i(Bt),i(N),i(Rt),i(W),i(Xt),i(Ft),i(G),i(St),i(qt),i(j),i(Qt),i(Yt),i(T),i(Ht),i(Ot),i(Ct)),i(n),b(g,e),b(f,e),b(ce,e),b(fe),b(te),b(_e,e),b(he,e),b(ue),b(ne),b(Me),b(be),b(ye,e),b(xe),b(oe),b(Ce,e),b(Ne),b(le),b($e,e),b(Te),b(ae),b(we,e),b(Je,e),b(Ie),b(se),b(ke,e),b(Ue),b(re),b(Ge),b(ie),b(je,e),b(Le),b(me),b(De,e),b(ze),b(de),b(Ee,e),b(We),b(pe),b(Pe,e)}}}const Ko='{"title":"Model Configs","local":"model-configs","sections":[{"title":"Base model config","local":"lighteval.models.abstract_model.ModelConfig","sections":[],"depth":3},{"title":"Local Models","local":"local-models","sections":[{"title":"Transformers Model","local":"lighteval.models.transformers.transformers_model.TransformersModelConfig","sections":[],"depth":3},{"title":"VLLM Model","local":"lighteval.models.vllm.vllm_model.VLLMModelConfig","sections":[],"depth":3},{"title":"SGLang Model","local":"lighteval.models.sglang.sglang_model.SGLangModelConfig","sections":[],"depth":3},{"title":"Dummy Model","local":"lighteval.models.dummy.dummy_model.DummyModelConfig","sections":[],"depth":3}],"depth":2},{"title":"Endpoints-based Models","local":"endpoints-based-models","sections":[{"title":"Inference Providers Model","local":"lighteval.models.endpoints.inference_providers_model.InferenceProvidersModelConfig","sections":[],"depth":3},{"title":"InferenceEndpointModel","local":"lighteval.models.endpoints.endpoint_model.InferenceEndpointModelConfig","sections":[],"depth":3},{"title":"TGI ModelClient","local":"lighteval.models.endpoints.tgi_model.TGIModelConfig","sections":[],"depth":3},{"title":"Litellm Model","local":"lighteval.models.endpoints.litellm_model.LiteLLMModelConfig","sections":[],"depth":3}],"depth":2},{"title":"Custom Model","local":"lighteval.models.custom.custom_model.CustomModelConfig","sections":[],"depth":2}],"depth":1}';function el(C){return Do(()=>{new URLSearchParams(window.location.search).get("fw")}),[]}class rl extends zo{constructor(n){super(),Eo(this,n,el,Oo,Lo,{})}}export{rl as component}; | |
Xet Storage Details
- Size:
- 95.3 kB
- Xet hash:
- 3d52aa83ec06230c09ccdcbe03c29e6e96824f9cb43186352d8b8c1e1749308e
·
Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.