Buckets:
| import{s as Gt,n as Ct,o as xt}from"../chunks/scheduler.7da89386.js";import{S as Zt,i as Wt,g as d,s as i,r as a,A as Et,h as u,f as n,c as s,j as It,u as r,x as M,k as vt,y as Ht,a as l,v as o,d as p,t as m,w as g}from"../chunks/index.20910acc.js";import{C as me}from"../chunks/CodeBlock.143bd81e.js";import{H as f,E as Bt}from"../chunks/getInferenceSnippets.375cdad5.js";function _t(pt){let c,de,ge,ue,y,Me,$,mt=`An alternative to launching the evaluation locally is to serve the model on a | |
| TGI-compatible server/container and then run the evaluation by sending requests | |
| to the server. The command is the same as before, except you specify a path to | |
| a YAML configuration file (detailed below):`,ce,h,ye,T,gt=`There are two types of configuration files that can be provided for running on | |
| the server:`,$e,w,he,U,ft=`To launch a model using Hugging Face’s Inference Endpoints, you need to provide | |
| the following file: <code>endpoint_model.yaml</code>. Lighteval will automatically deploy | |
| the endpoint, run the evaluation, and finally delete the endpoint (unless you | |
| specify an endpoint that was already launched, in which case the endpoint won’t | |
| be deleted afterwards).`,Te,j,we,J,Ue,b,je,I,dt=`To use a model already deployed on a TGI server, for example on Hugging Face’s | |
| serverless inference.`,Je,v,be,G,Ie,C,ve,x,Ge,Z,Ce,W,ut="<li><code>model_name</code>: The Hugging Face model ID to deploy</li> <li><code>revision</code>: Model revision (defaults to “main”)</li> <li><code>dtype</code>: Data type for model weights (“float16”, “bfloat16”, “4bit”, “8bit”, etc.)</li> <li><code>framework</code>: Framework to use (“pytorch”, “tensorflow”)</li>",xe,E,Ze,H,Mt="<li><code>accelerator</code>: Hardware accelerator (“gpu”, “cpu”)</li> <li><code>region</code>: AWS region for deployment</li> <li><code>vendor</code>: Cloud vendor (“aws”, “azure”, “gcp”)</li> <li><code>instance_type</code>: Instance type (e.g., “nvidia-a10g”, “nvidia-t4”)</li> <li><code>instance_size</code>: Instance size (“x1”, “x2”, etc.)</li>",We,B,Ee,_,ct="<li><code>endpoint_type</code>: Endpoint access level (“public”, “protected”, “private”)</li> <li><code>namespace</code>: Organization namespace for deployment</li> <li><code>reuse_existing</code>: Whether to reuse an existing endpoint</li> <li><code>endpoint_name</code>: Custom endpoint name (lowercase, no special characters)</li>",He,k,Be,q,yt="<li><code>image_url</code>: Custom Docker image URL</li> <li><code>env_vars</code>: Environment variables for the endpoint</li>",_e,A,ke,F,qe,S,$t="<li><code>inference_server_address</code>: URL of the TGI server</li> <li><code>inference_server_auth</code>: Authentication credentials</li> <li><code>model_id</code>: Model identifier (if using local model directory)</li>",Ae,V,Fe,L,Se,R,Ve,z,Le,X,Re,Y,ze,N,Xe,Q,Ye,D,Ne,P,ht='<li>Endpoints are automatically deleted after evaluation (unless <code>reuse_existing: true</code>)</li> <li>Costs are based on instance type and runtime</li> <li>Monitor usage in the <a href="https://huggingface.co/settings/billing" rel="nofollow">Hugging Face billing dashboard</a></li>',Qe,O,De,K,Tt="<li>No additional costs beyond your existing server infrastructure</li> <li>Useful for cost-effective evaluation of already-deployed models</li>",Pe,ee,Oe,te,Ke,ne,wt="<li><strong>Endpoint Deployment Failures</strong>: Check instance availability in your region</li> <li><strong>Authentication Errors</strong>: Ensure proper Hugging Face token permissions</li> <li><strong>Model Loading Errors</strong>: Verify model name and revision are correct</li> <li><strong>Resource Constraints</strong>: Choose appropriate instance type for your model size</li>",et,le,tt,ie,Ut="<li>Use appropriate instance types for your model size</li> <li>Consider using quantized models (4bit, 8bit) for cost savings</li> <li>Reuse existing endpoints for multiple evaluations</li> <li>Use serverless TGI for cost-effective evaluation</li>",nt,se,lt,ae,jt="Common error messages and solutions:",it,re,Jt="<li><strong>“Instance not available”</strong>: Try a different region or instance type</li> <li><strong>“Model not found”</strong>: Check the model name and revision</li> <li><strong>“Insufficient permissions”</strong>: Verify your Hugging Face token has endpoint deployment permissions</li> <li><strong>“Endpoint already exists”</strong>: Use <code>reuse_existing: true</code> or choose a different endpoint name</li>",st,oe,bt='For more detailed information about Hugging Face Inference Endpoints, see the <a href="https://huggingface.co/docs/inference-endpoints/" rel="nofollow">official documentation</a>.',at,pe,rt,fe,ot;return y=new f({props:{title:"Using Hugging Face Inference Endpoints or TGI as Backend",local:"using-hugging-face-inference-endpoints-or-tgi-as-backend",headingTag:"h1"}}),h=new me({props:{code:"bGlnaHRldmFsJTIwZW5kcG9pbnQlMjAlN0J0Z2klMkNpbmZlcmVuY2UtZW5kcG9pbnQlN0QlMjAlNUMlMEElMjAlMjAlMjAlMjAlMjIlMkZwYXRoJTJGdG8lMkZjb25maWclMkZmaWxlJTIyJTIwJTVDJTBBJTIwJTIwJTIwJTIwJTNDdGFza19wYXJhbWV0ZXJzJTNF",highlighted:`lighteval endpoint {tgi,inference-endpoint} \\ | |
| <span class="hljs-string">"/path/to/config/file"</span> \\ | |
| <task_parameters>`,wrap:!1}}),w=new f({props:{title:"Hugging Face Inference Endpoints",local:"hugging-face-inference-endpoints",headingTag:"h2"}}),j=new f({props:{title:"Configuration File Example",local:"configuration-file-example",headingTag:"h3"}}),J=new me({props:{code:"bW9kZWxfcGFyYW1ldGVycyUzQSUwQSUyMCUyMCUyMCUyMHJldXNlX2V4aXN0aW5nJTNBJTIwZmFsc2UlMjAlMjMlMjBJZiUyMHRydWUlMkMlMjBpZ25vcmUlMjBhbGwlMjBwYXJhbXMlMjBpbiUyMGluc3RhbmNlJTJDJTIwYW5kJTIwZG9uJ3QlMjBkZWxldGUlMjB0aGUlMjBlbmRwb2ludCUyMGFmdGVyJTIwZXZhbHVhdGlvbiUwQSUyMCUyMCUyMCUyMCUyMyUyMGVuZHBvaW50X25hbWUlM0ElMjAlMjJsbGFtYS0yLTdCLWxpZ2h0ZXZhbCUyMiUyMCUyMyUyME5lZWRzJTIwdG8lMjBiZSUyMGxvd2VyY2FzZSUyMHdpdGhvdXQlMjBzcGVjaWFsJTIwY2hhcmFjdGVycyUwQSUyMCUyMCUyMCUyMG1vZGVsX25hbWUlM0ElMjAlMjJtZXRhLWxsYW1hJTJGTGxhbWEtMi03Yi1oZiUyMiUwQSUyMCUyMCUyMCUyMHJldmlzaW9uJTNBJTIwJTIybWFpbiUyMiUyMCUyMCUyMyUyMERlZmF1bHRzJTIwdG8lMjAlMjJtYWluJTIyJTBBJTIwJTIwJTIwJTIwZHR5cGUlM0ElMjAlMjJmbG9hdDE2JTIyJTIwJTIzJTIwQ2FuJTIwYmUlMjBhbnklMjBvZiUyMCUyMmF3cSUyMiUyQyUyMCUyMmVldHElMjIlMkMlMjAlMjJncHRxJTIyJTJDJTIwJTIyNGJpdCUyMiUyMG9yJTIwJTIyOGJpdCUyMiUyMCh3aWxsJTIwdXNlJTIwYml0c2FuZGJ5dGVzKSUyQyUyMCUyMmJmbG9hdDE2JTIyJTIwb3IlMjAlMjJmbG9hdDE2JTIyJTBBJTIwJTIwJTIwJTIwYWNjZWxlcmF0b3IlM0ElMjAlMjJncHUlMjIlMEElMjAlMjAlMjAlMjByZWdpb24lM0ElMjAlMjJldS13ZXN0LTElMjIlMEElMjAlMjAlMjAlMjB2ZW5kb3IlM0ElMjAlMjJhd3MlMjIlMEElMjAlMjAlMjAlMjBpbnN0YW5jZV90eXBlJTNBJTIwJTIybnZpZGlhLWExMGclMjIlMEElMjAlMjAlMjAlMjBpbnN0YW5jZV9zaXplJTNBJTIwJTIyeDElMjIlMEElMjAlMjAlMjAlMjBmcmFtZXdvcmslM0ElMjAlMjJweXRvcmNoJTIyJTBBJTIwJTIwJTIwJTIwZW5kcG9pbnRfdHlwZSUzQSUyMCUyMnByb3RlY3RlZCUyMiUwQSUyMCUyMCUyMCUyMG5hbWVzcGFjZSUzQSUyMG51bGwlMjAlMjMlMjBUaGUlMjBuYW1lc3BhY2UlMjB1bmRlciUyMHdoaWNoJTIwdG8lMjBsYXVuY2glMjB0aGUlMjBlbmRwb2ludC4lMjBEZWZhdWx0cyUyMHRvJTIwdGhlJTIwY3VycmVudCUyMHVzZXIncyUyMG5hbWVzcGFjZSUwQSUyMCUyMCUyMCUyMGltYWdlX3VybCUzQSUyMG51bGwlMjAlMjMlMjBPcHRpb25hbGx5JTIwc3BlY2lmeSUyMHRoZSUyMGRvY2tlciUyMGltYWdlJTIwdG8lMjB1c2UlMjB3aGVuJTIwbGF1bmNoaW5nJTIwdGhlJTIwZW5kcG9pbnQlMjBtb2RlbC4lMjBFLmcuJTJDJTIwbGF1bmNoaW5nJTIwbW9kZWxzJTIwd2l0aCUyMGxhdGVyJTIwcmVsZWFzZXMlMjBvZiUyMHRoZSUyMFRHSSUyMGNvbnRhaW5lciUyMHdpdGglMjBzdXBwb3J0JTIwZm9yJTIwbmV3ZXIlMjBtb2RlbHMuJTBBJTIwJTIwJTIwJTIwZW52X3ZhcnMlM0ElMjBudWxsJTIwJTIzJTIwT3B0aW9uYWwlMjBlbnZpcm9ubWVudCUyMHZhcmlhYmxlcyUyMHRvJTIwaW5jbHVkZSUyMHdoZW4lMjBsYXVuY2hpbmclMjB0aGUlMjBlbmRwb2ludC4lMjBlLmcuJTJDJTIwJTYwTUFYX0lOUFVUX0xFTkdUSCUzQSUyMDIwNDglNjA=",highlighted:`<span class="hljs-attr">model_parameters:</span> | |
| <span class="hljs-attr">reuse_existing:</span> <span class="hljs-literal">false</span> <span class="hljs-comment"># If true, ignore all params in instance, and don't delete the endpoint after evaluation</span> | |
| <span class="hljs-comment"># endpoint_name: "llama-2-7B-lighteval" # Needs to be lowercase without special characters</span> | |
| <span class="hljs-attr">model_name:</span> <span class="hljs-string">"meta-llama/Llama-2-7b-hf"</span> | |
| <span class="hljs-attr">revision:</span> <span class="hljs-string">"main"</span> <span class="hljs-comment"># Defaults to "main"</span> | |
| <span class="hljs-attr">dtype:</span> <span class="hljs-string">"float16"</span> <span class="hljs-comment"># Can be any of "awq", "eetq", "gptq", "4bit" or "8bit" (will use bitsandbytes), "bfloat16" or "float16"</span> | |
| <span class="hljs-attr">accelerator:</span> <span class="hljs-string">"gpu"</span> | |
| <span class="hljs-attr">region:</span> <span class="hljs-string">"eu-west-1"</span> | |
| <span class="hljs-attr">vendor:</span> <span class="hljs-string">"aws"</span> | |
| <span class="hljs-attr">instance_type:</span> <span class="hljs-string">"nvidia-a10g"</span> | |
| <span class="hljs-attr">instance_size:</span> <span class="hljs-string">"x1"</span> | |
| <span class="hljs-attr">framework:</span> <span class="hljs-string">"pytorch"</span> | |
| <span class="hljs-attr">endpoint_type:</span> <span class="hljs-string">"protected"</span> | |
| <span class="hljs-attr">namespace:</span> <span class="hljs-literal">null</span> <span class="hljs-comment"># The namespace under which to launch the endpoint. Defaults to the current user's namespace</span> | |
| <span class="hljs-attr">image_url:</span> <span class="hljs-literal">null</span> <span class="hljs-comment"># Optionally specify the docker image to use when launching the endpoint model. E.g., launching models with later releases of the TGI container with support for newer models.</span> | |
| <span class="hljs-attr">env_vars:</span> <span class="hljs-literal">null</span> <span class="hljs-comment"># Optional environment variables to include when launching the endpoint. e.g., \`MAX_INPUT_LENGTH: 2048\`</span>`,wrap:!1}}),b=new f({props:{title:"Text Generation Inference (TGI)",local:"text-generation-inference-tgi",headingTag:"h2"}}),v=new f({props:{title:"Configuration File Example",local:"configuration-file-example",headingTag:"h3"}}),G=new me({props:{code:"bW9kZWxfcGFyYW1ldGVycyUzQSUwQSUyMCUyMCUyMCUyMGluZmVyZW5jZV9zZXJ2ZXJfYWRkcmVzcyUzQSUyMCUyMiUyMiUwQSUyMCUyMCUyMCUyMGluZmVyZW5jZV9zZXJ2ZXJfYXV0aCUzQSUyMG51bGwlMEElMjAlMjAlMjAlMjBtb2RlbF9pZCUzQSUyMG51bGwlMjAlMjMlMjBPcHRpb25hbCUyQyUyMG9ubHklMjByZXF1aXJlZCUyMGlmJTIwdGhlJTIwVEdJJTIwY29udGFpbmVyJTIwd2FzJTIwbGF1bmNoZWQlMjB3aXRoJTIwbW9kZWxfaWQlMjBwb2ludGluZyUyMHRvJTIwYSUyMGxvY2FsJTIwZGlyZWN0b3J5",highlighted:`<span class="hljs-attr">model_parameters:</span> | |
| <span class="hljs-attr">inference_server_address:</span> <span class="hljs-string">""</span> | |
| <span class="hljs-attr">inference_server_auth:</span> <span class="hljs-literal">null</span> | |
| <span class="hljs-attr">model_id:</span> <span class="hljs-literal">null</span> <span class="hljs-comment"># Optional, only required if the TGI container was launched with model_id pointing to a local directory</span>`,wrap:!1}}),C=new f({props:{title:"Key Parameters",local:"key-parameters",headingTag:"h2"}}),x=new f({props:{title:"Hugging Face Inference Endpoints",local:"hugging-face-inference-endpoints",headingTag:"h3"}}),Z=new f({props:{title:"Model Configuration",local:"model-configuration",headingTag:"h4"}}),E=new f({props:{title:"Infrastructure Settings",local:"infrastructure-settings",headingTag:"h4"}}),B=new f({props:{title:"Endpoint Configuration",local:"endpoint-configuration",headingTag:"h4"}}),k=new f({props:{title:"Advanced Settings",local:"advanced-settings",headingTag:"h4"}}),A=new f({props:{title:"Text Generation Inference (TGI)",local:"text-generation-inference-tgi",headingTag:"h3"}}),F=new f({props:{title:"Server Configuration",local:"server-configuration",headingTag:"h4"}}),V=new f({props:{title:"Usage Examples",local:"usage-examples",headingTag:"h2"}}),L=new f({props:{title:"Deploying a New Inference Endpoint",local:"deploying-a-new-inference-endpoint",headingTag:"h3"}}),R=new me({props:{code:"bGlnaHRldmFsJTIwZW5kcG9pbnQlMjBpbmZlcmVuY2UtZW5kcG9pbnQlMjAlNUMlMEElMjAlMjAlMjAlMjAlMjJjb25maWdzJTJGZW5kcG9pbnRfbW9kZWwueWFtbCUyMiUyMCU1QyUwQSUyMCUyMCUyMCUyMCUyMmxpZ2h0ZXZhbCU3Q2dzbThrJTdDMCUyMg==",highlighted:`lighteval endpoint inference-endpoint \\ | |
| <span class="hljs-string">"configs/endpoint_model.yaml"</span> \\ | |
| <span class="hljs-string">"lighteval|gsm8k|0"</span>`,wrap:!1}}),z=new f({props:{title:"Using an Existing TGI Server",local:"using-an-existing-tgi-server",headingTag:"h3"}}),X=new me({props:{code:"bGlnaHRldmFsJTIwZW5kcG9pbnQlMjB0Z2klMjAlNUMlMEElMjAlMjAlMjAlMjAlMjJjb25maWdzJTJGdGdpX3NlcnZlci55YW1sJTIyJTIwJTVDJTBBJTIwJTIwJTIwJTIwJTIybGlnaHRldmFsJTdDZ3NtOGslN0MwJTIy",highlighted:`lighteval endpoint tgi \\ | |
| <span class="hljs-string">"configs/tgi_server.yaml"</span> \\ | |
| <span class="hljs-string">"lighteval|gsm8k|0"</span>`,wrap:!1}}),Y=new f({props:{title:"Reusing an Existing Endpoint",local:"reusing-an-existing-endpoint",headingTag:"h3"}}),N=new me({props:{code:"bW9kZWxfcGFyYW1ldGVycyUzQSUwQSUyMCUyMCUyMCUyMHJldXNlX2V4aXN0aW5nJTNBJTIwdHJ1ZSUwQSUyMCUyMCUyMCUyMGVuZHBvaW50X25hbWUlM0ElMjAlMjJteS1leGlzdGluZy1lbmRwb2ludCUyMiUwQSUyMCUyMCUyMCUyMCUyMyUyME90aGVyJTIwcGFyYW1ldGVycyUyMHdpbGwlMjBiZSUyMGlnbm9yZWQlMjB3aGVuJTIwcmV1c2VfZXhpc3RpbmclMjBpcyUyMHRydWU=",highlighted:`<span class="hljs-attr">model_parameters:</span> | |
| <span class="hljs-attr">reuse_existing:</span> <span class="hljs-literal">true</span> | |
| <span class="hljs-attr">endpoint_name:</span> <span class="hljs-string">"my-existing-endpoint"</span> | |
| <span class="hljs-comment"># Other parameters will be ignored when reuse_existing is true</span>`,wrap:!1}}),Q=new f({props:{title:"Cost Management",local:"cost-management",headingTag:"h2"}}),D=new f({props:{title:"Inference Endpoints",local:"inference-endpoints",headingTag:"h3"}}),O=new f({props:{title:"TGI Servers",local:"tgi-servers",headingTag:"h3"}}),ee=new f({props:{title:"Troubleshooting",local:"troubleshooting",headingTag:"h2"}}),te=new f({props:{title:"Common Issues",local:"common-issues",headingTag:"h3"}}),le=new f({props:{title:"Performance Tips",local:"performance-tips",headingTag:"h3"}}),se=new f({props:{title:"Error Handling",local:"error-handling",headingTag:"h3"}}),pe=new Bt({props:{source:"https://github.com/huggingface/lighteval/blob/main/docs/source/use-huggingface-inference-endpoints-or-tgi-as-backend.mdx"}}),{c(){c=d("meta"),de=i(),ge=d("p"),ue=i(),a(y.$$.fragment),Me=i(),$=d("p"),$.textContent=mt,ce=i(),a(h.$$.fragment),ye=i(),T=d("p"),T.textContent=gt,$e=i(),a(w.$$.fragment),he=i(),U=d("p"),U.innerHTML=ft,Te=i(),a(j.$$.fragment),we=i(),a(J.$$.fragment),Ue=i(),a(b.$$.fragment),je=i(),I=d("p"),I.textContent=dt,Je=i(),a(v.$$.fragment),be=i(),a(G.$$.fragment),Ie=i(),a(C.$$.fragment),ve=i(),a(x.$$.fragment),Ge=i(),a(Z.$$.fragment),Ce=i(),W=d("ul"),W.innerHTML=ut,xe=i(),a(E.$$.fragment),Ze=i(),H=d("ul"),H.innerHTML=Mt,We=i(),a(B.$$.fragment),Ee=i(),_=d("ul"),_.innerHTML=ct,He=i(),a(k.$$.fragment),Be=i(),q=d("ul"),q.innerHTML=yt,_e=i(),a(A.$$.fragment),ke=i(),a(F.$$.fragment),qe=i(),S=d("ul"),S.innerHTML=$t,Ae=i(),a(V.$$.fragment),Fe=i(),a(L.$$.fragment),Se=i(),a(R.$$.fragment),Ve=i(),a(z.$$.fragment),Le=i(),a(X.$$.fragment),Re=i(),a(Y.$$.fragment),ze=i(),a(N.$$.fragment),Xe=i(),a(Q.$$.fragment),Ye=i(),a(D.$$.fragment),Ne=i(),P=d("ul"),P.innerHTML=ht,Qe=i(),a(O.$$.fragment),De=i(),K=d("ul"),K.innerHTML=Tt,Pe=i(),a(ee.$$.fragment),Oe=i(),a(te.$$.fragment),Ke=i(),ne=d("ol"),ne.innerHTML=wt,et=i(),a(le.$$.fragment),tt=i(),ie=d("ul"),ie.innerHTML=Ut,nt=i(),a(se.$$.fragment),lt=i(),ae=d("p"),ae.textContent=jt,it=i(),re=d("ul"),re.innerHTML=Jt,st=i(),oe=d("p"),oe.innerHTML=bt,at=i(),a(pe.$$.fragment),rt=i(),fe=d("p"),this.h()},l(e){const t=Et("svelte-u9bgzb",document.head);c=u(t,"META",{name:!0,content:!0}),t.forEach(n),de=s(e),ge=u(e,"P",{}),It(ge).forEach(n),ue=s(e),r(y.$$.fragment,e),Me=s(e),$=u(e,"P",{"data-svelte-h":!0}),M($)!=="svelte-ik3alt"&&($.textContent=mt),ce=s(e),r(h.$$.fragment,e),ye=s(e),T=u(e,"P",{"data-svelte-h":!0}),M(T)!=="svelte-198jur5"&&(T.textContent=gt),$e=s(e),r(w.$$.fragment,e),he=s(e),U=u(e,"P",{"data-svelte-h":!0}),M(U)!=="svelte-13g2grh"&&(U.innerHTML=ft),Te=s(e),r(j.$$.fragment,e),we=s(e),r(J.$$.fragment,e),Ue=s(e),r(b.$$.fragment,e),je=s(e),I=u(e,"P",{"data-svelte-h":!0}),M(I)!=="svelte-s83khs"&&(I.textContent=dt),Je=s(e),r(v.$$.fragment,e),be=s(e),r(G.$$.fragment,e),Ie=s(e),r(C.$$.fragment,e),ve=s(e),r(x.$$.fragment,e),Ge=s(e),r(Z.$$.fragment,e),Ce=s(e),W=u(e,"UL",{"data-svelte-h":!0}),M(W)!=="svelte-catr4m"&&(W.innerHTML=ut),xe=s(e),r(E.$$.fragment,e),Ze=s(e),H=u(e,"UL",{"data-svelte-h":!0}),M(H)!=="svelte-wyhyn3"&&(H.innerHTML=Mt),We=s(e),r(B.$$.fragment,e),Ee=s(e),_=u(e,"UL",{"data-svelte-h":!0}),M(_)!=="svelte-zesftx"&&(_.innerHTML=ct),He=s(e),r(k.$$.fragment,e),Be=s(e),q=u(e,"UL",{"data-svelte-h":!0}),M(q)!=="svelte-chc4s7"&&(q.innerHTML=yt),_e=s(e),r(A.$$.fragment,e),ke=s(e),r(F.$$.fragment,e),qe=s(e),S=u(e,"UL",{"data-svelte-h":!0}),M(S)!=="svelte-x57ldu"&&(S.innerHTML=$t),Ae=s(e),r(V.$$.fragment,e),Fe=s(e),r(L.$$.fragment,e),Se=s(e),r(R.$$.fragment,e),Ve=s(e),r(z.$$.fragment,e),Le=s(e),r(X.$$.fragment,e),Re=s(e),r(Y.$$.fragment,e),ze=s(e),r(N.$$.fragment,e),Xe=s(e),r(Q.$$.fragment,e),Ye=s(e),r(D.$$.fragment,e),Ne=s(e),P=u(e,"UL",{"data-svelte-h":!0}),M(P)!=="svelte-1hz2o9r"&&(P.innerHTML=ht),Qe=s(e),r(O.$$.fragment,e),De=s(e),K=u(e,"UL",{"data-svelte-h":!0}),M(K)!=="svelte-rh1fr3"&&(K.innerHTML=Tt),Pe=s(e),r(ee.$$.fragment,e),Oe=s(e),r(te.$$.fragment,e),Ke=s(e),ne=u(e,"OL",{"data-svelte-h":!0}),M(ne)!=="svelte-1p1agi9"&&(ne.innerHTML=wt),et=s(e),r(le.$$.fragment,e),tt=s(e),ie=u(e,"UL",{"data-svelte-h":!0}),M(ie)!=="svelte-p8wan0"&&(ie.innerHTML=Ut),nt=s(e),r(se.$$.fragment,e),lt=s(e),ae=u(e,"P",{"data-svelte-h":!0}),M(ae)!=="svelte-19pa54u"&&(ae.textContent=jt),it=s(e),re=u(e,"UL",{"data-svelte-h":!0}),M(re)!=="svelte-1rwk4qm"&&(re.innerHTML=Jt),st=s(e),oe=u(e,"P",{"data-svelte-h":!0}),M(oe)!=="svelte-1o55mx1"&&(oe.innerHTML=bt),at=s(e),r(pe.$$.fragment,e),rt=s(e),fe=u(e,"P",{}),It(fe).forEach(n),this.h()},h(){vt(c,"name","hf:doc:metadata"),vt(c,"content",kt)},m(e,t){Ht(document.head,c),l(e,de,t),l(e,ge,t),l(e,ue,t),o(y,e,t),l(e,Me,t),l(e,$,t),l(e,ce,t),o(h,e,t),l(e,ye,t),l(e,T,t),l(e,$e,t),o(w,e,t),l(e,he,t),l(e,U,t),l(e,Te,t),o(j,e,t),l(e,we,t),o(J,e,t),l(e,Ue,t),o(b,e,t),l(e,je,t),l(e,I,t),l(e,Je,t),o(v,e,t),l(e,be,t),o(G,e,t),l(e,Ie,t),o(C,e,t),l(e,ve,t),o(x,e,t),l(e,Ge,t),o(Z,e,t),l(e,Ce,t),l(e,W,t),l(e,xe,t),o(E,e,t),l(e,Ze,t),l(e,H,t),l(e,We,t),o(B,e,t),l(e,Ee,t),l(e,_,t),l(e,He,t),o(k,e,t),l(e,Be,t),l(e,q,t),l(e,_e,t),o(A,e,t),l(e,ke,t),o(F,e,t),l(e,qe,t),l(e,S,t),l(e,Ae,t),o(V,e,t),l(e,Fe,t),o(L,e,t),l(e,Se,t),o(R,e,t),l(e,Ve,t),o(z,e,t),l(e,Le,t),o(X,e,t),l(e,Re,t),o(Y,e,t),l(e,ze,t),o(N,e,t),l(e,Xe,t),o(Q,e,t),l(e,Ye,t),o(D,e,t),l(e,Ne,t),l(e,P,t),l(e,Qe,t),o(O,e,t),l(e,De,t),l(e,K,t),l(e,Pe,t),o(ee,e,t),l(e,Oe,t),o(te,e,t),l(e,Ke,t),l(e,ne,t),l(e,et,t),o(le,e,t),l(e,tt,t),l(e,ie,t),l(e,nt,t),o(se,e,t),l(e,lt,t),l(e,ae,t),l(e,it,t),l(e,re,t),l(e,st,t),l(e,oe,t),l(e,at,t),o(pe,e,t),l(e,rt,t),l(e,fe,t),ot=!0},p:Ct,i(e){ot||(p(y.$$.fragment,e),p(h.$$.fragment,e),p(w.$$.fragment,e),p(j.$$.fragment,e),p(J.$$.fragment,e),p(b.$$.fragment,e),p(v.$$.fragment,e),p(G.$$.fragment,e),p(C.$$.fragment,e),p(x.$$.fragment,e),p(Z.$$.fragment,e),p(E.$$.fragment,e),p(B.$$.fragment,e),p(k.$$.fragment,e),p(A.$$.fragment,e),p(F.$$.fragment,e),p(V.$$.fragment,e),p(L.$$.fragment,e),p(R.$$.fragment,e),p(z.$$.fragment,e),p(X.$$.fragment,e),p(Y.$$.fragment,e),p(N.$$.fragment,e),p(Q.$$.fragment,e),p(D.$$.fragment,e),p(O.$$.fragment,e),p(ee.$$.fragment,e),p(te.$$.fragment,e),p(le.$$.fragment,e),p(se.$$.fragment,e),p(pe.$$.fragment,e),ot=!0)},o(e){m(y.$$.fragment,e),m(h.$$.fragment,e),m(w.$$.fragment,e),m(j.$$.fragment,e),m(J.$$.fragment,e),m(b.$$.fragment,e),m(v.$$.fragment,e),m(G.$$.fragment,e),m(C.$$.fragment,e),m(x.$$.fragment,e),m(Z.$$.fragment,e),m(E.$$.fragment,e),m(B.$$.fragment,e),m(k.$$.fragment,e),m(A.$$.fragment,e),m(F.$$.fragment,e),m(V.$$.fragment,e),m(L.$$.fragment,e),m(R.$$.fragment,e),m(z.$$.fragment,e),m(X.$$.fragment,e),m(Y.$$.fragment,e),m(N.$$.fragment,e),m(Q.$$.fragment,e),m(D.$$.fragment,e),m(O.$$.fragment,e),m(ee.$$.fragment,e),m(te.$$.fragment,e),m(le.$$.fragment,e),m(se.$$.fragment,e),m(pe.$$.fragment,e),ot=!1},d(e){e&&(n(de),n(ge),n(ue),n(Me),n($),n(ce),n(ye),n(T),n($e),n(he),n(U),n(Te),n(we),n(Ue),n(je),n(I),n(Je),n(be),n(Ie),n(ve),n(Ge),n(Ce),n(W),n(xe),n(Ze),n(H),n(We),n(Ee),n(_),n(He),n(Be),n(q),n(_e),n(ke),n(qe),n(S),n(Ae),n(Fe),n(Se),n(Ve),n(Le),n(Re),n(ze),n(Xe),n(Ye),n(Ne),n(P),n(Qe),n(De),n(K),n(Pe),n(Oe),n(Ke),n(ne),n(et),n(tt),n(ie),n(nt),n(lt),n(ae),n(it),n(re),n(st),n(oe),n(at),n(rt),n(fe)),n(c),g(y,e),g(h,e),g(w,e),g(j,e),g(J,e),g(b,e),g(v,e),g(G,e),g(C,e),g(x,e),g(Z,e),g(E,e),g(B,e),g(k,e),g(A,e),g(F,e),g(V,e),g(L,e),g(R,e),g(z,e),g(X,e),g(Y,e),g(N,e),g(Q,e),g(D,e),g(O,e),g(ee,e),g(te,e),g(le,e),g(se,e),g(pe,e)}}}const kt='{"title":"Using Hugging Face Inference Endpoints or TGI as Backend","local":"using-hugging-face-inference-endpoints-or-tgi-as-backend","sections":[{"title":"Hugging Face Inference Endpoints","local":"hugging-face-inference-endpoints","sections":[{"title":"Configuration File Example","local":"configuration-file-example","sections":[],"depth":3}],"depth":2},{"title":"Text Generation Inference (TGI)","local":"text-generation-inference-tgi","sections":[{"title":"Configuration File Example","local":"configuration-file-example","sections":[],"depth":3}],"depth":2},{"title":"Key Parameters","local":"key-parameters","sections":[{"title":"Hugging Face Inference Endpoints","local":"hugging-face-inference-endpoints","sections":[{"title":"Model Configuration","local":"model-configuration","sections":[],"depth":4},{"title":"Infrastructure Settings","local":"infrastructure-settings","sections":[],"depth":4},{"title":"Endpoint Configuration","local":"endpoint-configuration","sections":[],"depth":4},{"title":"Advanced Settings","local":"advanced-settings","sections":[],"depth":4}],"depth":3},{"title":"Text Generation Inference (TGI)","local":"text-generation-inference-tgi","sections":[{"title":"Server Configuration","local":"server-configuration","sections":[],"depth":4}],"depth":3}],"depth":2},{"title":"Usage Examples","local":"usage-examples","sections":[{"title":"Deploying a New Inference Endpoint","local":"deploying-a-new-inference-endpoint","sections":[],"depth":3},{"title":"Using an Existing TGI Server","local":"using-an-existing-tgi-server","sections":[],"depth":3},{"title":"Reusing an Existing Endpoint","local":"reusing-an-existing-endpoint","sections":[],"depth":3}],"depth":2},{"title":"Cost Management","local":"cost-management","sections":[{"title":"Inference Endpoints","local":"inference-endpoints","sections":[],"depth":3},{"title":"TGI Servers","local":"tgi-servers","sections":[],"depth":3}],"depth":2},{"title":"Troubleshooting","local":"troubleshooting","sections":[{"title":"Common Issues","local":"common-issues","sections":[],"depth":3},{"title":"Performance Tips","local":"performance-tips","sections":[],"depth":3},{"title":"Error Handling","local":"error-handling","sections":[],"depth":3}],"depth":2}],"depth":1}';function qt(pt){return xt(()=>{new URLSearchParams(window.location.search).get("fw")}),[]}class Lt extends Zt{constructor(c){super(),Wt(this,c,qt,_t,Gt,{})}}export{Lt as component}; | |
Xet Storage Details
- Size:
- 23.7 kB
- Xet hash:
- 8eb1fd5090652ee054f90b1f604dcbdb5b874061420ad1c556b27403a77b5e52
·
Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.