Buckets:
| import{s as lt,n as it,o as st}from"../chunks/scheduler.389d799c.js";import{S as rt,i as ot,g as s,s as l,r as f,A as ut,h as r,f as n,c as i,j as nt,u as p,x as o,k as at,y as ft,a,v as c,d as h,t as m,w as g}from"../chunks/index.8f81d18f.js";import{C as pt}from"../chunks/CodeBlock.c0898180.js";import{H as z,E as ct}from"../chunks/getInferenceSnippets.9d198f97.js";function ht(Ie){let u,K,B,Q,d,O,b,je="Below you can find a listing of all the Deep Learning Containers (DLCs) available on AWS.",ee,T,Ze="For each supported combination of use-case (training, inference), accelerator type (CPU, GPU, Neuron), and framework (PyTorch, TGI, TEI) containers are created.",te,y,ne,x,Ae="Pytorch Training DLC: For training, our DLCs are available for PyTorch via Transformers. They include support for training on GPUs and AWS AI chips with libraries such as TRL, Sentence Transformers, or Diffusers.",ae,C,Ge='You can also keep track of the latest Pytorch Training DLC releases <a href="https://github.com/aws/deep-learning-containers/releases?q=huggingface-training+AND+NOT+neuronx&expanded=true" rel="nofollow">here</a>.',le,$,Se="<thead><tr><th>Container URI</th> <th>Accelerator</th></tr></thead> <tbody><tr><td>763104351884.dkr.ecr.us-east-1.amazonaws.com/huggingface-pytorch-training:2.5.1-transformers4.49.0-gpu-py311-cu124-ubuntu22.04</td> <td>GPU</td></tr> <tr><td>763104351884.dkr.ecr.us-east-1.amazonaws.com/huggingface-pytorch-training-neuronx:2.1.2-transformers4.48.1-neuronx-py310-sdk2.20.0-ubuntu20.04</td> <td>Neuron</td></tr></tbody>",ie,v,se,w,re,L,Ee="For inference, we have a general-purpose PyTorch inference DLC, for serving models trained with any of those frameworks mentioned before on CPU, GPU, and AWS AI chips.",oe,_,We='You can also keep track of the latest Pytorch Inference DLC releases <a href="https://github.com/aws/deep-learning-containers/releases?q=huggingface-inference+AND+NOT+tgi+AND+NOT+neuronx&expanded=true" rel="nofollow">here</a>.',ue,M,De="<thead><tr><th>Container URI</th> <th>Accelerator</th></tr></thead> <tbody><tr><td>763104351884.dkr.ecr.us-east-1.amazonaws.com/huggingface-pytorch-inference:2.6.0-transformers4.49.0-cpu-py312-ubuntu22.04-</td> <td>CPU</td></tr> <tr><td>763104351884.dkr.ecr.us-east-1.amazonaws.com/huggingface-pytorch-inference:2.6.0-transformers4.49.0-gpu-py312-cu124-ubuntu22.04</td> <td>GPU</td></tr> <tr><td>763104351884.dkr.ecr.us-east-1.amazonaws.com/huggingface-pytorch-inference-neuronx:2.1.2-transformers4.43.2-neuronx-py310-sdk2.20.0-ubuntu20.04</td> <td>Neuron</td></tr></tbody>",fe,P,pe,U,Ve="There is also the LLM Text Generation Inference (TGI) DLC for high-performance text generation of LLMs on GPU and AWS AI chips.",ce,k,Ne='You can also keep track of the latest LLM TGI DLC releases <a href="https://github.com/aws/deep-learning-containers/releases?q=tgi+AND+gpu&expanded=true" rel="nofollow">here</a>.',he,H,Ye="<thead><tr><th>Container URI</th> <th>Accelerator</th></tr></thead> <tbody><tr><td>763104351884.dkr.ecr.us-east-1.amazonaws.com/huggingface-pytorch-tgi-inference:2.6.0-tgi3.2.3-gpu-py311-cu124-ubuntu22.04</td> <td>GPU</td></tr> <tr><td>763104351884.dkr.ecr.us-east-1.amazonaws.com/huggingface-pytorch-tgi-inference:2.1.2-optimum0.0.28-neuronx-py310-ubuntu22.04</td> <td>Neuron</td></tr></tbody>",me,I,ge,j,Re="Finally, there is a Text Embeddings Inference (TEI) DLC for high-performance serving of embedding models on CPU and GPU.",de,Z,Je="<thead><tr><th>Container URI</th> <th>Accelerator</th></tr></thead> <tbody><tr><td>683313688378.dkr.ecr.us-east-1.amazonaws.com/tei-cpu:2.0.1-tei1.7.0-cpu-py310-ubuntu22.04</td> <td>CPU</td></tr> <tr><td>683313688378.dkr.ecr.us-east-1.amazonaws.com/tei:2.0.1-tei1.7.0-gpu-py310-cu122-ubuntu22.04</td> <td>GPU</td></tr></tbody>",be,A,Te,G,Xe="<strong>How to choose the right inference container for my use case?</strong>",ye,S,qe='<img src="https://huggingface.co/datasets/huggingface/documentation-images/resolve/main/sagemaker/inference-dlc-decision-tree.png" alt="inference-dlc-decision-tree"/>',xe,E,ze='<em>Note:</em> See <a href="https://huggingface.co/docs/sagemaker/main/en/reference/inference-toolkit" rel="nofollow">here</a> for the list of supported task in the inference toolkit.',Ce,W,Be='<em>Note:</em> Browse through the Hub to see if you model is tagged <a href="https://huggingface.co/models?other=text-generation-inference" rel="nofollow">“text-generation-inference”</a> or <a href="https://huggingface.co/models?other=text-embeddings-inference" rel="nofollow">“text-embeddings-inference”</a>',$e,D,Fe="<strong>How to find the URI of my container?</strong>",ve,V,Ke=`The URI is built with an AWS account ID and an AWS region. Those two values need to be replaced depending on your use case. | |
| Let’s say you want to use the training DLC for GPUs in`,we,N,Qe='<li><code>dlc-aws-account-id</code>: The AWS account ID of the account that owns the ECR repository. You can find them in the <a href="https://github.com/aws/sagemaker-python-sdk/blob/e0b9d38e1e3b48647a02af23c4be54980e53dc61/src/sagemaker/image_uri_config/huggingface.json#L21" rel="nofollow">here</a></li> <li><code>region</code>: The AWS region where you want to use it.</li>',Le,Y,Oe="<strong>How to find the URI of my container but simpler?</strong>",_e,R,et="The Python SagemMaker SDK util functions are not always up to date but it is much simpler than reconstructing the image URI yourself.",Me,J,Pe,X,tt="For Pytorch Training and Pytorch Inference DLCs, there is no such utility.",Ue,q,ke,F,He;return d=new z({props:{title:"Available DLCs on AWS",local:"available-dlcs-on-aws",headingTag:"h1"}}),y=new z({props:{title:"Training",local:"training",headingTag:"h2"}}),v=new z({props:{title:"Inference",local:"inference",headingTag:"h2"}}),w=new z({props:{title:"Pytorch Inference DLC",local:"pytorch-inference-dlc",headingTag:"h3"}}),P=new z({props:{title:"LLM TGI",local:"llm-tgi",headingTag:"h3"}}),I=new z({props:{title:"Text Embedding Inference",local:"text-embedding-inference",headingTag:"h3"}}),A=new z({props:{title:"FAQ",local:"faq",headingTag:"h2"}}),J=new pt({props:{code:"ZnJvbSUyMHNhZ2VtYWtlci5odWdnaW5nZmFjZSUyMGltcG9ydCUyMEh1Z2dpbmdGYWNlTW9kZWwlMkMlMjBnZXRfaHVnZ2luZ2ZhY2VfbGxtX2ltYWdlX3VyaSUwQSUwQXByaW50KGYlMjJUR0klMjBHUFUlM0ElMjAlN0JnZXRfaHVnZ2luZ2ZhY2VfbGxtX2ltYWdlX3VyaSgnaHVnZ2luZ2ZhY2UnKSU3RCUyMiklMEFwcmludChmJTIyVEVJJTIwR1BVJTNBJTIwJTdCZ2V0X2h1Z2dpbmdmYWNlX2xsbV9pbWFnZV91cmkoJ2h1Z2dpbmdmYWNlLXRlaScpJTdEJTIyKSUwQXByaW50KGYlMjJURUklMjBDUFUlM0ElMjAlN0JnZXRfaHVnZ2luZ2ZhY2VfbGxtX2ltYWdlX3VyaSgnaHVnZ2luZ2ZhY2UtdGVpLWNwdScpJTdEJTIyKSUwQXByaW50KGYlMjJUR0klMjBOZXVyb24lM0ElMjAlN0JnZXRfaHVnZ2luZ2ZhY2VfbGxtX2ltYWdlX3VyaSgnaHVnZ2luZ2ZhY2UtbmV1cm9ueCcpJTdEJTIyKQ==",highlighted:`<span class="hljs-keyword">from</span> sagemaker.huggingface <span class="hljs-keyword">import</span> HuggingFaceModel, get_huggingface_llm_image_uri | |
| <span class="hljs-built_in">print</span>(<span class="hljs-string">f"TGI GPU: <span class="hljs-subst">{get_huggingface_llm_image_uri(<span class="hljs-string">'huggingface'</span>)}</span>"</span>) | |
| <span class="hljs-built_in">print</span>(<span class="hljs-string">f"TEI GPU: <span class="hljs-subst">{get_huggingface_llm_image_uri(<span class="hljs-string">'huggingface-tei'</span>)}</span>"</span>) | |
| <span class="hljs-built_in">print</span>(<span class="hljs-string">f"TEI CPU: <span class="hljs-subst">{get_huggingface_llm_image_uri(<span class="hljs-string">'huggingface-tei-cpu'</span>)}</span>"</span>) | |
| <span class="hljs-built_in">print</span>(<span class="hljs-string">f"TGI Neuron: <span class="hljs-subst">{get_huggingface_llm_image_uri(<span class="hljs-string">'huggingface-neuronx'</span>)}</span>"</span>)`,wrap:!1}}),q=new ct({props:{source:"https://github.com/huggingface/hub-docs/blob/main/docs/sagemaker/source/dlcs/available.md"}}),{c(){u=s("meta"),K=l(),B=s("p"),Q=l(),f(d.$$.fragment),O=l(),b=s("p"),b.textContent=je,ee=l(),T=s("p"),T.textContent=Ze,te=l(),f(y.$$.fragment),ne=l(),x=s("p"),x.textContent=Ae,ae=l(),C=s("p"),C.innerHTML=Ge,le=l(),$=s("table"),$.innerHTML=Se,ie=l(),f(v.$$.fragment),se=l(),f(w.$$.fragment),re=l(),L=s("p"),L.textContent=Ee,oe=l(),_=s("p"),_.innerHTML=We,ue=l(),M=s("table"),M.innerHTML=De,fe=l(),f(P.$$.fragment),pe=l(),U=s("p"),U.textContent=Ve,ce=l(),k=s("p"),k.innerHTML=Ne,he=l(),H=s("table"),H.innerHTML=Ye,me=l(),f(I.$$.fragment),ge=l(),j=s("p"),j.textContent=Re,de=l(),Z=s("table"),Z.innerHTML=Je,be=l(),f(A.$$.fragment),Te=l(),G=s("p"),G.innerHTML=Xe,ye=l(),S=s("p"),S.innerHTML=qe,xe=l(),E=s("p"),E.innerHTML=ze,Ce=l(),W=s("p"),W.innerHTML=Be,$e=l(),D=s("p"),D.innerHTML=Fe,ve=l(),V=s("p"),V.textContent=Ke,we=l(),N=s("ul"),N.innerHTML=Qe,Le=l(),Y=s("p"),Y.innerHTML=Oe,_e=l(),R=s("p"),R.textContent=et,Me=l(),f(J.$$.fragment),Pe=l(),X=s("p"),X.textContent=tt,Ue=l(),f(q.$$.fragment),ke=l(),F=s("p"),this.h()},l(e){const t=ut("svelte-u9bgzb",document.head);u=r(t,"META",{name:!0,content:!0}),t.forEach(n),K=i(e),B=r(e,"P",{}),nt(B).forEach(n),Q=i(e),p(d.$$.fragment,e),O=i(e),b=r(e,"P",{"data-svelte-h":!0}),o(b)!=="svelte-1eptnyh"&&(b.textContent=je),ee=i(e),T=r(e,"P",{"data-svelte-h":!0}),o(T)!=="svelte-nsjrcm"&&(T.textContent=Ze),te=i(e),p(y.$$.fragment,e),ne=i(e),x=r(e,"P",{"data-svelte-h":!0}),o(x)!=="svelte-dmm2ao"&&(x.textContent=Ae),ae=i(e),C=r(e,"P",{"data-svelte-h":!0}),o(C)!=="svelte-4leueb"&&(C.innerHTML=Ge),le=i(e),$=r(e,"TABLE",{"data-svelte-h":!0}),o($)!=="svelte-zzvgg0"&&($.innerHTML=Se),ie=i(e),p(v.$$.fragment,e),se=i(e),p(w.$$.fragment,e),re=i(e),L=r(e,"P",{"data-svelte-h":!0}),o(L)!=="svelte-i6peck"&&(L.textContent=Ee),oe=i(e),_=r(e,"P",{"data-svelte-h":!0}),o(_)!=="svelte-5mbpze"&&(_.innerHTML=We),ue=i(e),M=r(e,"TABLE",{"data-svelte-h":!0}),o(M)!=="svelte-1jvau90"&&(M.innerHTML=De),fe=i(e),p(P.$$.fragment,e),pe=i(e),U=r(e,"P",{"data-svelte-h":!0}),o(U)!=="svelte-z6dexv"&&(U.textContent=Ve),ce=i(e),k=r(e,"P",{"data-svelte-h":!0}),o(k)!=="svelte-4njdnv"&&(k.innerHTML=Ne),he=i(e),H=r(e,"TABLE",{"data-svelte-h":!0}),o(H)!=="svelte-9qecrq"&&(H.innerHTML=Ye),me=i(e),p(I.$$.fragment,e),ge=i(e),j=r(e,"P",{"data-svelte-h":!0}),o(j)!=="svelte-db04rk"&&(j.textContent=Re),de=i(e),Z=r(e,"TABLE",{"data-svelte-h":!0}),o(Z)!=="svelte-nev2u2"&&(Z.innerHTML=Je),be=i(e),p(A.$$.fragment,e),Te=i(e),G=r(e,"P",{"data-svelte-h":!0}),o(G)!=="svelte-qjgyy3"&&(G.innerHTML=Xe),ye=i(e),S=r(e,"P",{"data-svelte-h":!0}),o(S)!=="svelte-86ji6y"&&(S.innerHTML=qe),xe=i(e),E=r(e,"P",{"data-svelte-h":!0}),o(E)!=="svelte-1w4dc1f"&&(E.innerHTML=ze),Ce=i(e),W=r(e,"P",{"data-svelte-h":!0}),o(W)!=="svelte-8p8z10"&&(W.innerHTML=Be),$e=i(e),D=r(e,"P",{"data-svelte-h":!0}),o(D)!=="svelte-1he7r2b"&&(D.innerHTML=Fe),ve=i(e),V=r(e,"P",{"data-svelte-h":!0}),o(V)!=="svelte-1rzekti"&&(V.textContent=Ke),we=i(e),N=r(e,"UL",{"data-svelte-h":!0}),o(N)!=="svelte-tq759t"&&(N.innerHTML=Qe),Le=i(e),Y=r(e,"P",{"data-svelte-h":!0}),o(Y)!=="svelte-1kgkd98"&&(Y.innerHTML=Oe),_e=i(e),R=r(e,"P",{"data-svelte-h":!0}),o(R)!=="svelte-l6c2ju"&&(R.textContent=et),Me=i(e),p(J.$$.fragment,e),Pe=i(e),X=r(e,"P",{"data-svelte-h":!0}),o(X)!=="svelte-1om219l"&&(X.textContent=tt),Ue=i(e),p(q.$$.fragment,e),ke=i(e),F=r(e,"P",{}),nt(F).forEach(n),this.h()},h(){at(u,"name","hf:doc:metadata"),at(u,"content",mt)},m(e,t){ft(document.head,u),a(e,K,t),a(e,B,t),a(e,Q,t),c(d,e,t),a(e,O,t),a(e,b,t),a(e,ee,t),a(e,T,t),a(e,te,t),c(y,e,t),a(e,ne,t),a(e,x,t),a(e,ae,t),a(e,C,t),a(e,le,t),a(e,$,t),a(e,ie,t),c(v,e,t),a(e,se,t),c(w,e,t),a(e,re,t),a(e,L,t),a(e,oe,t),a(e,_,t),a(e,ue,t),a(e,M,t),a(e,fe,t),c(P,e,t),a(e,pe,t),a(e,U,t),a(e,ce,t),a(e,k,t),a(e,he,t),a(e,H,t),a(e,me,t),c(I,e,t),a(e,ge,t),a(e,j,t),a(e,de,t),a(e,Z,t),a(e,be,t),c(A,e,t),a(e,Te,t),a(e,G,t),a(e,ye,t),a(e,S,t),a(e,xe,t),a(e,E,t),a(e,Ce,t),a(e,W,t),a(e,$e,t),a(e,D,t),a(e,ve,t),a(e,V,t),a(e,we,t),a(e,N,t),a(e,Le,t),a(e,Y,t),a(e,_e,t),a(e,R,t),a(e,Me,t),c(J,e,t),a(e,Pe,t),a(e,X,t),a(e,Ue,t),c(q,e,t),a(e,ke,t),a(e,F,t),He=!0},p:it,i(e){He||(h(d.$$.fragment,e),h(y.$$.fragment,e),h(v.$$.fragment,e),h(w.$$.fragment,e),h(P.$$.fragment,e),h(I.$$.fragment,e),h(A.$$.fragment,e),h(J.$$.fragment,e),h(q.$$.fragment,e),He=!0)},o(e){m(d.$$.fragment,e),m(y.$$.fragment,e),m(v.$$.fragment,e),m(w.$$.fragment,e),m(P.$$.fragment,e),m(I.$$.fragment,e),m(A.$$.fragment,e),m(J.$$.fragment,e),m(q.$$.fragment,e),He=!1},d(e){e&&(n(K),n(B),n(Q),n(O),n(b),n(ee),n(T),n(te),n(ne),n(x),n(ae),n(C),n(le),n($),n(ie),n(se),n(re),n(L),n(oe),n(_),n(ue),n(M),n(fe),n(pe),n(U),n(ce),n(k),n(he),n(H),n(me),n(ge),n(j),n(de),n(Z),n(be),n(Te),n(G),n(ye),n(S),n(xe),n(E),n(Ce),n(W),n($e),n(D),n(ve),n(V),n(we),n(N),n(Le),n(Y),n(_e),n(R),n(Me),n(Pe),n(X),n(Ue),n(ke),n(F)),n(u),g(d,e),g(y,e),g(v,e),g(w,e),g(P,e),g(I,e),g(A,e),g(J,e),g(q,e)}}}const mt='{"title":"Available DLCs on AWS","local":"available-dlcs-on-aws","sections":[{"title":"Training","local":"training","sections":[],"depth":2},{"title":"Inference","local":"inference","sections":[{"title":"Pytorch Inference DLC","local":"pytorch-inference-dlc","sections":[],"depth":3},{"title":"LLM TGI","local":"llm-tgi","sections":[],"depth":3},{"title":"Text Embedding Inference","local":"text-embedding-inference","sections":[],"depth":3}],"depth":2},{"title":"FAQ","local":"faq","sections":[],"depth":2}],"depth":1}';function gt(Ie){return st(()=>{new URLSearchParams(window.location.search).get("fw")}),[]}class xt extends rt{constructor(u){super(),ot(this,u,gt,ht,lt,{})}}export{xt as component}; | |
Xet Storage Details
- Size:
- 13.5 kB
- Xet hash:
- 4c512a17691a04e2a1d53cdc818866b3c840af8ef6dcb4d3e39b5c969fc04214
·
Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.