Buckets:

rtrm's picture
download
raw
9.64 kB
import{s as Ge,n as De,o as Se}from"../chunks/scheduler.389d799c.js";import{S as ze,i as We,g as l,s as r,r as c,A as Re,h as o,f as n,c as i,j as Ue,u,x as s,k as Ee,y as qe,a,v as m,d,t as p,w as h}from"../chunks/index.8f81d18f.js";import{H as R,E as Be}from"../chunks/index.d407e2cc.js";function Fe(ge){let f,F,q,N,g,j,$,$e="Below you can find a listing of all the Deep Learning Containers (DLCs) available on AWS.",Q,b,be="For each supported combination of use-case (training, inference), accelerator type (CPU, GPU, Neuron), and framework (PyTorch, TGI, TEI) containers are created.",O,T,Y,y,Te="<strong>How to choose the right container for my use case?</strong>",J,x,ye='<img src="https://huggingface.co/datasets/huggingface/documentation-images/resolve/main/sagemaker/dlc-decision-tree.png" alt="dlc-decision-tree"/>',K,v,xe='<em>Note:</em> See <a href="(https://huggingface.co/docs/sagemaker/main/en/reference/inference-toolkit)">here</a> for the list of supported task in the inference toolkit.',V,C,ve='<em>Note:</em> Browse through the Hub to see if you model is tagged <a href="https://huggingface.co/models?other=text-generation-inference" rel="nofollow">“text-generation-inference”</a> or <a href="https://huggingface.co/models?other=text-embeddings-inference" rel="nofollow">“text-embeddings-inference”</a>',X,w,Ce=`<strong>How to find the URI of my container?</strong>
The URI is built with an AWS account ID and an AWS region. Those two values need to be replaced depending on your use case.
Let’s say you want to use the training DLC for GPUs in`,Z,L,we='<li><code>dlc-aws-account-id</code>: The AWS account ID of the account that owns the ECR repository. You can find them in the <a href="https://github.com/aws/sagemaker-python-sdk/blob/e0b9d38e1e3b48647a02af23c4be54980e53dc61/src/sagemaker/image_uri_config/huggingface.json#L21" rel="nofollow">here</a></li> <li><code>region</code>: The AWS region where you want to use it.</li>',ee,P,te,_,Le="Pytorch Training DLC: For training, our DLCs are available for PyTorch via :hugging_face: Transformers. They include support for training on GPUs and AWS AI chips with libraries such as :hugging_face: TRL, Sentence Transformers, or :firecracker: Diffusers.",ne,A,Pe="<thead><tr><th>Container URI</th> <th>Accelerator</th></tr></thead> <tbody><tr><td>763104351884.dkr.ecr.us-east-1.amazonaws.com/huggingface-pytorch-training:2.5.1-transformers4.49.0-gpu-py311-cu124-ubuntu22.04</td> <td>GPU</td></tr> <tr><td>763104351884.dkr.ecr.us-east-1.amazonaws.com/huggingface-pytorch-training-neuronx:2.1.2-transformers4.48.1-neuronx-py310-sdk2.20.0-ubuntu20.04</td> <td>Neuron</td></tr></tbody>",ae,k,re,H,ie,I,_e="For inference, we have a general-purpose PyTorch inference DLC, for serving models trained with any of those frameworks mentioned before on CPU, GPU, and AWS AI chips.",le,M,Ae="<thead><tr><th>Container URI</th> <th>Accelerator</th></tr></thead> <tbody><tr><td>763104351884.dkr.ecr.us-east-1.amazonaws.com/huggingface-pytorch-inference:2.6.0-transformers4.49.0-cpu-py312-ubuntu22.04-</td> <td>CPU</td></tr> <tr><td>763104351884.dkr.ecr.us-east-1.amazonaws.com/huggingface-pytorch-inference:2.6.0-transformers4.49.0-gpu-py312-cu124-ubuntu22.04</td> <td>GPU</td></tr> <tr><td>763104351884.dkr.ecr.us-east-1.amazonaws.com/huggingface-pytorch-inference-neuronx:2.1.2-transformers4.43.2-neuronx-py310-sdk2.20.0-ubuntu20.04</td> <td>Neuron</td></tr></tbody>",oe,U,se,E,ke="There is also the Text Generation Inference (TGI) DLC for high-performance text generation of LLMs on GPU and AWS AI chips.",fe,G,He="<thead><tr><th>Container URI</th> <th>Accelerator</th></tr></thead> <tbody><tr><td>763104351884.dkr.ecr.us-east-1.amazonaws.com/huggingface-pytorch-tgi-inference:2.6.0-tgi3.2.3-gpu-py311-cu124-ubuntu22.04</td> <td>GPU</td></tr> <tr><td>763104351884.dkr.ecr.us-east-1.amazonaws.com/huggingface-pytorch-tgi-inference:2.1.2-optimum0.0.28-neuronx-py310-ubuntu22.04</td> <td>Neuron</td></tr></tbody>",ce,D,ue,S,Ie="Finally, there is a Text Embeddings Inference (TEI) DLC for high-performance serving of embedding models on CPU and GPU.",me,z,Me="<thead><tr><th>Container URI</th> <th>Accelerator</th></tr></thead> <tbody><tr><td>683313688378.dkr.ecr.us-east-1.amazonaws.com/tei-cpu:2.0.1-tei1.2.3-cpu-py310-ubuntu22.04</td> <td>CPU</td></tr> <tr><td>683313688378.dkr.ecr.us-east-1.amazonaws.com/tei:2.0.1-tei1.4.0-gpu-py310-cu122-ubuntu22.04</td> <td>GPU</td></tr></tbody>",de,W,pe,B,he;return g=new R({props:{title:"Available DLCs on AWS",local:"available-dlcs-on-aws",headingTag:"h1"}}),T=new R({props:{title:"FAQ",local:"faq",headingTag:"h2"}}),P=new R({props:{title:"Training",local:"training",headingTag:"h2"}}),k=new R({props:{title:"Inference",local:"inference",headingTag:"h2"}}),H=new R({props:{title:"Pytorch Inference DLC",local:"pytorch-inference-dlc",headingTag:"h3"}}),U=new R({props:{title:"Text Generation Inference",local:"text-generation-inference",headingTag:"h3"}}),D=new R({props:{title:"Text Embedding Inference",local:"text-embedding-inference",headingTag:"h3"}}),W=new Be({props:{source:"https://github.com/huggingface/hub-docs/blob/main/docs/sagemaker/source/dlcs/available.md"}}),{c(){f=l("meta"),F=r(),q=l("p"),N=r(),c(g.$$.fragment),j=r(),$=l("p"),$.textContent=$e,Q=r(),b=l("p"),b.textContent=be,O=r(),c(T.$$.fragment),Y=r(),y=l("p"),y.innerHTML=Te,J=r(),x=l("p"),x.innerHTML=ye,K=r(),v=l("p"),v.innerHTML=xe,V=r(),C=l("p"),C.innerHTML=ve,X=r(),w=l("p"),w.innerHTML=Ce,Z=r(),L=l("ul"),L.innerHTML=we,ee=r(),c(P.$$.fragment),te=r(),_=l("p"),_.textContent=Le,ne=r(),A=l("table"),A.innerHTML=Pe,ae=r(),c(k.$$.fragment),re=r(),c(H.$$.fragment),ie=r(),I=l("p"),I.textContent=_e,le=r(),M=l("table"),M.innerHTML=Ae,oe=r(),c(U.$$.fragment),se=r(),E=l("p"),E.textContent=ke,fe=r(),G=l("table"),G.innerHTML=He,ce=r(),c(D.$$.fragment),ue=r(),S=l("p"),S.textContent=Ie,me=r(),z=l("table"),z.innerHTML=Me,de=r(),c(W.$$.fragment),pe=r(),B=l("p"),this.h()},l(e){const t=Re("svelte-u9bgzb",document.head);f=o(t,"META",{name:!0,content:!0}),t.forEach(n),F=i(e),q=o(e,"P",{}),Ue(q).forEach(n),N=i(e),u(g.$$.fragment,e),j=i(e),$=o(e,"P",{"data-svelte-h":!0}),s($)!=="svelte-1eptnyh"&&($.textContent=$e),Q=i(e),b=o(e,"P",{"data-svelte-h":!0}),s(b)!=="svelte-nsjrcm"&&(b.textContent=be),O=i(e),u(T.$$.fragment,e),Y=i(e),y=o(e,"P",{"data-svelte-h":!0}),s(y)!=="svelte-1w3mxbc"&&(y.innerHTML=Te),J=i(e),x=o(e,"P",{"data-svelte-h":!0}),s(x)!=="svelte-1ag007e"&&(x.innerHTML=ye),K=i(e),v=o(e,"P",{"data-svelte-h":!0}),s(v)!=="svelte-dqwr3y"&&(v.innerHTML=xe),V=i(e),C=o(e,"P",{"data-svelte-h":!0}),s(C)!=="svelte-8p8z10"&&(C.innerHTML=ve),X=i(e),w=o(e,"P",{"data-svelte-h":!0}),s(w)!=="svelte-1ljwo93"&&(w.innerHTML=Ce),Z=i(e),L=o(e,"UL",{"data-svelte-h":!0}),s(L)!=="svelte-tq759t"&&(L.innerHTML=we),ee=i(e),u(P.$$.fragment,e),te=i(e),_=o(e,"P",{"data-svelte-h":!0}),s(_)!=="svelte-1yazlon"&&(_.textContent=Le),ne=i(e),A=o(e,"TABLE",{"data-svelte-h":!0}),s(A)!=="svelte-zzvgg0"&&(A.innerHTML=Pe),ae=i(e),u(k.$$.fragment,e),re=i(e),u(H.$$.fragment,e),ie=i(e),I=o(e,"P",{"data-svelte-h":!0}),s(I)!=="svelte-i6peck"&&(I.textContent=_e),le=i(e),M=o(e,"TABLE",{"data-svelte-h":!0}),s(M)!=="svelte-1jvau90"&&(M.innerHTML=Ae),oe=i(e),u(U.$$.fragment,e),se=i(e),E=o(e,"P",{"data-svelte-h":!0}),s(E)!=="svelte-1i6swpw"&&(E.textContent=ke),fe=i(e),G=o(e,"TABLE",{"data-svelte-h":!0}),s(G)!=="svelte-9qecrq"&&(G.innerHTML=He),ce=i(e),u(D.$$.fragment,e),ue=i(e),S=o(e,"P",{"data-svelte-h":!0}),s(S)!=="svelte-db04rk"&&(S.textContent=Ie),me=i(e),z=o(e,"TABLE",{"data-svelte-h":!0}),s(z)!=="svelte-1fbtly3"&&(z.innerHTML=Me),de=i(e),u(W.$$.fragment,e),pe=i(e),B=o(e,"P",{}),Ue(B).forEach(n),this.h()},h(){Ee(f,"name","hf:doc:metadata"),Ee(f,"content",Ne)},m(e,t){qe(document.head,f),a(e,F,t),a(e,q,t),a(e,N,t),m(g,e,t),a(e,j,t),a(e,$,t),a(e,Q,t),a(e,b,t),a(e,O,t),m(T,e,t),a(e,Y,t),a(e,y,t),a(e,J,t),a(e,x,t),a(e,K,t),a(e,v,t),a(e,V,t),a(e,C,t),a(e,X,t),a(e,w,t),a(e,Z,t),a(e,L,t),a(e,ee,t),m(P,e,t),a(e,te,t),a(e,_,t),a(e,ne,t),a(e,A,t),a(e,ae,t),m(k,e,t),a(e,re,t),m(H,e,t),a(e,ie,t),a(e,I,t),a(e,le,t),a(e,M,t),a(e,oe,t),m(U,e,t),a(e,se,t),a(e,E,t),a(e,fe,t),a(e,G,t),a(e,ce,t),m(D,e,t),a(e,ue,t),a(e,S,t),a(e,me,t),a(e,z,t),a(e,de,t),m(W,e,t),a(e,pe,t),a(e,B,t),he=!0},p:De,i(e){he||(d(g.$$.fragment,e),d(T.$$.fragment,e),d(P.$$.fragment,e),d(k.$$.fragment,e),d(H.$$.fragment,e),d(U.$$.fragment,e),d(D.$$.fragment,e),d(W.$$.fragment,e),he=!0)},o(e){p(g.$$.fragment,e),p(T.$$.fragment,e),p(P.$$.fragment,e),p(k.$$.fragment,e),p(H.$$.fragment,e),p(U.$$.fragment,e),p(D.$$.fragment,e),p(W.$$.fragment,e),he=!1},d(e){e&&(n(F),n(q),n(N),n(j),n($),n(Q),n(b),n(O),n(Y),n(y),n(J),n(x),n(K),n(v),n(V),n(C),n(X),n(w),n(Z),n(L),n(ee),n(te),n(_),n(ne),n(A),n(ae),n(re),n(ie),n(I),n(le),n(M),n(oe),n(se),n(E),n(fe),n(G),n(ce),n(ue),n(S),n(me),n(z),n(de),n(pe),n(B)),n(f),h(g,e),h(T,e),h(P,e),h(k,e),h(H,e),h(U,e),h(D,e),h(W,e)}}}const Ne='{"title":"Available DLCs on AWS","local":"available-dlcs-on-aws","sections":[{"title":"FAQ","local":"faq","sections":[],"depth":2},{"title":"Training","local":"training","sections":[],"depth":2},{"title":"Inference","local":"inference","sections":[{"title":"Pytorch Inference DLC","local":"pytorch-inference-dlc","sections":[],"depth":3},{"title":"Text Generation Inference","local":"text-generation-inference","sections":[],"depth":3},{"title":"Text Embedding Inference","local":"text-embedding-inference","sections":[],"depth":3}],"depth":2}],"depth":1}';function je(ge){return Se(()=>{new URLSearchParams(window.location.search).get("fw")}),[]}class Je extends ze{constructor(f){super(),We(this,f,je,Fe,Ge,{})}}export{Je as component};

Xet Storage Details

Size:
9.64 kB
·
Xet hash:
8712ef50b77822dc5f68b6b19dc2cf710240b0ce9e998ba8230633e07f6171d6

Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.