Buckets:

rtrm's picture
download
raw
7.58 kB
/*
 * Minified page module for the "Multi-backend support (non-CUDA backends)"
 * documentation page. The `data-svelte-h` attributes and `svelte-...` hash
 * checks indicate this is compiled Svelte output; it is presumably generated
 * from docs/source/non_cuda_backends.mdx (the URL passed to `At` below) and
 * should be regenerated rather than edited by hand -- confirm with the build.
 *
 * NOTE(review): in this copy the physical line breaks fall inside a string
 * literal (`pt`) and inside the identifier `fragment`. These look like
 * wrapping artifacts of the capture; verify against the built file.
 *
 * Definitions, in order of appearance:
 *
 *   Ht(R)  Fragment for the default slot of the `Lt` component (imported from
 *          the Tip chunk). It manages a single <p> whose innerHTML is the
 *          Apple Silicon notice. `c` creates the node, `l` claims an existing
 *          node and only rewrites innerHTML when `d(i)` is not
 *          "svelte-ztwrs6", `m` inserts it, `d` detaches it.
 *
 *   Gt(R)  Main page fragment. Declares one local per node/component plus the
 *          static text/HTML strings, then returns the lifecycle object:
 *            c  creates every element and child component fragment in
 *               document order, then calls h();
 *            l  claims the same nodes in the same order from existing DOM,
 *               replacing text/HTML only when the `svelte-...` hash returned
 *               by `d(node)` differs, then calls h();
 *            h  sets the <meta> attributes name="hf:doc:metadata" and
 *               content=Dt;
 *            m  appends the <meta> to document.head and inserts/mounts the
 *               remaining nodes and components at the target/anchor;
 *            p  when bit 2 of the dirty mask is set, forwards `$$scope` to
 *               the `Lt` instance through `$set`;
 *            i/o  run the intro/outro helpers (`E`/`F`) on each child
 *               component fragment, guarded by the `it` flag;
 *            d  detaches the nodes and destroys the child components.
 *          `N` instances receive title/local/headingTag props (presumably
 *          section headings -- confirm); `At` receives the source URL.
 *
 *   Dt     JSON string with the page title and nested section outline, used
 *          as the content of the hf:doc:metadata <meta> tag.
 *
 *   Et(R)  Instance function. Passes a callback to `Tt` (imported from the
 *          scheduler chunk; presumably Svelte's onMount -- confirm) that
 *          reads the "fw" query parameter and discards the value. Returns an
 *          empty context array.
 *
 *   Nt     Component class extending `gt`; the constructor wires Et, Gt and
 *          Ct together through `kt`. Exported under the name `component`.
 */
import{s as Ct,o as Tt,n as _t}from"../chunks/scheduler.852ec091.js";import{S as gt,i as kt,g as o,s as a,r as H,A as Pt,h as r,f as n,c as s,j as vt,u as G,x as d,k as wt,y as Mt,a as l,v as D,d as E,t as F,w as I}from"../chunks/index.28275fd3.js";import{T as Lt}from"../chunks/Tip.9f398c59.js";import{H as N,E as At}from"../chunks/EditOnGithub.582011f0.js";function Ht(R){let i,u='Apple Silicon support is planned for Q4 2024. We are actively seeking contributors to help implement this, develop a concrete plan, and create a detailed list of requirements. Due to limited resources, we rely on community contributions for this implementation effort. To discuss further, please spell out your thoughts and discuss in <a href="https://github.com/bitsandbytes-foundation/bitsandbytes/discussions/1340" rel="nofollow">this GitHub discussion</a> and tag <code>@Titus-von-Koeller</code> and <code>@matthewdouglas</code>. Thank you!';return{c(){i=o("p"),i.innerHTML=u},l(p){i=r(p,"P",{"data-svelte-h":!0}),d(i)!=="svelte-ztwrs6"&&(i.innerHTML=u)},m(p,U){l(p,i,U)},p:_t,d(p){p&&n(i)}}}function Gt(R){let i,u,p,U,m,O,h,ot="As part of a recent refactoring effort, we will soon offer official multi-backend support. Currently, this feature is available in a preview alpha release, allowing us to gather early feedback from users to improve the functionality and identify any bugs.",S,c,rt="At present, the Intel CPU and AMD ROCm backends are considered fully functional. The Intel XPU backend has limited functionality and is less mature.",j,b,dt='Please refer to the <a href="./installation#multi-backend">installation instructions</a> for details on installing the backend you intend to test (and hopefully provide feedback on).',q,f,z,$,X,y,pt="As we are currently in the alpha testing phase, bugs are expected, and performance might not meet expectations. 
However, this is exactly what we want to discover from <strong>your</strong> perspective as the end user!",Y,x,ft="Please share and discuss your feedback with us here:",K,v,ut='<li><a href="https://github.com/bitsandbytes-foundation/bitsandbytes/discussions/1339" rel="nofollow">Github Discussion: Multi-backend refactor: Alpha release ( AMD ROCm ONLY )</a></li> <li><a href="https://github.com/bitsandbytes-foundation/bitsandbytes/discussions/1338" rel="nofollow">Github Discussion: Multi-backend refactor: Alpha release ( Intel ONLY )</a></li>',Q,w,mt="Thank you for your support!",W,C,J,T,V,_,ht='The following performance data is collected from Intel 4th Gen Xeon (SPR) platform. The tables show speed-up and memory compared with different data types of <a href="https://huggingface.co/meta-llama/Llama-2-7b-chat-hf" rel="nofollow">Llama-2-7b-chat-hf</a>.',Z,g,ct="For inference:",tt,k,bt="<thead><tr><th>CPU</th> <th>BF16</th> <th>INT8</th> <th>NF4</th> <th>FP4</th></tr></thead> <tbody><tr><td>speed-up</td> <td>1.0x</td> <td>0.6x</td> <td>2.3x</td> <td>0.03x</td></tr> <tr><td>memory</td> <td>13.1G</td> <td>7.6G</td> <td>5.0G</td> <td>4.6G</td></tr></tbody>",et,P,$t="For fine-tune:",nt,M,yt="<thead><tr><th>CPU</th> <th>AMP BF16</th> <th>INT8</th> <th>NF4</th> <th>FP4</th></tr></thead> <tbody><tr><td>speed-up</td> <td>1.0x</td> <td>0.38x</td> <td>0.07x</td> <td>0.07x</td></tr> <tr><td>memory</td> <td>40G</td> <td>9G</td> <td>6.6G</td> <td>6.6G</td></tr></tbody>",lt,L,at,A,st,B,it;return m=new N({props:{title:"Multi-backend support (non-CUDA backends)",local:"multi-backend-support-non-cuda-backends",headingTag:"h1"}}),f=new Lt({props:{warning:!1,$$slots:{default:[Ht]},$$scope:{ctx:R}}}),$=new N({props:{title:"Alpha Release",local:"alpha-release",headingTag:"h2"}}),C=new N({props:{title:"Benchmarks",local:"benchmarks",headingTag:"h2"}}),T=new N({props:{title:"Intel",local:"intel",headingTag:"h3"}}),L=new N({props:{title:"AMD",local:"amd",headingTag:"h3"}}),A=new 
At({props:{source:"https://github.com/bitsandbytes-foundation/bitsandbytes/blob/main/docs/source/non_cuda_backends.mdx"}}),{c(){i=o("meta"),u=a(),p=o("p"),U=a(),H(m.$$.fragment),O=a(),h=o("p"),h.textContent=ot,S=a(),c=o("p"),c.textContent=rt,j=a(),b=o("p"),b.innerHTML=dt,q=a(),H(f.$$.fragment),z=a(),H($.$$.fragment),X=a(),y=o("p"),y.innerHTML=pt,Y=a(),x=o("p"),x.textContent=ft,K=a(),v=o("ul"),v.innerHTML=ut,Q=a(),w=o("p"),w.textContent=mt,W=a(),H(C.$$.fragment),J=a(),H(T.$$.fragment),V=a(),_=o("p"),_.innerHTML=ht,Z=a(),g=o("p"),g.textContent=ct,tt=a(),k=o("table"),k.innerHTML=bt,et=a(),P=o("p"),P.textContent=$t,nt=a(),M=o("table"),M.innerHTML=yt,lt=a(),H(L.$$.fragment),at=a(),H(A.$$.fragment),st=a(),B=o("p"),this.h()},l(t){const e=Pt("svelte-u9bgzb",document.head);i=r(e,"META",{name:!0,content:!0}),e.forEach(n),u=s(t),p=r(t,"P",{}),vt(p).forEach(n),U=s(t),G(m.$$.fragment,t),O=s(t),h=r(t,"P",{"data-svelte-h":!0}),d(h)!=="svelte-vyk3k9"&&(h.textContent=ot),S=s(t),c=r(t,"P",{"data-svelte-h":!0}),d(c)!=="svelte-12ne44y"&&(c.textContent=rt),j=s(t),b=r(t,"P",{"data-svelte-h":!0}),d(b)!=="svelte-1wpsr8f"&&(b.innerHTML=dt),q=s(t),G(f.$$.fragment,t),z=s(t),G($.$$.fragment,t),X=s(t),y=r(t,"P",{"data-svelte-h":!0}),d(y)!=="svelte-njzoox"&&(y.innerHTML=pt),Y=s(t),x=r(t,"P",{"data-svelte-h":!0}),d(x)!=="svelte-5kenpg"&&(x.textContent=ft),K=s(t),v=r(t,"UL",{"data-svelte-h":!0}),d(v)!=="svelte-7ea0dg"&&(v.innerHTML=ut),Q=s(t),w=r(t,"P",{"data-svelte-h":!0}),d(w)!=="svelte-16dyb3n"&&(w.textContent=mt),W=s(t),G(C.$$.fragment,t),J=s(t),G(T.$$.fragment,t),V=s(t),_=r(t,"P",{"data-svelte-h":!0}),d(_)!=="svelte-1qmjl0d"&&(_.innerHTML=ht),Z=s(t),g=r(t,"P",{"data-svelte-h":!0}),d(g)!=="svelte-1skyg7e"&&(g.textContent=ct),tt=s(t),k=r(t,"TABLE",{"data-svelte-h":!0}),d(k)!=="svelte-1cj7hng"&&(k.innerHTML=bt),et=s(t),P=r(t,"P",{"data-svelte-h":!0}),d(P)!=="svelte-18h2pc"&&(P.textContent=$t),nt=s(t),M=r(t,"TABLE",{"data-svelte-h":!0}),d(M)!=="svelte-161am9d"&&(M.innerHTML=yt),lt=s(t),G(L.$$.fra
gment,t),at=s(t),G(A.$$.fragment,t),st=s(t),B=r(t,"P",{}),vt(B).forEach(n),this.h()},h(){wt(i,"name","hf:doc:metadata"),wt(i,"content",Dt)},m(t,e){Mt(document.head,i),l(t,u,e),l(t,p,e),l(t,U,e),D(m,t,e),l(t,O,e),l(t,h,e),l(t,S,e),l(t,c,e),l(t,j,e),l(t,b,e),l(t,q,e),D(f,t,e),l(t,z,e),D($,t,e),l(t,X,e),l(t,y,e),l(t,Y,e),l(t,x,e),l(t,K,e),l(t,v,e),l(t,Q,e),l(t,w,e),l(t,W,e),D(C,t,e),l(t,J,e),D(T,t,e),l(t,V,e),l(t,_,e),l(t,Z,e),l(t,g,e),l(t,tt,e),l(t,k,e),l(t,et,e),l(t,P,e),l(t,nt,e),l(t,M,e),l(t,lt,e),D(L,t,e),l(t,at,e),D(A,t,e),l(t,st,e),l(t,B,e),it=!0},p(t,[e]){const xt={};e&2&&(xt.$$scope={dirty:e,ctx:t}),f.$set(xt)},i(t){it||(E(m.$$.fragment,t),E(f.$$.fragment,t),E($.$$.fragment,t),E(C.$$.fragment,t),E(T.$$.fragment,t),E(L.$$.fragment,t),E(A.$$.fragment,t),it=!0)},o(t){F(m.$$.fragment,t),F(f.$$.fragment,t),F($.$$.fragment,t),F(C.$$.fragment,t),F(T.$$.fragment,t),F(L.$$.fragment,t),F(A.$$.fragment,t),it=!1},d(t){t&&(n(u),n(p),n(U),n(O),n(h),n(S),n(c),n(j),n(b),n(q),n(z),n(X),n(y),n(Y),n(x),n(K),n(v),n(Q),n(w),n(W),n(J),n(V),n(_),n(Z),n(g),n(tt),n(k),n(et),n(P),n(nt),n(M),n(lt),n(at),n(st),n(B)),n(i),I(m,t),I(f,t),I($,t),I(C,t),I(T,t),I(L,t),I(A,t)}}}const Dt='{"title":"Multi-backend support (non-CUDA backends)","local":"multi-backend-support-non-cuda-backends","sections":[{"title":"Alpha Release","local":"alpha-release","sections":[],"depth":2},{"title":"Benchmarks","local":"benchmarks","sections":[{"title":"Intel","local":"intel","sections":[],"depth":3},{"title":"AMD","local":"amd","sections":[],"depth":3}],"depth":2}],"depth":1}';function Et(R){return Tt(()=>{new URLSearchParams(window.location.search).get("fw")}),[]}class Nt extends gt{constructor(i){super(),kt(this,i,Et,Gt,Ct,{})}}export{Nt as component};

Xet Storage Details

Size:
7.58 kB
·
Xet hash:
4cf8e8fecba318a46e6be9c2da9976e44d4722c4dc2d0ab8aad99538e9249ebb

Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.