Buckets:

rtrm's picture
download
raw
8.21 kB
import{s as Tt,o as _t,n as xt}from"../chunks/scheduler.852ec091.js";import{S as Ct,i as kt,g as r,s as l,r as u,A as Pt,h as d,f as n,c as i,j as yt,u as m,x as f,k as vt,y as Mt,a,v as h,d as c,t as $,w as b}from"../chunks/index.28275fd3.js";import{T as wt}from"../chunks/Tip.9f398c59.js";import{H as R,E as Lt}from"../chunks/EditOnGithub.582011f0.js";function At(G){let s,p="If you feel these docs need some additional info, please consider submitting a PR or respectfully request the missing info in one of the below mentioned Github discussion spaces.";return{c(){s=r("p"),s.textContent=p},l(o){s=d(o,"P",{"data-svelte-h":!0}),f(s)!=="svelte-1mb3sz"&&(s.textContent=p)},m(o,g){a(o,s,g)},p:xt,d(o){o&&n(s)}}}function Ht(G){let s,p='Apple Silicon support is planned for Q4 2024. We are actively seeking contributors to help implement this, develop a concrete plan, and create a detailed list of requirements. Due to limited resources, we rely on community contributions for this implementation effort. To discuss further, please spell out your thoughts and discuss in <a href="https://github.com/bitsandbytes-foundation/bitsandbytes/discussions/1340" rel="nofollow">this GitHub discussion</a> and tag <code>@Titus-von-Koeller</code> and <code>@matthewdouglas</code>. Thank you!';return{c(){s=r("p"),s.innerHTML=p},l(o){s=d(o,"P",{"data-svelte-h":!0}),f(s)!=="svelte-ztwrs6"&&(s.innerHTML=p)},m(o,g){a(o,s,g)},p:xt,d(o){o&&n(s)}}}function Ut(G){let s,p,o,g,w,z,y,N,x,ot="As part of a recent refactoring effort, we will soon offer official multi-backend support. Currently, this feature is available in a preview alpha release, allowing us to gather early feedback from users to improve the functionality and identify any bugs.",q,T,rt="At present, the Intel CPU and AMD ROCm backends are considered fully functional. The Intel XPU backend has limited functionality and is less mature.",O,_,dt='Please refer to the <a href="./installation#multi-backend">installation instructions</a> for details on installing the backend you intend to test (and hopefully provide feedback on).',j,v,X,C,Y,k,ft="As we are currently in the alpha testing phase, bugs are expected, and performance might not meet expectations. However, this is exactly what we want to discover from <strong>your</strong> perspective as the end user!",K,P,pt="Please share and discuss your feedback with us here:",Q,M,ut='<li><a href="https://github.com/bitsandbytes-foundation/bitsandbytes/discussions/1339" rel="nofollow">Github Discussion: Multi-backend refactor: Alpha release ( AMD ROCm ONLY )</a></li> <li><a href="https://github.com/bitsandbytes-foundation/bitsandbytes/discussions/1338" rel="nofollow">Github Discussion: Multi-backend refactor: Alpha release ( Intel ONLY )</a></li>',W,L,mt="Thank you for your support!",J,A,V,H,Z,U,ht='The following performance data is collected from Intel 4th Gen Xeon (SPR) platform. The tables show speed-up and memory compared with different data types of <a href="https://huggingface.co/meta-llama/Llama-2-7b-chat-hf" rel="nofollow">Llama-2-7b-chat-hf</a>.',tt,I,et,B,ct="<thead><tr><th>Data Type</th> <th>BF16</th> <th>INT8</th> <th>NF4</th> <th>FP4</th></tr></thead> <tbody><tr><td>Speed-Up (vs BF16)</td> <td>1.0x</td> <td>0.6x</td> <td>2.3x</td> <td>0.03x</td></tr> <tr><td>Memory (GB)</td> <td>13.1</td> <td>7.6</td> <td>5.0</td> <td>4.6</td></tr></tbody>",nt,F,at,D,$t="<thead><tr><th>Data Type</th> <th>AMP BF16</th> <th>INT8</th> <th>NF4</th> <th>FP4</th></tr></thead> <tbody><tr><td>Speed-Up (vs AMP BF16)</td> <td>1.0x</td> <td>0.38x</td> <td>0.07x</td> <td>0.07x</td></tr> <tr><td>Memory (GB)</td> <td>40</td> <td>9</td> <td>6.6</td> <td>6.6</td></tr></tbody>",st,E,lt,S,it;return w=new R({props:{title:"Multi-backend support (non-CUDA backends)",local:"multi-backend-support-non-cuda-backends",headingTag:"h1"}}),y=new wt({props:{warning:!1,$$slots:{default:[At]},$$scope:{ctx:G}}}),v=new wt({props:{warning:!1,$$slots:{default:[Ht]},$$scope:{ctx:G}}}),C=new R({props:{title:"Alpha Release",local:"alpha-release",headingTag:"h2"}}),A=new R({props:{title:"Benchmarks",local:"benchmarks",headingTag:"h2"}}),H=new R({props:{title:"Intel",local:"intel",headingTag:"h3"}}),I=new R({props:{title:"Inference (CPU)",local:"inference-cpu",headingTag:"h4"}}),F=new R({props:{title:"Fine-Tuning (CPU)",local:"fine-tuning-cpu",headingTag:"h4"}}),E=new Lt({props:{source:"https://github.com/bitsandbytes-foundation/bitsandbytes/blob/main/docs/source/non_cuda_backends.mdx"}}),{c(){s=r("meta"),p=l(),o=r("p"),g=l(),u(w.$$.fragment),z=l(),u(y.$$.fragment),N=l(),x=r("p"),x.textContent=ot,q=l(),T=r("p"),T.textContent=rt,O=l(),_=r("p"),_.innerHTML=dt,j=l(),u(v.$$.fragment),X=l(),u(C.$$.fragment),Y=l(),k=r("p"),k.innerHTML=ft,K=l(),P=r("p"),P.textContent=pt,Q=l(),M=r("ul"),M.innerHTML=ut,W=l(),L=r("p"),L.textContent=mt,J=l(),u(A.$$.fragment),V=l(),u(H.$$.fragment),Z=l(),U=r("p"),U.innerHTML=ht,tt=l(),u(I.$$.fragment),et=l(),B=r("table"),B.innerHTML=ct,nt=l(),u(F.$$.fragment),at=l(),D=r("table"),D.innerHTML=$t,st=l(),u(E.$$.fragment),lt=l(),S=r("p"),this.h()},l(t){const e=Pt("svelte-u9bgzb",document.head);s=d(e,"META",{name:!0,content:!0}),e.forEach(n),p=i(t),o=d(t,"P",{}),yt(o).forEach(n),g=i(t),m(w.$$.fragment,t),z=i(t),m(y.$$.fragment,t),N=i(t),x=d(t,"P",{"data-svelte-h":!0}),f(x)!=="svelte-vyk3k9"&&(x.textContent=ot),q=i(t),T=d(t,"P",{"data-svelte-h":!0}),f(T)!=="svelte-12ne44y"&&(T.textContent=rt),O=i(t),_=d(t,"P",{"data-svelte-h":!0}),f(_)!=="svelte-1wpsr8f"&&(_.innerHTML=dt),j=i(t),m(v.$$.fragment,t),X=i(t),m(C.$$.fragment,t),Y=i(t),k=d(t,"P",{"data-svelte-h":!0}),f(k)!=="svelte-njzoox"&&(k.innerHTML=ft),K=i(t),P=d(t,"P",{"data-svelte-h":!0}),f(P)!=="svelte-5kenpg"&&(P.textContent=pt),Q=i(t),M=d(t,"UL",{"data-svelte-h":!0}),f(M)!=="svelte-7ea0dg"&&(M.innerHTML=ut),W=i(t),L=d(t,"P",{"data-svelte-h":!0}),f(L)!=="svelte-16dyb3n"&&(L.textContent=mt),J=i(t),m(A.$$.fragment,t),V=i(t),m(H.$$.fragment,t),Z=i(t),U=d(t,"P",{"data-svelte-h":!0}),f(U)!=="svelte-1qmjl0d"&&(U.innerHTML=ht),tt=i(t),m(I.$$.fragment,t),et=i(t),B=d(t,"TABLE",{"data-svelte-h":!0}),f(B)!=="svelte-1wzn4ht"&&(B.innerHTML=ct),nt=i(t),m(F.$$.fragment,t),at=i(t),D=d(t,"TABLE",{"data-svelte-h":!0}),f(D)!=="svelte-zjxg1q"&&(D.innerHTML=$t),st=i(t),m(E.$$.fragment,t),lt=i(t),S=d(t,"P",{}),yt(S).forEach(n),this.h()},h(){vt(s,"name","hf:doc:metadata"),vt(s,"content",It)},m(t,e){Mt(document.head,s),a(t,p,e),a(t,o,e),a(t,g,e),h(w,t,e),a(t,z,e),h(y,t,e),a(t,N,e),a(t,x,e),a(t,q,e),a(t,T,e),a(t,O,e),a(t,_,e),a(t,j,e),h(v,t,e),a(t,X,e),h(C,t,e),a(t,Y,e),a(t,k,e),a(t,K,e),a(t,P,e),a(t,Q,e),a(t,M,e),a(t,W,e),a(t,L,e),a(t,J,e),h(A,t,e),a(t,V,e),h(H,t,e),a(t,Z,e),a(t,U,e),a(t,tt,e),h(I,t,e),a(t,et,e),a(t,B,e),a(t,nt,e),h(F,t,e),a(t,at,e),a(t,D,e),a(t,st,e),h(E,t,e),a(t,lt,e),a(t,S,e),it=!0},p(t,[e]){const bt={};e&2&&(bt.$$scope={dirty:e,ctx:t}),y.$set(bt);const gt={};e&2&&(gt.$$scope={dirty:e,ctx:t}),v.$set(gt)},i(t){it||(c(w.$$.fragment,t),c(y.$$.fragment,t),c(v.$$.fragment,t),c(C.$$.fragment,t),c(A.$$.fragment,t),c(H.$$.fragment,t),c(I.$$.fragment,t),c(F.$$.fragment,t),c(E.$$.fragment,t),it=!0)},o(t){$(w.$$.fragment,t),$(y.$$.fragment,t),$(v.$$.fragment,t),$(C.$$.fragment,t),$(A.$$.fragment,t),$(H.$$.fragment,t),$(I.$$.fragment,t),$(F.$$.fragment,t),$(E.$$.fragment,t),it=!1},d(t){t&&(n(p),n(o),n(g),n(z),n(N),n(x),n(q),n(T),n(O),n(_),n(j),n(X),n(Y),n(k),n(K),n(P),n(Q),n(M),n(W),n(L),n(J),n(V),n(Z),n(U),n(tt),n(et),n(B),n(nt),n(at),n(D),n(st),n(lt),n(S)),n(s),b(w,t),b(y,t),b(v,t),b(C,t),b(A,t),b(H,t),b(I,t),b(F,t),b(E,t)}}}const It='{"title":"Multi-backend support (non-CUDA backends)","local":"multi-backend-support-non-cuda-backends","sections":[{"title":"Alpha Release","local":"alpha-release","sections":[],"depth":2},{"title":"Benchmarks","local":"benchmarks","sections":[{"title":"Intel","local":"intel","sections":[{"title":"Inference (CPU)","local":"inference-cpu","sections":[],"depth":4},{"title":"Fine-Tuning (CPU)","local":"fine-tuning-cpu","sections":[],"depth":4}],"depth":3}],"depth":2}],"depth":1}';function Bt(G){return _t(()=>{new URLSearchParams(window.location.search).get("fw")}),[]}class Rt extends Ct{constructor(s){super(),kt(this,s,Bt,Ut,Tt,{})}}export{Rt as component};

Xet Storage Details

Size:
8.21 kB
·
Xet hash:
40c1b81f3c71d20dff4954a3560a76856a6925eb5398599da10dc2bd2db5dd6e

Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.