Buckets:

hf-doc-build
/

doc-dev

hf-doc-build/doc-dev / bitsandbytes /main /en /_app /immutable /nodes /9.9cbad9fa.js

rtrm's picture

about 1 month ago

3.35 kB

// Page module for the bitsandbytes documentation index page.
//
// The `svelte-*` hash strings and `data-svelte-h` attributes below suggest this
// is compiled Svelte output. The single-letter helpers imported here live in
// chunk files that are not visible from this file, so the comments describe
// them only as far as their call sites show.
import { s as O, n as Q, o as W } from "../chunks/scheduler.852ec091.js";
import {
  S as D,
  i as J,
  g as d,
  s,
  r as T,
  A as K,
  h as b,
  f as a,
  c as o,
  j as B,
  u as M,
  x as P,
  k as I,
  y as N,
  a as n,
  v as k,
  d as E,
  t as H,
  w as S,
} from "../chunks/index.28275fd3.js";
import { H as G, E as V } from "../chunks/EditOnGithub.582011f0.js";

// JSON string written into the `content` attribute of the
// `hf:doc:metadata` <meta> node by the fragment's `h()` method.
const Y = '{"title":"bitsandbytes","local":"bitsandbytes","sections":[],"depth":1}';

/**
 * Builds the fragment object for this page.
 *
 * The returned object exposes the methods `c`, `l`, `h`, `m`, `p`, `i`, `o`
 * and `d`; each one drives the imported helpers over the same fixed set of
 * nodes and child components, always in document order.
 * NOTE(review): these look like the usual Svelte fragment hooks (create,
 * claim, hydrate, mount, update, intro, outro, destroy) — confirm against the
 * runtime chunk.
 *
 * @param {*} _unused - Ignored; the page has no dynamic state.
 * @returns {object} The fragment object described above.
 */
function X(_unused) {
  // Nodes are declared here and assigned later by `c()` or `l()`.
  let metaTag;
  let sep1;
  let emptyParaTop;
  let sep2;
  let sep3;
  let introPara;
  let sep4;
  let featureList;
  let sep5;
  let sep6;
  let licensePara;
  let sep7;
  let creditsPara;
  let sep8;
  let sep9;
  let emptyParaBottom;
  // Toggled to true by `m()`/`i()` and to false by `o()`.
  let current;

  const introText =
    "bitsandbytes enables accessible large language models via k-bit quantization for PyTorch. bitsandbytes provides three main features for dramatically reducing memory consumption for inference and training:";

  // NOTE(review): in the file as received, this literal was broken by a raw
  // line break right after "performance. ", which is a syntax error inside a
  // quoted string. The break is kept here as an explicit `\n` escape. The
  // original character may have been a different line separator — confirm
  // against the build output.
  const featureListHtml =
    "<li>8-bit optimizers uses block-wise quantization to maintain 32-bit performance at a small fraction of the memory cost.</li> " +
    "<li>LLM.Int() or 8-bit quantization enables large language model inference with only half the required memory and without any performance degradation. This method is based on vector-wise quantization to quantize most features to 8-bits and separately treating outliers with 16-bit matrix multiplication.</li> " +
    "<li>QLoRA or 4-bit quantization enables large language model training with several memory-saving techniques that don’t compromise performance. \nThis method quantizes a model to 4-bits and inserts a small set of trainable low-rank adaptation (LoRA) weights to allow training.</li>";

  const licenseText = "bitsandbytes is MIT licensed.";

  const creditsHtml =
    'We thank Fabio Cannizzo for his work on <a href="https://github.com/fabiocannizzo/FastBinarySearch" rel="nofollow">FastBinarySearch</a> which we use for CPU quantization.';

  // Child components: two headings and the "edit on GitHub" footer link.
  const titleHeading = new G({
    props: { title: "bitsandbytes", local: "bitsandbytes", headingTag: "h1" },
  });
  const licenseHeading = new G({
    props: { title: "License", local: "license", headingTag: "h1" },
  });
  const editLink = new V({
    props: {
      source:
        "https://github.com/bitsandbytes-foundation/bitsandbytes/blob/main/docs/source/index.mdx",
    },
  });

  return {
    // Builds every node from scratch and fills in the static content.
    c() {
      metaTag = d("meta");
      sep1 = s();
      emptyParaTop = d("p");
      sep2 = s();
      T(titleHeading.$$.fragment);
      sep3 = s();
      introPara = d("p");
      introPara.textContent = introText;
      sep4 = s();
      featureList = d("ul");
      featureList.innerHTML = featureListHtml;
      sep5 = s();
      T(licenseHeading.$$.fragment);
      sep6 = s();
      licensePara = d("p");
      licensePara.textContent = licenseText;
      sep7 = s();
      creditsPara = d("p");
      creditsPara.innerHTML = creditsHtml;
      sep8 = s();
      T(editLink.$$.fragment);
      sep9 = s();
      emptyParaBottom = d("p");
      this.h();
    },

    // Same node set as `c()`, but obtained through the `b`/`o`/`M` helpers
    // from `nodes`. Static content is only rewritten when the value returned
    // by `P(node)` differs from the expected hash string.
    l(nodes) {
      const headNodes = K("svelte-u9bgzb", document.head);
      metaTag = b(headNodes, "META", { name: true, content: true });
      headNodes.forEach(a);
      sep1 = o(nodes);
      emptyParaTop = b(nodes, "P", {});
      B(emptyParaTop).forEach(a);
      sep2 = o(nodes);
      M(titleHeading.$$.fragment, nodes);
      sep3 = o(nodes);
      introPara = b(nodes, "P", { "data-svelte-h": true });
      if (P(introPara) !== "svelte-18pq57t") {
        introPara.textContent = introText;
      }
      sep4 = o(nodes);
      featureList = b(nodes, "UL", { "data-svelte-h": true });
      if (P(featureList) !== "svelte-1tzxzzf") {
        featureList.innerHTML = featureListHtml;
      }
      sep5 = o(nodes);
      M(licenseHeading.$$.fragment, nodes);
      sep6 = o(nodes);
      licensePara = b(nodes, "P", { "data-svelte-h": true });
      if (P(licensePara) !== "svelte-zzmy3r") {
        licensePara.textContent = licenseText;
      }
      sep7 = o(nodes);
      creditsPara = b(nodes, "P", { "data-svelte-h": true });
      if (P(creditsPara) !== "svelte-18bjayv") {
        creditsPara.innerHTML = creditsHtml;
      }
      sep8 = o(nodes);
      M(editLink.$$.fragment, nodes);
      sep9 = o(nodes);
      emptyParaBottom = b(nodes, "P", {});
      B(emptyParaBottom).forEach(a);
      this.h();
    },

    // Sets the attributes of the metadata <meta> node.
    h() {
      I(metaTag, "name", "hf:doc:metadata");
      I(metaTag, "content", Y);
    },

    // Places the meta node under document.head and everything else under
    // `target`, passing `anchor` through to the helpers.
    // NOTE(review): presumably `anchor` is the insert-before reference —
    // confirm against the runtime chunk.
    m(target, anchor) {
      N(document.head, metaTag);
      n(target, sep1, anchor);
      n(target, emptyParaTop, anchor);
      n(target, sep2, anchor);
      k(titleHeading, target, anchor);
      n(target, sep3, anchor);
      n(target, introPara, anchor);
      n(target, sep4, anchor);
      n(target, featureList, anchor);
      n(target, sep5, anchor);
      k(licenseHeading, target, anchor);
      n(target, sep6, anchor);
      n(target, licensePara, anchor);
      n(target, sep7, anchor);
      n(target, creditsPara, anchor);
      n(target, sep8, anchor);
      k(editLink, target, anchor);
      n(target, sep9, anchor);
      n(target, emptyParaBottom, anchor);
      current = true;
    },

    // The imported `n` export from the scheduler chunk is used as-is here.
    p: Q,

    // Runs `E` on each child component once; skipped while `current` is set.
    // `local` is forwarded unchanged to the helper.
    i(local) {
      if (current) {
        return;
      }
      E(titleHeading.$$.fragment, local);
      E(licenseHeading.$$.fragment, local);
      E(editLink.$$.fragment, local);
      current = true;
    },

    // Runs `H` on each child component and clears `current`.
    o(local) {
      H(titleHeading.$$.fragment, local);
      H(licenseHeading.$$.fragment, local);
      H(editLink.$$.fragment, local);
      current = false;
    },

    // Passes the body nodes to `a` only when `removeNodes` is truthy. The
    // meta node and the child components are always torn down.
    d(removeNodes) {
      if (removeNodes) {
        a(sep1);
        a(emptyParaTop);
        a(sep2);
        a(sep3);
        a(introPara);
        a(sep4);
        a(featureList);
        a(sep5);
        a(sep6);
        a(licensePara);
        a(sep7);
        a(creditsPara);
        a(sep8);
        a(sep9);
        a(emptyParaBottom);
      }
      a(metaTag);
      S(titleHeading, removeNodes);
      S(licenseHeading, removeNodes);
      S(editLink, removeNodes);
    },
  };
}

/**
 * Instance function handed to `J` by the component constructor.
 *
 * Registers a callback through `W` that reads the `fw` query parameter and
 * discards the result, then returns an empty array.
 *
 * @param {*} _unused - Ignored.
 * @returns {Array} Always an empty array.
 */
function Z(_unused) {
  W(() => {
    // The looked-up value is intentionally left unused, as in the original.
    new URLSearchParams(window.location.search).get("fw");
  });
  return [];
}

/**
 * Page component; exported under the name `component`.
 */
class nt extends D {
  /**
   * @param {*} options - Forwarded unchanged as the second argument to `J`.
   */
  constructor(options) {
    super();
    J(this, options, Z, X, O, {});
  }
}

export { nt as component };

Xet Storage Details

Size: 3.35 kB
Xet hash: aa8b71de53ccdb26ecf365f142611eac4bc7f45436c1e4555a405c5584b90d65

Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.