Buckets:
| import{s as Ee,n as Ae,o as Re}from"../chunks/scheduler.8a2cc2fa.js";import{S as Ze,i as We,e as i,s as a,c as r,h as ze,a as M,d as t,b as n,f as ge,g as p,j as T,k as Be,l as ve,m as s,n as m,t as o,o as y,p as w}from"../chunks/index.7079e750.js";import{C as xe,H as N,E as Le}from"../chunks/MermaidChart.svelte_svelte_type_style_lang.2b7ce466.js";import{C as G}from"../chunks/CodeBlock.a326412a.js";function Ne(Ue){let c,F,S,H,J,Y,U,D,u,ue="The below academic work is ordered in reverse chronological order.",V,j,_,h,je="Authors: Tim Dettmers, Ruslan Svirschevski, Vage Egiazarian, Denis Kuznedelev, Elias Frantar, Saleh Ashkboos, Alexander Borzunov, Torsten Hoefler, Dan Alistarh",P,d,he='<li><a href="https://twitter.com/Tim_Dettmers/status/1666076553665744896" rel="nofollow">Twitter summary thread</a></li>',q,b,O,f,K,C,de="Authors: Tim Dettmers, Artidoro Pagnoni, Ari Holtzman, Luke Zettlemoyer",ee,I,be='<li><a href="https://www.youtube.com/watch?v=y9PHWGOa8HA&ab_channel=LondonMachineLearningMeetup" rel="nofollow">Video</a></li> <li><a href="https://twitter.com/Tim_Dettmers/status/1661379354507476994" rel="nofollow">Twitter summary thread</a></li>',le,k,te,$,se,Q,fe="Authors: Tim Dettmers, Luke Zettlemoyer",ae,g,Ce='<li><a href="https://www.youtube.com/watch?v=odlQa6AE1gY&ab_channel=TheInsideView" rel="nofollow">Video</a></li> <li><a href="https://twitter.com/Tim_Dettmers/status/1605209171758284805" rel="nofollow">Twitter summary thread</a></li>',ne,B,ie,E,Me,A,Ie="Authors: Tim Dettmers, Mike Lewis, Younes Belkada, Luke Zettlemoyer",re,R,ke='<li><a href="https://huggingface.co/blog/hf-bitsandbytes-integration" rel="nofollow">LLM.int8() Blog Post</a></li> <li><a href="https://timdettmers.com/2022/08/17/llm-int8-and-emergent-features/" rel="nofollow">LLM.int8() Emergent Features Blog Post</a></li> <li><a href="https://towardsdatascience.com/introduction-to-weight-quantization-2494701b9c0c" rel="nofollow">Introduction to Weight Quantization</a></li> <li><a href="https://twitter.com/Tim_Dettmers/status/1598351301942951937" rel="nofollow">Poster</a></li>',pe,Z,me,W,oe,z,$e="Authors: Tim Dettmers, Mike Lewis, Sam Shleifer, Luke Zettlemoyer",ye,v,Qe='<li><a href="https://www.youtube.com/watch?v=IxrlHAJtqKE" rel="nofollow">Video</a></li> <li><a href="https://twitter.com/Tim_Dettmers/status/1446472128979562499" rel="nofollow">Twitter summary thread</a></li>',we,x,Te,L,ce,X,Je;return J=new xe({props:{containerStyle:"float: right; margin-left: 10px; display: inline-flex; position: relative; z-index: 10;"}}),U=new N({props:{title:"Papers, related resources & how to cite",local:"papers-related-resources--how-to-cite",headingTag:"h1"}}),j=new N({props:{title:"SpQR: A Sparse-Quantized Representation for Near-Lossless LLM Weight Compression (Jun 2023)",local:"spqr-a-sparse-quantized-representation-for-near-lossless-llm-weight-compression-jun-2023",headingTag:"h2"}}),b=new G({props:{code:"JTQwYXJ0aWNsZSU3QmRldHRtZXJzMjAyM3NwcXIlMkMlMEElMjAlMjB0aXRsZSUzRCU3QlNwUVIlM0ElMjBBJTIwU3BhcnNlLVF1YW50aXplZCUyMFJlcHJlc2VudGF0aW9uJTIwZm9yJTIwTmVhci1Mb3NzbGVzcyUyMExMTSUyMFdlaWdodCUyMENvbXByZXNzaW9uJTdEJTJDJTBBJTIwJTIwYXV0aG9yJTNEJTdCRGV0dG1lcnMlMkMlMjBUaW0lMjBhbmQlMjBTdmlyc2NoZXZza2klMkMlMjBSdXNsYW4lMjBhbmQlMjBFZ2lhemFyaWFuJTJDJTIwVmFnZSUyMGFuZCUyMEt1em5lZGVsZXYlMkMlMjBEZW5pcyUyMGFuZCUyMEZyYW50YXIlMkMlMjBFbGlhcyUyMGFuZCUyMEFzaGtib29zJTJDJTIwU2FsZWglMjBhbmQlMjBCb3J6dW5vdiUyQyUyMEFsZXhhbmRlciUyMGFuZCUyMEhvZWZsZXIlMkMlMjBUb3JzdGVuJTIwYW5kJTIwQWxpc3RhcmglMkMlMjBEYW4lN0QlMkMlMEElMjAlMjBqb3VybmFsJTNEJTdCYXJYaXYlMjBwcmVwcmludCUyMGFyWGl2JTNBMjMwNi4wMzA3OCU3RCUyQyUwQSUyMCUyMHllYXIlM0QlN0IyMDIzJTdEJTBBJTdE",highlighted:`@article{dettmers2023spqr, | |
| title={SpQR: A Sparse-Quantized Representation for Near-Lossless <span class="hljs-keyword">LLM </span>Weight Compression}, | |
| author={Dettmers, Tim <span class="hljs-keyword">and </span>Svirschevski, Ruslan <span class="hljs-keyword">and </span>Egiazarian, Vage <span class="hljs-keyword">and </span>Kuznedelev, Denis <span class="hljs-keyword">and </span>Frantar, Elias <span class="hljs-keyword">and </span>Ashkboos, Saleh <span class="hljs-keyword">and </span><span class="hljs-keyword">Borzunov, </span>Alexander <span class="hljs-keyword">and </span>Hoefler, Torsten <span class="hljs-keyword">and </span>Alistarh, Dan}, | |
| <span class="hljs-keyword">journal={arXiv </span>preprint arXiv:<span class="hljs-number">2306</span>.<span class="hljs-number">03078</span>}, | |
| year={<span class="hljs-number">2023</span>} | |
| }`,wrap:!1}}),f=new N({props:{title:"QLoRA: Efficient Finetuning of Quantized LLMs (May 2023)",local:"qlora-efficient-finetuning-of-quantized-llms-may-2023",headingTag:"h2"}}),k=new G({props:{code:"JTQwYXJ0aWNsZSU3QmRldHRtZXJzMjAyM3Fsb3JhJTJDJTBBJTIwJTIwdGl0bGUlM0QlN0JRbG9yYSUzQSUyMEVmZmljaWVudCUyMGZpbmV0dW5pbmclMjBvZiUyMHF1YW50aXplZCUyMGxsbXMlN0QlMkMlMEElMjAlMjBhdXRob3IlM0QlN0JEZXR0bWVycyUyQyUyMFRpbSUyMGFuZCUyMFBhZ25vbmklMkMlMjBBcnRpZG9ybyUyMGFuZCUyMEhvbHR6bWFuJTJDJTIwQXJpJTIwYW5kJTIwWmV0dGxlbW95ZXIlMkMlMjBMdWtlJTdEJTJDJTBBJTIwJTIwam91cm5hbCUzRCU3QmFyWGl2JTIwcHJlcHJpbnQlMjBhclhpdiUzQTIzMDUuMTQzMTQlN0QlMkMlMEElMjAlMjB5ZWFyJTNEJTdCMjAyMyU3RCUwQSU3RA==",highlighted:`@article{dettmers2023qlora, | |
| title={Qlora: Efficient finetuning of quantized <span class="hljs-keyword">llms}, | |
| </span> author={Dettmers, Tim <span class="hljs-keyword">and </span>Pagnoni, Artidoro <span class="hljs-keyword">and </span>Holtzman, Ari <span class="hljs-keyword">and </span>Zettlemoyer, Luke}, | |
| <span class="hljs-keyword">journal={arXiv </span>preprint arXiv:<span class="hljs-number">2305</span>.<span class="hljs-number">14314</span>}, | |
| year={<span class="hljs-number">2023</span>} | |
| }`,wrap:!1}}),$=new N({props:{title:"The case for 4-bit precision: k-bit Inference Scaling Laws (Dec 2022)",local:"the-case-for-4-bit-precision-k-bit-inference-scaling-laws-dec-2022",headingTag:"h2"}}),B=new G({props:{code:"JTQwaW5wcm9jZWVkaW5ncyU3QmRldHRtZXJzMjAyM2Nhc2UlMkMlMEElMjAlMjB0aXRsZSUzRCU3QlRoZSUyMGNhc2UlMjBmb3IlMjA0LWJpdCUyMHByZWNpc2lvbiUzQSUyMGstYml0JTIwaW5mZXJlbmNlJTIwc2NhbGluZyUyMGxhd3MlN0QlMkMlMEElMjAlMjBhdXRob3IlM0QlN0JEZXR0bWVycyUyQyUyMFRpbSUyMGFuZCUyMFpldHRsZW1veWVyJTJDJTIwTHVrZSU3RCUyQyUwQSUyMCUyMGJvb2t0aXRsZSUzRCU3QkludGVybmF0aW9uYWwlMjBDb25mZXJlbmNlJTIwb24lMjBNYWNoaW5lJTIwTGVhcm5pbmclN0QlMkMlMEElMjAlMjBwYWdlcyUzRCU3Qjc3NTAtLTc3NzQlN0QlMkMlMEElMjAlMjB5ZWFyJTNEJTdCMjAyMyU3RCUyQyUwQSUyMCUyMG9yZ2FuaXphdGlvbiUzRCU3QlBNTFIlN0QlMEElN0Q=",highlighted:`<span class="language-xml">@inproceedings</span><span class="hljs-template-variable">{dettmers2023case, | |
| title={The case for 4-bit precision: k-bit inference scaling laws}</span><span class="language-xml">, | |
| author=</span><span class="hljs-template-variable">{Dettmers, Tim and Zettlemoyer, Luke}</span><span class="language-xml">, | |
| booktitle=</span><span class="hljs-template-variable">{International Conference on Machine Learning}</span><span class="language-xml">, | |
| pages=</span><span class="hljs-template-variable">{7750--7774}</span><span class="language-xml">, | |
| year=</span><span class="hljs-template-variable">{2023}</span><span class="language-xml">, | |
| organization=</span><span class="hljs-template-variable">{PMLR}</span><span class="language-xml"> | |
| }</span>`,wrap:!1}}),E=new N({props:{title:"LLM.int8(): 8-bit Matrix Multiplication for Transformers at Scale (Nov 2022)",local:"llm-int8",headingTag:"h2"}}),Z=new G({props:{code:"JTQwYXJ0aWNsZSU3QmRldHRtZXJzMjAyMmxsbSUyQyUwQSUyMCUyMHRpdGxlJTNEJTdCTGxtLiUyMGludDglMjAoKSUzQSUyMDgtYml0JTIwbWF0cml4JTIwbXVsdGlwbGljYXRpb24lMjBmb3IlMjB0cmFuc2Zvcm1lcnMlMjBhdCUyMHNjYWxlJTdEJTJDJTBBJTIwJTIwYXV0aG9yJTNEJTdCRGV0dG1lcnMlMkMlMjBUaW0lMjBhbmQlMjBMZXdpcyUyQyUyME1pa2UlMjBhbmQlMjBCZWxrYWRhJTJDJTIwWW91bmVzJTIwYW5kJTIwWmV0dGxlbW95ZXIlMkMlMjBMdWtlJTdEJTJDJTBBJTIwJTIwam91cm5hbCUzRCU3QmFyWGl2JTIwcHJlcHJpbnQlMjBhclhpdiUzQTIyMDguMDczMzklN0QlMkMlMEElMjAlMjB5ZWFyJTNEJTdCMjAyMiU3RCUwQSU3RA==",highlighted:`@article{dettmers2022llm, | |
| title={<span class="hljs-keyword">Llm. </span>int8 (): <span class="hljs-number">8</span>-<span class="hljs-keyword">bit </span>matrix <span class="hljs-keyword">multiplication </span>for transformers <span class="hljs-built_in">at</span> <span class="hljs-keyword">scale}, | |
| </span> author={Dettmers, Tim <span class="hljs-keyword">and </span>Lewis, Mike <span class="hljs-keyword">and </span><span class="hljs-keyword">Belkada, </span>Younes <span class="hljs-keyword">and </span>Zettlemoyer, Luke}, | |
| <span class="hljs-keyword">journal={arXiv </span>preprint arXiv:<span class="hljs-number">2208</span>.<span class="hljs-number">07339</span>}, | |
| year={<span class="hljs-number">2022</span>} | |
| }`,wrap:!1}}),W=new N({props:{title:"8-bit Optimizers via Block-wise Quantization (Oct 2021)",local:"8-bit-optimizers-via-block-wise-quantization-oct-2021",headingTag:"h2"}}),x=new G({props:{code:"JTQwYXJ0aWNsZSU3QkRCTFAlM0Fqb3VybmFscyUyRmNvcnIlMkZhYnMtMjExMC0wMjg2MSUyQyUwQSUyMCUyMGF1dGhvciUyMCUyMCUyMCUyMCUyMCUyMCUyMCUzRCUyMCU3QlRpbSUyMERldHRtZXJzJTIwYW5kJTBBJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwTWlrZSUyMExld2lzJTIwYW5kJTBBJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwU2FtJTIwU2hsZWlmZXIlMjBhbmQlMEElMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjBMdWtlJTIwWmV0dGxlbW95ZXIlN0QlMkMlMEElMjAlMjB0aXRsZSUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUzRCUyMCU3QjgtYml0JTIwT3B0aW1pemVycyUyMHZpYSUyMEJsb2NrLXdpc2UlMjBRdWFudGl6YXRpb24lN0QlMkMlMEElMjAlMjBqb3VybmFsJTIwJTIwJTIwJTIwJTIwJTIwJTNEJTIwJTdCQ29SUiU3RCUyQyUwQSUyMCUyMHZvbHVtZSUyMCUyMCUyMCUyMCUyMCUyMCUyMCUzRCUyMCU3QmFicyUyRjIxMTAuMDI4NjElN0QlMkMlMEElMjAlMjB5ZWFyJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTNEJTIwJTdCMjAyMSU3RCUyQyUwQSUyMCUyMHVybCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUzRCUyMCU3Qmh0dHBzJTNBJTJGJTJGYXJ4aXYub3JnJTJGYWJzJTJGMjExMC4wMjg2MSU3RCUyQyUwQSUyMCUyMGVwcmludHR5cGUlMjAlMjAlMjAlMjAlM0QlMjAlN0JhclhpdiU3RCUyQyUwQSUyMCUyMGVwcmludCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUzRCUyMCU3QjIxMTAuMDI4NjElN0QlMkMlMEElMjAlMjB0aW1lc3RhbXAlMjAlMjAlMjAlMjAlM0QlMjAlN0JUaHUlMkMlMjAyMSUyME9jdCUyMDIwMjElMjAxNiUzQTIwJTNBMDglMjAlMkIwMjAwJTdEJTJDJTBBJTIwJTIwYmlidXJsJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTNEJTIwJTdCaHR0cHMlM0ElMkYlMkZkYmxwLm9yZyUyRnJlYyUyRmpvdXJuYWxzJTJGY29yciUyRmFicy0yMTEwLTAyODYxLmJpYiU3RCUyQyUwQSUyMCUyMGJpYnNvdXJjZSUyMCUyMCUyMCUyMCUzRCUyMCU3QmRibHAlMjBjb21wdXRlciUyMHNjaWVuY2UlMjBiaWJsaW9ncmFwaHklMkMlMjBodHRwcyUzQSUyRiUyRmRibHAub3JnJTdEJTBBJTdE",highlighted:`@article{DBLP:journals<span class="hljs-regexp">/corr/</span>abs-<span class="hljs-number">2110</span>-<span class="hljs-number">02861</span>, | |
| author = {Tim Dettmers and | |
| Mike Lewis and | |
| Sam Shleifer and | |
| Luke Zettlemoyer}, | |
| title = {<span class="hljs-number">8</span>-bit Optimizers via Block-wise Quantization}, | |
| journal = {CoRR}, | |
| volume = {abs/<span class="hljs-number">2110.02861</span>}, | |
| year = {<span class="hljs-number">2021</span>}, | |
| url = {https:<span class="hljs-regexp">//</span>arxiv.org<span class="hljs-regexp">/abs/</span><span class="hljs-number">2110.02861</span>}, | |
| eprinttype = {arXiv}, | |
| eprint = {<span class="hljs-number">2110.02861</span>}, | |
| timestamp = {Thu, <span class="hljs-number">21</span> Oct <span class="hljs-number">2021</span> <span class="hljs-number">16</span>:<span class="hljs-number">20</span>:<span class="hljs-number">08</span> +<span class="hljs-number">0200</span>}, | |
| biburl = {https:<span class="hljs-regexp">//</span>dblp.org<span class="hljs-regexp">/rec/</span>journals<span class="hljs-regexp">/corr/</span>abs-<span class="hljs-number">2110</span>-<span class="hljs-number">02861</span>.bib}, | |
| bibsource = {dblp computer science bibliography, https:<span class="hljs-regexp">//</span>dblp.org} | |
| }`,wrap:!1}}),L=new Le({props:{source:"https://github.com/bitsandbytes-foundation/bitsandbytes/blob/main/docs/source/explanations/resources.mdx"}}),{c(){c=i("meta"),F=a(),S=i("p"),H=a(),r(J.$$.fragment),Y=a(),r(U.$$.fragment),D=a(),u=i("p"),u.textContent=ue,V=a(),r(j.$$.fragment),_=a(),h=i("p"),h.textContent=je,P=a(),d=i("ul"),d.innerHTML=he,q=a(),r(b.$$.fragment),O=a(),r(f.$$.fragment),K=a(),C=i("p"),C.textContent=de,ee=a(),I=i("ul"),I.innerHTML=be,le=a(),r(k.$$.fragment),te=a(),r($.$$.fragment),se=a(),Q=i("p"),Q.textContent=fe,ae=a(),g=i("ul"),g.innerHTML=Ce,ne=a(),r(B.$$.fragment),ie=a(),r(E.$$.fragment),Me=a(),A=i("p"),A.textContent=Ie,re=a(),R=i("ul"),R.innerHTML=ke,pe=a(),r(Z.$$.fragment),me=a(),r(W.$$.fragment),oe=a(),z=i("p"),z.textContent=$e,ye=a(),v=i("ul"),v.innerHTML=Qe,we=a(),r(x.$$.fragment),Te=a(),r(L.$$.fragment),ce=a(),X=i("p"),this.h()},l(e){const l=ze("svelte-u9bgzb",document.head);c=M(l,"META",{name:!0,content:!0}),l.forEach(t),F=n(e),S=M(e,"P",{}),ge(S).forEach(t),H=n(e),p(J.$$.fragment,e),Y=n(e),p(U.$$.fragment,e),D=n(e),u=M(e,"P",{"data-svelte-h":!0}),T(u)!=="svelte-1jp7sfc"&&(u.textContent=ue),V=n(e),p(j.$$.fragment,e),_=n(e),h=M(e,"P",{"data-svelte-h":!0}),T(h)!=="svelte-6ej7zg"&&(h.textContent=je),P=n(e),d=M(e,"UL",{"data-svelte-h":!0}),T(d)!=="svelte-1bk8yei"&&(d.innerHTML=he),q=n(e),p(b.$$.fragment,e),O=n(e),p(f.$$.fragment,e),K=n(e),C=M(e,"P",{"data-svelte-h":!0}),T(C)!=="svelte-1m3ezda"&&(C.textContent=de),ee=n(e),I=M(e,"UL",{"data-svelte-h":!0}),T(I)!=="svelte-95bqwh"&&(I.innerHTML=be),le=n(e),p(k.$$.fragment,e),te=n(e),p($.$$.fragment,e),se=n(e),Q=M(e,"P",{"data-svelte-h":!0}),T(Q)!=="svelte-1ltttkj"&&(Q.textContent=fe),ae=n(e),g=M(e,"UL",{"data-svelte-h":!0}),T(g)!=="svelte-1uuma5m"&&(g.innerHTML=Ce),ne=n(e),p(B.$$.fragment,e),ie=n(e),p(E.$$.fragment,e),Me=n(e),A=M(e,"P",{"data-svelte-h":!0}),T(A)!=="svelte-1d05yau"&&(A.textContent=Ie),re=n(e),R=M(e,"UL",{"data-svelte-h":!0}),T(R)!=="svelte-1w2oslr"&&(R.innerHTML=ke),pe=n(e),p(Z.$$.fragment,e),me=n(e),p(W.$$.fragment,e),oe=n(e),z=M(e,"P",{"data-svelte-h":!0}),T(z)!=="svelte-cvnv0k"&&(z.textContent=$e),ye=n(e),v=M(e,"UL",{"data-svelte-h":!0}),T(v)!=="svelte-9u33gj"&&(v.innerHTML=Qe),we=n(e),p(x.$$.fragment,e),Te=n(e),p(L.$$.fragment,e),ce=n(e),X=M(e,"P",{}),ge(X).forEach(t),this.h()},h(){Be(c,"name","hf:doc:metadata"),Be(c,"content",Se)},m(e,l){ve(document.head,c),s(e,F,l),s(e,S,l),s(e,H,l),m(J,e,l),s(e,Y,l),m(U,e,l),s(e,D,l),s(e,u,l),s(e,V,l),m(j,e,l),s(e,_,l),s(e,h,l),s(e,P,l),s(e,d,l),s(e,q,l),m(b,e,l),s(e,O,l),m(f,e,l),s(e,K,l),s(e,C,l),s(e,ee,l),s(e,I,l),s(e,le,l),m(k,e,l),s(e,te,l),m($,e,l),s(e,se,l),s(e,Q,l),s(e,ae,l),s(e,g,l),s(e,ne,l),m(B,e,l),s(e,ie,l),m(E,e,l),s(e,Me,l),s(e,A,l),s(e,re,l),s(e,R,l),s(e,pe,l),m(Z,e,l),s(e,me,l),m(W,e,l),s(e,oe,l),s(e,z,l),s(e,ye,l),s(e,v,l),s(e,we,l),m(x,e,l),s(e,Te,l),m(L,e,l),s(e,ce,l),s(e,X,l),Je=!0},p:Ae,i(e){Je||(o(J.$$.fragment,e),o(U.$$.fragment,e),o(j.$$.fragment,e),o(b.$$.fragment,e),o(f.$$.fragment,e),o(k.$$.fragment,e),o($.$$.fragment,e),o(B.$$.fragment,e),o(E.$$.fragment,e),o(Z.$$.fragment,e),o(W.$$.fragment,e),o(x.$$.fragment,e),o(L.$$.fragment,e),Je=!0)},o(e){y(J.$$.fragment,e),y(U.$$.fragment,e),y(j.$$.fragment,e),y(b.$$.fragment,e),y(f.$$.fragment,e),y(k.$$.fragment,e),y($.$$.fragment,e),y(B.$$.fragment,e),y(E.$$.fragment,e),y(Z.$$.fragment,e),y(W.$$.fragment,e),y(x.$$.fragment,e),y(L.$$.fragment,e),Je=!1},d(e){e&&(t(F),t(S),t(H),t(Y),t(D),t(u),t(V),t(_),t(h),t(P),t(d),t(q),t(O),t(K),t(C),t(ee),t(I),t(le),t(te),t(se),t(Q),t(ae),t(g),t(ne),t(ie),t(Me),t(A),t(re),t(R),t(pe),t(me),t(oe),t(z),t(ye),t(v),t(we),t(Te),t(ce),t(X)),t(c),w(J,e),w(U,e),w(j,e),w(b,e),w(f,e),w(k,e),w($,e),w(B,e),w(E,e),w(Z,e),w(W,e),w(x,e),w(L,e)}}}const Se='{"title":"Papers, related resources & how to cite","local":"papers-related-resources--how-to-cite","sections":[{"title":"SpQR: A Sparse-Quantized Representation for Near-Lossless LLM Weight Compression (Jun 2023)","local":"spqr-a-sparse-quantized-representation-for-near-lossless-llm-weight-compression-jun-2023","sections":[],"depth":2},{"title":"QLoRA: Efficient Finetuning of Quantized LLMs (May 2023)","local":"qlora-efficient-finetuning-of-quantized-llms-may-2023","sections":[],"depth":2},{"title":"The case for 4-bit precision: k-bit Inference Scaling Laws (Dec 2022)","local":"the-case-for-4-bit-precision-k-bit-inference-scaling-laws-dec-2022","sections":[],"depth":2},{"title":"LLM.int8(): 8-bit Matrix Multiplication for Transformers at Scale (Nov 2022)","local":"llm-int8","sections":[],"depth":2},{"title":"8-bit Optimizers via Block-wise Quantization (Oct 2021)","local":"8-bit-optimizers-via-block-wise-quantization-oct-2021","sections":[],"depth":2}],"depth":1}';function Xe(Ue){return Re(()=>{new URLSearchParams(window.location.search).get("fw")}),[]}class De extends Ze{constructor(c){super(),We(this,c,Xe,Ne,Ee,{})}}export{De as component}; | |
Xet Storage Details
- Size:
- 16.7 kB
- Xet hash:
- 45fa63f77e3024664c05ca08051e13caa7b7148ebff2e722459d206f1f21d8cb
·
Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.