Buckets:

rtrm's picture
download
raw
45 kB
import{s as Al,o as Bl,n as ze}from"../chunks/scheduler.37c15a92.js";import{S as ql,i as Ll,g as M,s,r as p,A as Nl,h as u,f as l,c as a,j as Yl,u as o,x as d,k as Fl,y as Pl,a as n,v as c,d as m,t as f,w as $}from"../chunks/index.2bf4358c.js";import{T as Xe}from"../chunks/Tip.363c041f.js";import{Y as Sl}from"../chunks/Youtube.1e50a667.js";import{C as y}from"../chunks/CodeBlock.4e987730.js";import{C as Dl}from"../chunks/CourseFloatingBanner.9ff4c771.js";import{Q as Ye}from"../chunks/Question.668688bc.js";import{F as Kl}from"../chunks/FrameworkSwitchCourse.8d4d4ab6.js";import{H as h,E as Ol}from"../chunks/getInferenceSnippets.24b50994.js";function en(J){let r,T='๐Ÿ“š <strong>ํ›ˆ๋ จ ๋ฆฌ์†Œ์Šค</strong>: ํ›ˆ๋ จ์„ ์‹œ์ž‘ํ•˜๊ธฐ ์ „์— ํฌ๊ด„์ ์ธ <a href="https://huggingface.co/docs/transformers/main/en/training" rel="nofollow">๐Ÿค— Transformers ํ›ˆ๋ จ ๊ฐ€์ด๋“œ</a>๋ฅผ ์ˆ™์ง€ํ•˜๊ณ  <a href="https://huggingface.co/learn/cookbook/en/fine_tuning_code_llm_on_single_gpu" rel="nofollow">๋ฏธ์„ธ ์กฐ์ • ์ฟก๋ถ</a>์˜ ์‹ค์šฉ์ ์ธ ์˜ˆ์ œ๋ฅผ ์‚ดํŽด๋ณด์„ธ์š”.';return{c(){r=M("p"),r.innerHTML=T},l(i){r=u(i,"P",{"data-svelte-h":!0}),d(r)!=="svelte-1d8z8sh"&&(r.innerHTML=T)},m(i,g){n(i,r,g)},p:ze,d(i){i&&l(r)}}}function tn(J){let r,T='๐Ÿš€ <strong>๊ณ ๊ธ‰ ์„ค์ •</strong>: ์‚ฌ์šฉ ๊ฐ€๋Šฅํ•œ ๋ชจ๋“  ํ›ˆ๋ จ ์ธ์ˆ˜์™€ ์ตœ์ ํ™” ์ „๋žต์— ๋Œ€ํ•œ ์ž์„ธํ•œ ์ •๋ณด๋Š” <a href="https://huggingface.co/docs/transformers/main/en/main_classes/trainer#transformers.TrainingArguments" rel="nofollow">TrainingArguments ๋ฌธ์„œ</a>์™€ <a href="https://huggingface.co/learn/cookbook/en/fine_tuning_code_llm_on_single_gpu" rel="nofollow">ํ›ˆ๋ จ ๊ตฌ์„ฑ ์ฟก๋ถ</a>์„ ์ฐธ๊ณ ํ•˜์„ธ์š”.';return{c(){r=M("p"),r.innerHTML=T},l(i){r=u(i,"P",{"data-svelte-h":!0}),d(r)!=="svelte-oywe3r"&&(r.innerHTML=T)},m(i,g){n(i,r,g)},p:ze,d(i){i&&l(r)}}}function ln(J){let r,T='๐Ÿ“– <strong>๋” ์ž์„ธํžˆ ์•Œ์•„๋ณด๊ธฐ</strong>: Trainer ํด๋ž˜์Šค์™€ ๊ทธ ๋งค๊ฐœ๋ณ€์ˆ˜์— ๋Œ€ํ•œ ์ž์„ธํ•œ ๋‚ด์šฉ์€ <a href="https://huggingface.co/docs/transformers/main/en/main_classes/trainer" rel="nofollow">Trainer API ๋ฌธ์„œ</a>๋ฅผ ๋ฐฉ๋ฌธํ•˜๊ณ  <a href="https://huggingface.co/learn/cookbook/en/fine_tuning_code_llm_on_single_gpu" rel="nofollow">ํ›ˆ๋ จ ์ฟก๋ถ ๋ ˆ์‹œํ”ผ</a>์—์„œ ๊ณ ๊ธ‰ ์‚ฌ์šฉ ํŒจํ„ด์„ ์‚ดํŽด๋ณด์„ธ์š”.';return{c(){r=M("p"),r.innerHTML=T},l(i){r=u(i,"P",{"data-svelte-h":!0}),d(r)!=="svelte-1vnjsqm"&&(r.innerHTML=T)},m(i,g){n(i,r,g)},p:ze,d(i){i&&l(r)}}}function nn(J){let r,T='๋‹ค์–‘ํ•œ ํ‰๊ฐ€ ๋ฉ”ํŠธ๋ฆญ๊ณผ ์ „๋žต์— ๋Œ€ํ•ด ์•Œ์•„๋ณด๋ ค๋ฉด <a href="https://huggingface.co/docs/evaluate/" rel="nofollow">๐Ÿค— Evaluate ๋ฌธ์„œ</a>๋ฅผ ์ฐธ๊ณ ํ•˜์„ธ์š”.';return{c(){r=M("p"),r.innerHTML=T},l(i){r=u(i,"P",{"data-svelte-h":!0}),d(r)!=="svelte-3mjkop"&&(r.innerHTML=T)},m(i,g){n(i,r,g)},p:ze,d(i){i&&l(r)}}}function sn(J){let r,T='๐ŸŽฏ <strong>์„ฑ๋Šฅ ์ตœ์ ํ™”</strong>: ๋ถ„์‚ฐ ํ›ˆ๋ จ, ๋ฉ”๋ชจ๋ฆฌ ์ตœ์ ํ™”, ํ•˜๋“œ์›จ์–ด๋ณ„ ์ตœ์ ํ™”๋ฅผ ํฌํ•จํ•œ ๊ณ ๊ธ‰ ํ›ˆ๋ จ ๊ธฐ์ˆ ์— ๋Œ€ํ•ด์„œ๋Š” <a href="https://huggingface.co/docs/transformers/main/en/performance" rel="nofollow">๐Ÿค— Transformers ์„ฑ๋Šฅ ๊ฐ€์ด๋“œ</a>๋ฅผ ์‚ดํŽด๋ณด์„ธ์š”.';return{c(){r=M("p"),r.innerHTML=T},l(i){r=u(i,"P",{"data-svelte-h":!0}),d(r)!=="svelte-1avfr8p"&&(r.innerHTML=T)},m(i,g){n(i,r,g)},p:ze,d(i){i&&l(r)}}}function an(J){let r,T='๐Ÿ“ <strong>๋” ๋งŽ์€ ์˜ˆ์ œ</strong>: <a href="https://huggingface.co/docs/transformers/main/en/notebooks" rel="nofollow">๐Ÿค— Transformers ๋…ธํŠธ๋ถ</a>์— ์žˆ๋Š” ๋ฐฉ๋Œ€ํ•œ ์ž๋ฃŒ๋ฅผ ํ™•์ธํ•ด ๋ณด์„ธ์š”.';return{c(){r=M("p"),r.innerHTML=T},l(i){r=u(i,"P",{"data-svelte-h":!0}),d(r)!=="svelte-1j34o6j"&&(r.innerHTML=T)},m(i,g){n(i,r,g)},p:ze,d(i){i&&l(r)}}}function rn(J){let r,T="๐Ÿ’ก <strong>ํ•ต์‹ฌ ์š”์ :</strong>",i,g,w="<li><code>Trainer</code> API๋Š” ๋Œ€๋ถ€๋ถ„์˜ ํ›ˆ๋ จ ๋ณต์žก์„ฑ์„ ์ฒ˜๋ฆฌํ•˜๋Š” ๋†’์€ ์ˆ˜์ค€์˜ ์ธํ„ฐํŽ˜์ด์Šค๋ฅผ ์ œ๊ณตํ•ฉ๋‹ˆ๋‹ค.</li> <li><code>processing_class</code>๋Š” ์ ์ ˆํ•œ ๋ฐ์ดํ„ฐ ์ฒ˜๋ฆฌ๋ฅผ ์œ„ํ•ด ํ† ํฌ๋‚˜์ด์ €๋ฅผ ์ €์žฅํ•˜๋Š” ๋ฐ ์‚ฌ์šฉ๋ฉ๋‹ˆ๋‹ค.</li> <li><code>TrainingArguments</code>๋Š” ํ•™์Šต๋ฅ , ๋ฐฐ์น˜ ํฌ๊ธฐ, ํ‰๊ฐ€ ์ „๋žต, ์ตœ์ ํ™” ๋“ฑ ํ›ˆ๋ จ์˜ ๋ชจ๋“  ์ธก๋ฉด์„ ์ œ์–ดํ•ฉ๋‹ˆ๋‹ค.</li> <li><code>compute_metrics</code>๋ฅผ ์‚ฌ์šฉํ•˜๋ฉด ํ›ˆ๋ จ ์†์‹ค ์™ธ์— ์‚ฌ์šฉ์ž ์ •์˜ ํ‰๊ฐ€ ๋ฉ”ํŠธ๋ฆญ์„ ํ™œ์šฉํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค.</li> <li>ํ˜ผํ•ฉ ์ •๋ฐ€๋„(<code>fp16=True</code>)์™€ ๊ทธ๋ ˆ์ด๋””์–ธํŠธ ๋ˆ„์ ๊ณผ ๊ฐ™์€ ์ตœ์‹  ๊ธฐ๋Šฅ์€ ํ›ˆ๋ จ ํšจ์œจ์„ฑ์„ ํฌ๊ฒŒ ํ–ฅ์ƒ์‹œํ‚ฌ ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค.</li>";return{c(){r=M("p"),r.innerHTML=T,i=s(),g=M("ul"),g.innerHTML=w},l(U){r=u(U,"P",{"data-svelte-h":!0}),d(r)!=="svelte-3aouuq"&&(r.innerHTML=T),i=a(U),g=u(U,"UL",{"data-svelte-h":!0}),d(g)!=="svelte-56lnro"&&(g.innerHTML=w)},m(U,b){n(U,r,b),n(U,i,b),n(U,g,b)},p:ze,d(U){U&&(l(r),l(i),l(g))}}}function pn(J){let r,T,i,g,w,U,b,Ae,H,Be,W,qe,G,il='๐Ÿค— Transformers๋Š” <code>Trainer</code> ํด๋ž˜์Šค๋ฅผ ์ œ๊ณตํ•ฉ๋‹ˆ๋‹ค. ์ด ํด๋ž˜์Šค๋ฅผ ์‚ฌ์šฉํ•˜๋ฉด ์‚ฌ์ „ ํ•™์Šต๋œ ๋ชจ๋ธ์„ ์—ฌ๋Ÿฌ๋ถ„์˜ ๋ฐ์ดํ„ฐ์…‹์— ๋งž์ถฐ ์ตœ์‹  ๊ธฐ๋ฒ•์œผ๋กœ ์‰ฝ๊ฒŒ ๋ฏธ์„ธ ์กฐ์ •ํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค. ์ด์ „ ์„น์…˜์—์„œ ๋ฐ์ดํ„ฐ ์ „์ฒ˜๋ฆฌ ์ž‘์—…์„ ๋ชจ๋‘ ๋งˆ์ณค๋‹ค๋ฉด ์ด์ œ ๋ช‡ ๋‹จ๊ณ„๋งŒ ๊ฑฐ์น˜๋ฉด <code>Trainer</code>๋ฅผ ์ •์˜ํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค. ๊ฐ€์žฅ ์–ด๋ ค์šด ๋ถ€๋ถ„์€ <code>Trainer.train()</code>์„ ์‹คํ–‰ํ•  ํ™˜๊ฒฝ์„ ์ค€๋น„ํ•˜๋Š” ๊ณผ์ •์ผ ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค. ์ด ์ž‘์—…์€ CPU์—์„œ ๋งค์šฐ ๋А๋ฆฌ๊ฒŒ ์‹คํ–‰๋˜๊ธฐ ๋•Œ๋ฌธ์ž…๋‹ˆ๋‹ค. ๋งŒ์•ฝ GPU๊ฐ€ ์—†๋‹ค๋ฉด <a href="https://colab.research.google.com/" rel="nofollow">Google Colab</a>์—์„œ ๋ฌด๋ฃŒ๋กœ ์ œ๊ณตํ•˜๋Š” GPU๋‚˜ TPU๋ฅผ ์ด์šฉํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค.',Le,_,Ne,I,pl="์•„๋ž˜ ์ฝ”๋“œ ์˜ˆ์‹œ๋Š” ์ด์ „ ์„น์…˜์˜ ์ฝ”๋“œ๋ฅผ ๋ชจ๋‘ ์‹คํ–‰ํ–ˆ๋‹ค๋Š” ๊ฐ€์ •ํ•˜์— ์ž‘๋™ํ•ฉ๋‹ˆ๋‹ค. ์ฆ‰, ๋‹ค์Œ ์‚ฌํ•ญ๋“ค์ด ํ•„์š”ํ•ฉ๋‹ˆ๋‹ค.",Pe,Z,Se,E,De,Q,ol="<code>Trainer</code>๋ฅผ ์ •์˜ํ•˜๊ธฐ ์ „ ์ฒซ ๋ฒˆ์งธ ๋‹จ๊ณ„๋Š” <code>Trainer</code>๊ฐ€ ํ›ˆ๋ จ ๋ฐ ํ‰๊ฐ€์— ์‚ฌ์šฉํ•  ๋ชจ๋“  ํ•˜์ดํผํŒŒ๋ผ๋ฏธํ„ฐ๋ฅผ ๋‹ด์„<code>TrainingArguments</code> ํด๋ž˜์Šค๋ฅผ ์ •์˜ํ•˜๋Š” ๊ฒƒ์ž…๋‹ˆ๋‹ค. ํ•„์ˆ˜๋กœ ์ œ๊ณตํ•ด์•ผ ํ•˜๋Š” ์œ ์ผํ•œ ์ธ์ˆ˜๋Š” ํ›ˆ๋ จ๋œ ๋ชจ๋ธ๊ณผ ์ค‘๊ฐ„ ์ฒดํฌํฌ์ธํŠธ๊ฐ€ ์ €์žฅ๋  ๋””๋ ‰ํ† ๋ฆฌ์ž…๋‹ˆ๋‹ค. ๋‚˜๋จธ์ง€๋Š” ๊ธฐ๋ณธ๊ฐ’์œผ๋กœ ๋‘˜ ์ˆ˜ ์žˆ์œผ๋ฉฐ, ๊ธฐ๋ณธ์ ์ธ ๋ฏธ์„ธ ์กฐ์ • ์ž‘์—…์—๋Š” ์ถฉ๋ถ„ํ•œ ์„ค์ •์ž…๋‹ˆ๋‹ค.",Ke,V,Oe,X,cl='ํ›ˆ๋ จ ์ค‘์— ๋ชจ๋ธ์„ Hub์— ์ž๋™์œผ๋กœ ์—…๋กœ๋“œํ•˜๋ ค๋ฉด <code>TrainingArguments</code>์—์„œ <code>push_to_hub=True</code>๋ฅผ ์ „๋‹ฌํ•˜์„ธ์š”. ์ด ๊ธฐ๋Šฅ์— ๋Œ€ํ•ด์„œ๋Š” <a href="/course/chapter4/3">Chapter 4</a>์—์„œ ์ž์„ธํžˆ ์•Œ์•„๋ณด๊ฒ ์Šต๋‹ˆ๋‹ค.',et,j,tt,z,ml='๋‘ ๋ฒˆ์งธ ๋‹จ๊ณ„๋Š” ๋ชจ๋ธ์„ ์ •์˜ํ•˜๋Š” ๊ฒƒ์ž…๋‹ˆ๋‹ค. <a href="/course/chapter2">์ด์ „ ์ฑ•ํ„ฐ</a>์—์„œ์™€ ๊ฐ™์ด ๋‘ ๊ฐœ์˜ ๋ผ๋ฒจ๊ณผ ํ•จ๊ป˜ <code>AutoModelForSequenceClassification</code> ํด๋ž˜์Šค๋ฅผ ์‚ฌ์šฉํ•˜๊ฒ ์Šต๋‹ˆ๋‹ค.',lt,Y,nt,F,fl='<a href="/course/chapter2">Chapter 2</a>์™€ ๋‹ฌ๋ฆฌ ์ด ์‚ฌ์ „ ํ›ˆ๋ จ๋œ ๋ชจ๋ธ์„ ์ธ์Šคํ„ด์Šคํ™”ํ•˜๋ฉด ๊ฒฝ๊ณ  ๋ฉ”์‹œ์ง€๊ฐ€ ๋‚˜ํƒ€๋‚˜๋Š” ๊ฒƒ์„ ํ™•์ธํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค. ์ด๋Š” BERT๊ฐ€ ๋ฌธ์žฅ ์Œ ๋ถ„๋ฅ˜๋ฅผ ์œ„ํ•ด ์‚ฌ์ „ ํ›ˆ๋ จ๋˜์ง€ ์•Š์•˜๊ธฐ ๋•Œ๋ฌธ์—, ์‚ฌ์ „ ํ›ˆ๋ จ๋œ ๋ชจ๋ธ์˜ ํ—ค๋“œ๊ฐ€ ์ œ๊ฑฐ๋˜๊ณ  ์‹œํ€€์Šค ๋ถ„๋ฅ˜์— ์ ํ•ฉํ•œ ์ƒˆ๋กœ์šด ํ—ค๋“œ๊ฐ€ ์ถ”๊ฐ€๋˜์—ˆ๊ธฐ ๋•Œ๋ฌธ์ž…๋‹ˆ๋‹ค. ๊ฒฝ๊ณ ๋Š” ์ผ๋ถ€ ๊ฐ€์ค‘์น˜(์ œ๊ฑฐ๋œ ์‚ฌ์ „ ํ›ˆ๋ จ ํ—ค๋“œ์— ํ•ด๋‹นํ•˜๋Š” ๊ฐ€์ค‘์น˜)๊ฐ€ ์‚ฌ์šฉ๋˜์ง€ ์•Š์•˜๊ณ , ์ผ๋ถ€ ๋‹ค๋ฅธ ๊ฐ€์ค‘์น˜(์ƒˆ๋กœ์šด ํ—ค๋“œ์šฉ)๊ฐ€ ๋ฌด์ž‘์œ„๋กœ ์ดˆ๊ธฐํ™”๋˜์—ˆ๋‹ค๋Š” ๊ฒƒ์„ ๋‚˜ํƒ€๋ƒ…๋‹ˆ๋‹ค. ๋งˆ์ง€๋ง‰์œผ๋กœ ๋ชจ๋ธ์„ ํ›ˆ๋ จ์‹œํ‚ค๋ผ๋Š” ๋ฉ”์‹œ์ง€๊ฐ€ ๋‚˜์˜ค๋Š”๋ฐ, ๋ฐ”๋กœ ์ง€๊ธˆ๋ถ€ํ„ฐ ๊ทธ ์ž‘์—…์„ ์‹œ์ž‘ํ•˜๊ฒ ์Šต๋‹ˆ๋‹ค.',st,A,$l="๋ชจ๋ธ์ด ์ค€๋น„๋˜๋ฉด, ์ง€๊ธˆ๊นŒ์ง€ ๊ตฌ์„ฑํ•œ ๋ชจ๋“  ๊ฐ์ฒด(<code>model</code>, <code>training_args</code>, ํ›ˆ๋ จ ๋ฐ ๊ฒ€์ฆ ๋ฐ์ดํ„ฐ์…‹, <code>data_collator</code>, <code>processing_class</code>)๋ฅผ ์ „๋‹ฌํ•˜์—ฌ <code>Trainer</code>๋ฅผ ์ •์˜ํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค. <code>processing_class</code> ๋งค๊ฐœ๋ณ€์ˆ˜๋Š” ๋น„๊ต์  ์ตœ๊ทผ์— ์ถ”๊ฐ€๋œ ๊ธฐ๋Šฅ์œผ๋กœ, <code>Trainer</code>์—๊ฒŒ ์–ด๋–ค ํ† ํฌ๋‚˜์ด์ €๋ฅผ ์‚ฌ์šฉํ•ด ๋ฐ์ดํ„ฐ๋ฅผ ์ฒ˜๋ฆฌํ• ์ง€ ์•Œ๋ ค์ค๋‹ˆ๋‹ค.",at,B,rt,q,Ml="<code>processing_class</code>์— ํ† ํฌ๋‚˜์ด์ €๋ฅผ ์ „๋‹ฌํ•˜๋ฉด, <code>Trainer</code>๊ฐ€ ๊ธฐ๋ณธ์ ์œผ๋กœ <code>DataCollatorWithPadding</code>์„ <code>data_collator</code>๋กœ ์‚ฌ์šฉํ•ฉ๋‹ˆ๋‹ค. ๋”ฐ๋ผ์„œ ์ด ๊ฒฝ์šฐ์—๋Š” <code>data_collator=data_collator</code> ์ค„์„ ์ƒ๋žตํ•  ์ˆ˜ ์žˆ์ง€๋งŒ, ๋ฐ์ดํ„ฐ ์ฒ˜๋ฆฌ ํŒŒ์ดํ”„๋ผ์ธ์˜ ์ค‘์š”ํ•œ ๋ถ€๋ถ„์„ ๋ณด์—ฌ๋“œ๋ฆฌ๊ธฐ ์œ„ํ•ด ์ฝ”๋“œ์— ํฌํ•จํ–ˆ์Šต๋‹ˆ๋‹ค.",it,C,pt,L,ul="๋ฐ์ดํ„ฐ์…‹์—์„œ ๋ชจ๋ธ์„ ๋ฏธ์„ธ ์กฐ์ •ํ•˜๋ ค๋ฉด <code>Trainer</code>์˜ <code>train()</code> ๋ฉ”์†Œ๋“œ๋ฅผ ํ˜ธ์ถœํ•˜๊ธฐ๋งŒ ํ•˜๋ฉด ๋ฉ๋‹ˆ๋‹ค.",ot,N,ct,P,dl="์ด๋ ‡๊ฒŒ ํ•˜๋ฉด ๋ฏธ์„ธ ์กฐ์ •์ด ์‹œ์ž‘๋ฉ๋‹ˆ๋‹ค(GPU์—์„œ๋Š” ๋ช‡ ๋ถ„ ์ •๋„ ์†Œ์š”๋ฉ๋‹ˆ๋‹ค). 500๋‹จ๊ณ„๋งˆ๋‹ค ํ›ˆ๋ จ ์†์‹ค์ด ์ถœ๋ ฅ๋˜์ง€๋งŒ, ๋ชจ๋ธ์˜ ์„ฑ๋Šฅ์ด ์–ผ๋งˆ๋‚˜ ์ข‹์€์ง€(๋˜๋Š” ๋‚˜์œ์ง€)๋Š” ์•Œ๋ ค์ฃผ์ง€ ์•Š์Šต๋‹ˆ๋‹ค. ๊ทธ ์ด์œ ๋Š” ๋‹ค์Œ๊ณผ ๊ฐ™์Šต๋‹ˆ๋‹ค.",mt,S,Tl="<li><code>TrainingArguments</code>์—์„œ <code>eval_strategy</code>๋ฅผ <code>&quot;steps&quot;</code> (๋งค <code>eval_steps</code>๋งˆ๋‹ค ํ‰๊ฐ€) ๋˜๋Š” <code>&quot;epoch&quot;</code> (๊ฐ ์—ํฌํฌ ์ข…๋ฃŒ ์‹œ ํ‰๊ฐ€)๋กœ ์„ค์ •ํ•˜์ง€ ์•Š์•˜์Šต๋‹ˆ๋‹ค.</li> <li>ํ‰๊ฐ€ ์ค‘์— ๋ฉ”ํŠธ๋ฆญ์„ ๊ณ„์‚ฐํ•˜๊ธฐ ์œ„ํ•œ <code>compute_metrics()</code> ํ•จ์ˆ˜๋ฅผ <code>Trainer</code>์— ์ œ๊ณตํ•˜์ง€ ์•Š์•˜์Šต๋‹ˆ๋‹ค. ์ด ํ•จ์ˆ˜๊ฐ€ ์—†์œผ๋ฉด ํ‰๊ฐ€์—์„œ ์†์‹ค ๊ฐ’๋งŒ ์ถœ๋ ฅ๋˜๋Š”๋ฐ, ์ด ๊ฐ’๋งŒ์œผ๋กœ๋Š” ์„ฑ๋Šฅ์„ ํŒŒ์•…ํ•˜๊ธฐ ์–ด๋ ต์Šต๋‹ˆ๋‹ค.</li>",ft,D,$t,K,gl="์ด์ œ ์œ ์šฉํ•œ <code>compute_metrics()</code> ํ•จ์ˆ˜๋ฅผ ์–ด๋–ป๊ฒŒ ๋งŒ๋“ค๊ณ  ๋‹ค์Œ ํ›ˆ๋ จ ์‹œ ์‚ฌ์šฉํ•  ์ˆ˜ ์žˆ๋Š”์ง€ ์•Œ์•„๋ณด๊ฒ ์Šต๋‹ˆ๋‹ค. ์ด ํ•จ์ˆ˜๋Š” <code>EvalPrediction</code> ๊ฐ์ฒด(<code>predictions</code> ํ•„๋“œ์™€ <code>label_ids</code> ํ•„๋“œ๋ฅผ ๊ฐ–๋Š” ๋ช…๋ช…๋œ ํŠœํ”Œ)๋ฅผ ์ž…๋ ฅ๋ฐ›์Šต๋‹ˆ๋‹ค. ๊ทธ๋ฆฌ๊ณ  ๊ฐ ๋ฉ”ํŠธ๋ฆญ์˜ ์ด๋ฆ„์„ ํ‚ค(๋ฌธ์ž์—ด)๋กœ, ์„ฑ๋Šฅ์„ ๊ฐ’(๋ถ€๋™์†Œ์ˆ˜์ )์œผ๋กœ ๊ฐ–๋Š” ๋”•์…”๋„ˆ๋ฆฌ๋ฅผ ๋ฐ˜ํ™˜ํ•ด์•ผ ํ•ฉ๋‹ˆ๋‹ค. ๋ชจ๋ธ์˜ ์˜ˆ์ธก๊ฐ’์„ ์–ป๊ธฐ ์œ„ํ•ด <code>Trainer.predict()</code>๋ฅผ ์‚ฌ์šฉํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค.",Mt,O,ut,ee,dt,te,Jl="<code>predict()</code> ๋ฉ”์†Œ๋“œ์˜ ์ถœ๋ ฅ์€ <code>predictions</code>, <code>label_ids</code>, <code>metrics</code> ์„ธ ๊ฐœ์˜ ํ•„๋“œ๊ฐ€ ์žˆ๋Š” ๋˜ ๋‹ค๋ฅธ ๋ช…๋ช…๋œ ํŠœํ”Œ์ž…๋‹ˆ๋‹ค. <code>metrics</code> ํ•„๋“œ์—๋Š” ์ „๋‹ฌ๋œ ๋ฐ์ดํ„ฐ์…‹์— ๋Œ€ํ•œ ์†์‹ค ๊ฐ’๊ณผ ์‹œ๊ฐ„ ๊ด€๋ จ ๋ฉ”ํŠธ๋ฆญ(์ด ์˜ˆ์ธก ์‹œ๊ฐ„, ํ‰๊ท  ์˜ˆ์ธก ์‹œ๊ฐ„)๋งŒ ํฌํ•จ๋ฉ๋‹ˆ๋‹ค. ํ•˜์ง€๋งŒ <code>compute_metrics()</code> ํ•จ์ˆ˜๋ฅผ ์™„์„ฑํ•˜์—ฌ <code>Trainer</code>์— ์ „๋‹ฌํ•˜๋ฉด, ์ด ํ•„๋“œ์— <code>compute_metrics()</code>๊ฐ€ ๋ฐ˜ํ™˜ํ•˜๋Š” ๋ฉ”ํŠธ๋ฆญ๋“ค๋„ ํ•จ๊ป˜ ํฌํ•จ๋ฉ๋‹ˆ๋‹ค.",Tt,le,yl='๋ณด์‹œ๋‹ค์‹œํ”ผ, <code>predictions</code>๋Š” 408 x 2 ๋ชจ์–‘์˜ 2์ฐจ์› ๋ฐฐ์—ด์ž…๋‹ˆ๋‹ค (408์€ predict()์— ์ „๋‹ฌํ•œ ๋ฐ์ดํ„ฐ์…‹์˜ ์ƒ˜ํ”Œ ๊ฐœ์ˆ˜์ž…๋‹ˆ๋‹ค). ์ด ๊ฐ’๋“ค์€ <code>predict()</code>์— ์ „๋‹ฌํ•œ ๋ฐ์ดํ„ฐ์…‹์˜ ๊ฐ ์ƒ˜ํ”Œ์— ๋Œ€ํ•œ ๋กœ์ง“์ž…๋‹ˆ๋‹ค (<a href="/course/chapter2">์ด์ „ ์ฑ•ํ„ฐ</a>์—์„œ ๋ณด์•˜๋“ฏ์ด ๋ชจ๋“  Transformer ๋ชจ๋ธ์€ ๋กœ์ง“์„ ๋ฐ˜ํ™˜ํ•ฉ๋‹ˆ๋‹ค). ์ด ๋กœ์ง“์„ ์šฐ๋ฆฌ๊ฐ€ ๊ฐ€์ง„ ๋ ˆ์ด๋ธ”๊ณผ ๋น„๊ตํ•  ์ˆ˜ ์žˆ๋Š” ์˜ˆ์ธก๊ฐ’์œผ๋กœ ๋ณ€ํ™˜ํ•˜๋ ค๋ฉด, ๋‘ ๋ฒˆ์งธ ์ถ•์—์„œ ์ตœ๋Œ“๊ฐ’์„ ๊ฐ€์ง„ ์ธ๋ฑ์Šค๋ฅผ ๊ตฌํ•ด์•ผ ํ•ฉ๋‹ˆ๋‹ค.',gt,ne,Jt,se,Ul='์ด์ œ ์ด <code>preds</code>๋ฅผ ๋ผ๋ฒจ๊ณผ ๋น„๊ตํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค. <code>compute_metric()</code> ํ•จ์ˆ˜๋ฅผ ๋นŒ๋“œํ•˜๊ธฐ ์œ„ํ•ด ๐Ÿค— <a href="https://github.com/huggingface/evaluate/" rel="nofollow">Evaluate</a> ๋ผ์ด๋ธŒ๋Ÿฌ๋ฆฌ์˜ ๋ฉ”ํŠธ๋ฆญ์„ ํ™œ์šฉํ•˜๊ฒ ์Šต๋‹ˆ๋‹ค. ๋ฐ์ดํ„ฐ์…‹์„ ๋กœ๋“œํ–ˆ๋˜ ๊ฒƒ์ฒ˜๋Ÿผ, MRPC ๋ฐ์ดํ„ฐ์…‹๊ณผ ๊ด€๋ จ๋œ ๋ฉ”ํŠธ๋ฆญ๋„ <code>evaluate.load()</code> ํ•จ์ˆ˜๋กœ ์‰ฝ๊ฒŒ ๋กœ๋“œํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค. ๋ฐ˜ํ™˜๋œ ๊ฐ์ฒด์˜ <code>compute()</code> ๋ฉ”์„œ๋“œ๋ฅผ ์‚ฌ์šฉํ•ด ๋ฉ”ํŠธ๋ฆญ์„ ๊ณ„์‚ฐํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค.',yt,ae,Ut,re,wt,v,bt,ie,wl='๋ชจ๋ธ ํ—ค๋“œ์˜ ๊ฐ€์ค‘์น˜๊ฐ€ ๋ฌด์ž‘์œ„๋กœ ์ดˆ๊ธฐํ™”๋˜๊ธฐ ๋•Œ๋ฌธ์— ์–ป๊ฒŒ ๋˜๋Š” ๊ฒฐ๊ณผ๋Š” ์กฐ๊ธˆ์”ฉ ๋‹ค๋ฅผ ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค. ๊ฒฐ๊ณผ๋ฅผ ๋ณด๋ฉด ์šฐ๋ฆฌ ๋ชจ๋ธ์ด ๊ฒ€์ฆ ์„ธํŠธ์—์„œ 85.78%์˜ ์ •ํ™•๋„์™€ 89.97%์˜ F1 ์ ์ˆ˜๋ฅผ ๋‹ฌ์„ฑํ–ˆ์Œ์„ ๋ณผ ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค. ์ด ๋‘ ๊ฐ€์ง€๋Š” GLUE ๋ฒค์น˜๋งˆํฌ์˜ MRPC ๋ฐ์ดํ„ฐ์…‹์—์„œ ๊ฒฐ๊ณผ๋ฅผ ํ‰๊ฐ€ํ•˜๋Š” ๋ฐ ์‚ฌ์šฉ๋˜๋Š” ๋ฉ”ํŠธ๋ฆญ์ž…๋‹ˆ๋‹ค. <a href="https://arxiv.org/pdf/1810.04805.pdf" rel="nofollow">BERT ๋…ผ๋ฌธ</a>์—์„œ๋Š” ๊ธฐ๋ณธ ๋ชจ๋ธ์˜ F1 ์ ์ˆ˜๋ฅผ 88.9๋กœ ๋ณด๊ณ ํ•˜์˜€์Šต๋‹ˆ๋‹ค. ๋‹น์‹œ์—๋Š” <code>uncased</code> ๋ชจ๋ธ์„ ์‚ฌ์šฉํ–ˆ์ง€๋งŒ, ์šฐ๋ฆฌ๋Š” ํ˜„์žฌ <code>cased</code> ๋ชจ๋ธ์„ ์‚ฌ์šฉํ•˜๊ณ  ์žˆ๊ธฐ ๋•Œ๋ฌธ์— ๋” ๋‚˜์€ ๊ฒฐ๊ณผ๊ฐ€ ๋‚˜์˜จ ๊ฒƒ์ž…๋‹ˆ๋‹ค.',ht,pe,bl="์ด ๋ชจ๋“  ๊ฒƒ์„ ์ข…ํ•ฉํ•˜๋ฉด, ๋‹ค์Œ์ฒ˜๋Ÿผ <code>compute_metrics()</code> ํ•จ์ˆ˜๋ฅผ ๋‹ค์Œ๊ณผ ๊ฐ™์ด ์ •์˜ํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค.",_t,oe,jt,ce,hl="๊ฐ ์—ํญ์ด ๋๋‚  ๋•Œ๋งˆ๋‹ค ๋ฉ”ํŠธ๋ฆญ์ด ์ถœ๋ ฅ๋˜๋„๋ก, ์ด <code>compute_metrics()</code> ํ•จ์ˆ˜๊ฐ€ ํฌํ•จํ•˜์—ฌ <code>Trainer</code>๋ฅผ ์ƒˆ๋กœ ์ •์˜ํ•ด ๋ณด๊ฒ ์Šต๋‹ˆ๋‹ค.",Ct,me,vt,fe,_l="์ฐธ๊ณ ๋กœ, ์šฐ๋ฆฌ๋Š” <code>eval_strategy</code>๋ฅผ <code>&quot;epoch&quot;</code>์œผ๋กœ ์„ค์ •ํ•œ ์ƒˆ๋กœ์šด <code>TrainingArguments</code>์™€ ์ƒˆ๋กœ์šด ๋ชจ๋ธ์„ ์ƒ์„ฑํ•ฉ๋‹ˆ๋‹ค. ์ด๋ ‡๊ฒŒ ํ•˜์ง€ ์•Š์œผ๋ฉด ์ด๋ฏธ ํ›ˆ๋ จ๋œ ๋ชจ๋ธ์˜ ํ›ˆ๋ จ์„ ๊ณ„์†ํ•˜๊ฒŒ ๋  ๊ฒ๋‹ˆ๋‹ค. ์ƒˆ๋กœ์šด ํ›ˆ๋ จ์„ ์‹œ์ž‘ํ•˜๋ ค๋ฉด ๋‹ค์Œ์„ ์‹คํ–‰ํ•˜์„ธ์š”.",kt,$e,Rt,Me,jl="์ด๋ฒˆ์—๋Š” ํ›ˆ๋ จ ์†์‹ค ์™ธ์—๋„ ๊ฐ ์—ํญ์ด ๋๋‚  ๋•Œ๋งˆ๋‹ค ๊ฒ€์ฆ ์†์‹ค๊ณผ ๋ฉ”ํŠธ๋ฆญ์ด ํ•จ๊ป˜ ์ถœ๋ ฅ๋  ๊ฒ๋‹ˆ๋‹ค. ์•ž์„œ ๋งํ–ˆ๋“ฏ์ด ๋ชจ๋ธ ํ—ค๋“œ์˜ ๋ฌด์ž‘์œ„ ์ดˆ๊ธฐํ™” ๋•Œ๋ฌธ์— ์—ฌ๋Ÿฌ๋ถ„์ด ์–ป๋Š” ์ •ํ™•๋„/F1 ์ ์ˆ˜๋Š” ์šฐ๋ฆฌ๊ฐ€ ์–ป์€ ๊ฒฐ๊ณผ์™€ ์•ฝ๊ฐ„ ๋‹ค๋ฅผ ์ˆ˜ ์žˆ์ง€๋งŒ, ๋น„์Šทํ•œ ๋ฒ”์œ„์— ์žˆ์„ ๊ฒ๋‹ˆ๋‹ค.",xt,ue,Ht,de,Cl="<code>Trainer</code>๋Š” ํ˜„๋Œ€ ๋”ฅ๋Ÿฌ๋‹์˜ ๋ชจ๋ฒ” ์‚ฌ๋ก€๋“ค์„ ์‰ฝ๊ฒŒ ํ™œ์šฉํ•  ์ˆ˜ ์žˆ๋„๋ก ๋‹ค์–‘ํ•œ ๋‚ด์žฅ ๊ธฐ๋Šฅ์„ ์ œ๊ณตํ•ฉ๋‹ˆ๋‹ค.",Wt,Te,vl="<strong>ํ˜ผํ•ฉ ์ •๋ฐ€๋„ ํ›ˆ๋ จ</strong>: ๋” ๋น ๋ฅธ ํ›ˆ๋ จ๊ณผ ๋ฉ”๋ชจ๋ฆฌ ์‚ฌ์šฉ๋Ÿ‰ ๊ฐ์†Œ๋ฅผ ์œ„ํ•ด ํ›ˆ๋ จ ์ธ์ˆ˜์—์„œ <code>fp16=True</code>๋ฅผ ์„ค์ •ํ•˜์„ธ์š”.",Gt,ge,It,Je,kl="<strong>๊ทธ๋ ˆ์ด๋””์–ธํŠธ ๋ˆ„์ </strong>: GPU ๋ฉ”๋ชจ๋ฆฌ๊ฐ€ ๋ถ€์กฑํ•  ๋•Œ ๋” ํฐ ๋ฐฐ์น˜ ํฌ๊ธฐ๋กœ ํ•™์Šตํ•˜๋Š” ํšจ๊ณผ๋ฅผ ๋‚ผ ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค.",Zt,ye,Et,Ue,Rl="<strong>ํ•™์Šต๋ฅ  ์Šค์ผ€์ค„๋ง</strong>: Trainer๋Š” ๊ธฐ๋ณธ์ ์œผ๋กœ ์„ ํ˜• ๊ฐ์†Œ ๋ฐฉ์‹์„ ์‚ฌ์šฉํ•˜์ง€๋งŒ, ์‚ฌ์šฉ์ž ๋งž์ถค ์„ค์ •์ด ๊ฐ€๋Šฅํ•ฉ๋‹ˆ๋‹ค.",Qt,we,Vt,k,Xt,be,xl="<code>Trainer</code>๋Š” ์—ฌ๋Ÿฌ GPU ๋˜๋Š” TPU์—์„œ ์ฆ‰์‹œ ์ž‘๋™ํ•˜๋ฉฐ ๋ถ„์‚ฐ ํ›ˆ๋ จ์„ ์œ„ํ•œ ๋งŽ์€ ์˜ต์…˜์„ ์ œ๊ณตํ•ฉ๋‹ˆ๋‹ค. ์ด์™€ ๊ด€๋ จ๋œ ๋ชจ๋“  ๋‚ด์šฉ์€ Chapter 10์—์„œ ๋‹ค๋ฃจ๊ฒ ์Šต๋‹ˆ๋‹ค.",zt,he,Hl='์ด๊ฒƒ์œผ๋กœ <code>Trainer</code> API๋ฅผ ์‚ฌ์šฉํ•œ ๋ฏธ์„ธ ์กฐ์ • ์†Œ๊ฐœ๋ฅผ ๋งˆ์นฉ๋‹ˆ๋‹ค. ๋Œ€๋ถ€๋ถ„์˜ ์ผ๋ฐ˜์ ์ธ NLP ์ž‘์—…์— ๋Œ€ํ•œ ์˜ˆ์ œ๋Š” <a href="/course/chapter7">Chapter 7</a>์—์„œ ๋‹ค๋ฃฐ ์˜ˆ์ •์ด๋ฉฐ, ๋‹ค์Œ์œผ๋กœ๋Š” ์ˆœ์ˆ˜ PyTorch ์ฝ”๋“œ๋กœ ๋™์ผํ•œ ์ž‘์—…์„ ์ˆ˜ํ–‰ํ•˜๋Š” ๋ฐฉ๋ฒ•์„ ์‚ดํŽด๋ณด๊ฒ ์Šต๋‹ˆ๋‹ค.',Yt,R,Ft,_e,At,je,Wl="Trainer API์™€ ๋ฏธ์„ธ ์กฐ์ • ๊ฐœ๋…์— ๋Œ€ํ•œ ์ดํ•ด๋ฅผ ํ…Œ์ŠคํŠธํ•ด๋ณด์„ธ์š”.",Bt,Ce,qt,ve,Lt,ke,Nt,Re,Pt,xe,St,He,Dt,We,Kt,Ge,Ot,Ie,el,Ze,tl,Ee,ll,Qe,nl,x,sl,Ve,al,Fe,rl;return w=new Kl({props:{fw:J[0]}}),b=new h({props:{title:"Trainer API๋กœ ๋ชจ๋ธ ๋ฏธ์„ธ ์กฐ์ •ํ•˜๊ธฐ",local:"fine-tuning-a-model-with-the-trainer-api",headingTag:"h1"}}),H=new Dl({props:{chapter:3,classNames:"absolute z-10 right-0 top-0",notebooks:[{label:"Google Colab",value:"https://colab.research.google.com/github/huggingface/notebooks/blob/master/course/en/chapter3/section3.ipynb"},{label:"Aws Studio",value:"https://studiolab.sagemaker.aws/import/github/huggingface/notebooks/blob/master/course/en/chapter3/section3.ipynb"}]}}),W=new Sl({props:{id:"nvBXf7s7vTI"}}),_=new Xe({props:{$$slots:{default:[en]},$$scope:{ctx:J}}}),Z=new y({props:{code:"ZnJvbSUyMGRhdGFzZXRzJTIwaW1wb3J0JTIwbG9hZF9kYXRhc2V0JTBBZnJvbSUyMHRyYW5zZm9ybWVycyUyMGltcG9ydCUyMEF1dG9Ub2tlbml6ZXIlMkMlMjBEYXRhQ29sbGF0b3JXaXRoUGFkZGluZyUwQSUwQXJhd19kYXRhc2V0cyUyMCUzRCUyMGxvYWRfZGF0YXNldCglMjJnbHVlJTIyJTJDJTIwJTIybXJwYyUyMiklMEFjaGVja3BvaW50JTIwJTNEJTIwJTIyYmVydC1iYXNlLXVuY2FzZWQlMjIlMEF0b2tlbml6ZXIlMjAlM0QlMjBBdXRvVG9rZW5pemVyLmZyb21fcHJldHJhaW5lZChjaGVja3BvaW50KSUwQSUwQSUwQWRlZiUyMHRva2VuaXplX2Z1bmN0aW9uKGV4YW1wbGUpJTNBJTBBJTIwJTIwJTIwJTIwcmV0dXJuJTIwdG9rZW5pemVyKGV4YW1wbGUlNUIlMjJzZW50ZW5jZTElMjIlNUQlMkMlMjBleGFtcGxlJTVCJTIyc2VudGVuY2UyJTIyJTVEJTJDJTIwdHJ1bmNhdGlvbiUzRFRydWUpJTBBJTBBJTBBdG9rZW5pemVkX2RhdGFzZXRzJTIwJTNEJTIwcmF3X2RhdGFzZXRzLm1hcCh0b2tlbml6ZV9mdW5jdGlvbiUyQyUyMGJhdGNoZWQlM0RUcnVlKSUwQWRhdGFfY29sbGF0b3IlMjAlM0QlMjBEYXRhQ29sbGF0b3JXaXRoUGFkZGluZyh0b2tlbml6ZXIlM0R0b2tlbml6ZXIp",highlighted:`<span class="hljs-keyword">from</span> datasets <span class="hljs-keyword">import</span> load_dataset
<span class="hljs-keyword">from</span> transformers <span class="hljs-keyword">import</span> AutoTokenizer, DataCollatorWithPadding
raw_datasets = load_dataset(<span class="hljs-string">&quot;glue&quot;</span>, <span class="hljs-string">&quot;mrpc&quot;</span>)
checkpoint = <span class="hljs-string">&quot;bert-base-uncased&quot;</span>
tokenizer = AutoTokenizer.from_pretrained(checkpoint)
<span class="hljs-keyword">def</span> <span class="hljs-title function_">tokenize_function</span>(<span class="hljs-params">example</span>):
<span class="hljs-keyword">return</span> tokenizer(example[<span class="hljs-string">&quot;sentence1&quot;</span>], example[<span class="hljs-string">&quot;sentence2&quot;</span>], truncation=<span class="hljs-literal">True</span>)
tokenized_datasets = raw_datasets.<span class="hljs-built_in">map</span>(tokenize_function, batched=<span class="hljs-literal">True</span>)
data_collator = DataCollatorWithPadding(tokenizer=tokenizer)`,wrap:!1}}),E=new h({props:{title:"ํ›ˆ๋ จ",local:"training",headingTag:"h3"}}),V=new y({props:{code:"ZnJvbSUyMHRyYW5zZm9ybWVycyUyMGltcG9ydCUyMFRyYWluaW5nQXJndW1lbnRzJTBBJTBBdHJhaW5pbmdfYXJncyUyMCUzRCUyMFRyYWluaW5nQXJndW1lbnRzKCUyMnRlc3QtdHJhaW5lciUyMik=",highlighted:`<span class="hljs-keyword">from</span> transformers <span class="hljs-keyword">import</span> TrainingArguments
training_args = TrainingArguments(<span class="hljs-string">&quot;test-trainer&quot;</span>)`,wrap:!1}}),j=new Xe({props:{$$slots:{default:[tn]},$$scope:{ctx:J}}}),Y=new y({props:{code:"ZnJvbSUyMHRyYW5zZm9ybWVycyUyMGltcG9ydCUyMEF1dG9Nb2RlbEZvclNlcXVlbmNlQ2xhc3NpZmljYXRpb24lMEElMEFtb2RlbCUyMCUzRCUyMEF1dG9Nb2RlbEZvclNlcXVlbmNlQ2xhc3NpZmljYXRpb24uZnJvbV9wcmV0cmFpbmVkKGNoZWNrcG9pbnQlMkMlMjBudW1fbGFiZWxzJTNEMik=",highlighted:`<span class="hljs-keyword">from</span> transformers <span class="hljs-keyword">import</span> AutoModelForSequenceClassification
model = AutoModelForSequenceClassification.from_pretrained(checkpoint, num_labels=<span class="hljs-number">2</span>)`,wrap:!1}}),B=new y({props:{code:"ZnJvbSUyMHRyYW5zZm9ybWVycyUyMGltcG9ydCUyMFRyYWluZXIlMEElMEF0cmFpbmVyJTIwJTNEJTIwVHJhaW5lciglMEElMjAlMjAlMjAlMjBtb2RlbCUyQyUwQSUyMCUyMCUyMCUyMHRyYWluaW5nX2FyZ3MlMkMlMEElMjAlMjAlMjAlMjB0cmFpbl9kYXRhc2V0JTNEdG9rZW5pemVkX2RhdGFzZXRzJTVCJTIydHJhaW4lMjIlNUQlMkMlMEElMjAlMjAlMjAlMjBldmFsX2RhdGFzZXQlM0R0b2tlbml6ZWRfZGF0YXNldHMlNUIlMjJ2YWxpZGF0aW9uJTIyJTVEJTJDJTBBJTIwJTIwJTIwJTIwZGF0YV9jb2xsYXRvciUzRGRhdGFfY29sbGF0b3IlMkMlMEElMjAlMjAlMjAlMjBwcm9jZXNzaW5nX2NsYXNzJTNEdG9rZW5pemVyJTJDJTBBKQ==",highlighted:`<span class="hljs-keyword">from</span> transformers <span class="hljs-keyword">import</span> Trainer
trainer = Trainer(
model,
training_args,
train_dataset=tokenized_datasets[<span class="hljs-string">&quot;train&quot;</span>],
eval_dataset=tokenized_datasets[<span class="hljs-string">&quot;validation&quot;</span>],
data_collator=data_collator,
processing_class=tokenizer,
)`,wrap:!1}}),C=new Xe({props:{$$slots:{default:[ln]},$$scope:{ctx:J}}}),N=new y({props:{code:"dHJhaW5lci50cmFpbigp",highlighted:"trainer.train()",wrap:!1}}),D=new h({props:{title:"ํ‰๊ฐ€",local:"evaluation",headingTag:"h3"}}),O=new y({props:{code:"cHJlZGljdGlvbnMlMjAlM0QlMjB0cmFpbmVyLnByZWRpY3QodG9rZW5pemVkX2RhdGFzZXRzJTVCJTIydmFsaWRhdGlvbiUyMiU1RCklMEFwcmludChwcmVkaWN0aW9ucy5wcmVkaWN0aW9ucy5zaGFwZSUyQyUyMHByZWRpY3Rpb25zLmxhYmVsX2lkcy5zaGFwZSk=",highlighted:`predictions = trainer.predict(tokenized_datasets[<span class="hljs-string">&quot;validation&quot;</span>])
<span class="hljs-built_in">print</span>(predictions.predictions.shape, predictions.label_ids.shape)`,wrap:!1}}),ee=new y({props:{code:"KDQwOCUyQyUyMDIpJTIwKDQwOCUyQyk=",highlighted:'(<span class="hljs-number">408</span>, <span class="hljs-number">2</span>) (<span class="hljs-number">408</span>,)',wrap:!1}}),ne=new y({props:{code:"aW1wb3J0JTIwbnVtcHklMjBhcyUyMG5wJTBBJTBBcHJlZHMlMjAlM0QlMjBucC5hcmdtYXgocHJlZGljdGlvbnMucHJlZGljdGlvbnMlMkMlMjBheGlzJTNELTEp",highlighted:`<span class="hljs-keyword">import</span> numpy <span class="hljs-keyword">as</span> np
preds = np.argmax(predictions.predictions, axis=-<span class="hljs-number">1</span>)`,wrap:!1}}),ae=new y({props:{code:"aW1wb3J0JTIwZXZhbHVhdGUlMEElMEFtZXRyaWMlMjAlM0QlMjBldmFsdWF0ZS5sb2FkKCUyMmdsdWUlMjIlMkMlMjAlMjJtcnBjJTIyKSUwQW1ldHJpYy5jb21wdXRlKHByZWRpY3Rpb25zJTNEcHJlZHMlMkMlMjByZWZlcmVuY2VzJTNEcHJlZGljdGlvbnMubGFiZWxfaWRzKQ==",highlighted:`<span class="hljs-keyword">import</span> evaluate
metric = evaluate.load(<span class="hljs-string">&quot;glue&quot;</span>, <span class="hljs-string">&quot;mrpc&quot;</span>)
metric.compute(predictions=preds, references=predictions.label_ids)`,wrap:!1}}),re=new y({props:{code:"JTdCJ2FjY3VyYWN5JyUzQSUyMDAuODU3ODQzMTM3MjU0OTAxOSUyQyUyMCdmMSclM0ElMjAwLjg5OTY1Mzk3OTIzODc1NDIlN0Q=",highlighted:'{<span class="hljs-string">&#x27;accuracy&#x27;</span>: <span class="hljs-number">0.8578431372549019</span>, <span class="hljs-string">&#x27;f1&#x27;</span>: <span class="hljs-number">0.8996539792387542</span>}',wrap:!1}}),v=new Xe({props:{$$slots:{default:[nn]},$$scope:{ctx:J}}}),oe=new y({props:{code:"ZGVmJTIwY29tcHV0ZV9tZXRyaWNzKGV2YWxfcHJlZHMpJTNBJTBBJTIwJTIwJTIwJTIwbWV0cmljJTIwJTNEJTIwZXZhbHVhdGUubG9hZCglMjJnbHVlJTIyJTJDJTIwJTIybXJwYyUyMiklMEElMjAlMjAlMjAlMjBsb2dpdHMlMkMlMjBsYWJlbHMlMjAlM0QlMjBldmFsX3ByZWRzJTBBJTIwJTIwJTIwJTIwcHJlZGljdGlvbnMlMjAlM0QlMjBucC5hcmdtYXgobG9naXRzJTJDJTIwYXhpcyUzRC0xKSUwQSUyMCUyMCUyMCUyMHJldHVybiUyMG1ldHJpYy5jb21wdXRlKHByZWRpY3Rpb25zJTNEcHJlZGljdGlvbnMlMkMlMjByZWZlcmVuY2VzJTNEbGFiZWxzKQ==",highlighted:`<span class="hljs-keyword">def</span> <span class="hljs-title function_">compute_metrics</span>(<span class="hljs-params">eval_preds</span>):
metric = evaluate.load(<span class="hljs-string">&quot;glue&quot;</span>, <span class="hljs-string">&quot;mrpc&quot;</span>)
logits, labels = eval_preds
predictions = np.argmax(logits, axis=-<span class="hljs-number">1</span>)
<span class="hljs-keyword">return</span> metric.compute(predictions=predictions, references=labels)`,wrap:!1}}),me=new y({props:{code:"dHJhaW5pbmdfYXJncyUyMCUzRCUyMFRyYWluaW5nQXJndW1lbnRzKCUyMnRlc3QtdHJhaW5lciUyMiUyQyUyMGV2YWxfc3RyYXRlZ3klM0QlMjJlcG9jaCUyMiklMEFtb2RlbCUyMCUzRCUyMEF1dG9Nb2RlbEZvclNlcXVlbmNlQ2xhc3NpZmljYXRpb24uZnJvbV9wcmV0cmFpbmVkKGNoZWNrcG9pbnQlMkMlMjBudW1fbGFiZWxzJTNEMiklMEElMEF0cmFpbmVyJTIwJTNEJTIwVHJhaW5lciglMEElMjAlMjAlMjAlMjBtb2RlbCUyQyUwQSUyMCUyMCUyMCUyMHRyYWluaW5nX2FyZ3MlMkMlMEElMjAlMjAlMjAlMjB0cmFpbl9kYXRhc2V0JTNEdG9rZW5pemVkX2RhdGFzZXRzJTVCJTIydHJhaW4lMjIlNUQlMkMlMEElMjAlMjAlMjAlMjBldmFsX2RhdGFzZXQlM0R0b2tlbml6ZWRfZGF0YXNldHMlNUIlMjJ2YWxpZGF0aW9uJTIyJTVEJTJDJTBBJTIwJTIwJTIwJTIwZGF0YV9jb2xsYXRvciUzRGRhdGFfY29sbGF0b3IlMkMlMEElMjAlMjAlMjAlMjBwcm9jZXNzaW5nX2NsYXNzJTNEdG9rZW5pemVyJTJDJTBBJTIwJTIwJTIwJTIwY29tcHV0ZV9tZXRyaWNzJTNEY29tcHV0ZV9tZXRyaWNzJTJDJTBBKQ==",highlighted:`training_args = TrainingArguments(<span class="hljs-string">&quot;test-trainer&quot;</span>, eval_strategy=<span class="hljs-string">&quot;epoch&quot;</span>)
model = AutoModelForSequenceClassification.from_pretrained(checkpoint, num_labels=<span class="hljs-number">2</span>)
trainer = Trainer(
model,
training_args,
train_dataset=tokenized_datasets[<span class="hljs-string">&quot;train&quot;</span>],
eval_dataset=tokenized_datasets[<span class="hljs-string">&quot;validation&quot;</span>],
data_collator=data_collator,
processing_class=tokenizer,
compute_metrics=compute_metrics,
)`,wrap:!1}}),$e=new y({props:{code:"dHJhaW5lci50cmFpbigp",highlighted:"trainer.train()",wrap:!1}}),ue=new h({props:{title:"๊ณ ๊ธ‰ ํ›ˆ๋ จ ๊ธฐ๋Šฅ",local:"advanced-training-features",headingTag:"h3"}}),ge=new y({props:{code:"dHJhaW5pbmdfYXJncyUyMCUzRCUyMFRyYWluaW5nQXJndW1lbnRzKCUwQSUyMCUyMCUyMCUyMCUyMnRlc3QtdHJhaW5lciUyMiUyQyUwQSUyMCUyMCUyMCUyMGV2YWxfc3RyYXRlZ3klM0QlMjJlcG9jaCUyMiUyQyUwQSUyMCUyMCUyMCUyMGZwMTYlM0RUcnVlJTJDJTIwJTIwJTIzJTIwJUVEJTk4JUJDJUVEJTk1JUE5JTIwJUVDJUEwJTk1JUVCJUIwJTgwJUVCJThGJTg0JTIwJUVEJTk5JTlDJUVDJTg0JUIxJUVEJTk5JTk0JTBBKQ==",highlighted:`training_args = TrainingArguments(
<span class="hljs-string">&quot;test-trainer&quot;</span>,
eval_strategy=<span class="hljs-string">&quot;epoch&quot;</span>,
fp16=<span class="hljs-literal">True</span>, <span class="hljs-comment"># ํ˜ผํ•ฉ ์ •๋ฐ€๋„ ํ™œ์„ฑํ™”</span>
)`,wrap:!1}}),ye=new y({props:{code:"dHJhaW5pbmdfYXJncyUyMCUzRCUyMFRyYWluaW5nQXJndW1lbnRzKCUwQSUyMCUyMCUyMCUyMCUyMnRlc3QtdHJhaW5lciUyMiUyQyUwQSUyMCUyMCUyMCUyMGV2YWxfc3RyYXRlZ3klM0QlMjJlcG9jaCUyMiUyQyUwQSUyMCUyMCUyMCUyMHBlcl9kZXZpY2VfdHJhaW5fYmF0Y2hfc2l6ZSUzRDQlMkMlMEElMjAlMjAlMjAlMjBncmFkaWVudF9hY2N1bXVsYXRpb25fc3RlcHMlM0Q0JTJDJTIwJTIwJTIzJTIwJUVDJTlDJUEwJUVEJTlBJUE4JTIwJUVCJUIwJUIwJUVDJUI5JTk4JTIwJUVEJTgxJUFDJUVBJUI4JUIwJTIwJTNEJTIwNCUyMColMjA0JTIwJTNEJTIwMTYlMEEp",highlighted:`training_args = TrainingArguments(
<span class="hljs-string">&quot;test-trainer&quot;</span>,
eval_strategy=<span class="hljs-string">&quot;epoch&quot;</span>,
per_device_train_batch_size=<span class="hljs-number">4</span>,
gradient_accumulation_steps=<span class="hljs-number">4</span>, <span class="hljs-comment"># ์œ ํšจ ๋ฐฐ์น˜ ํฌ๊ธฐ = 4 * 4 = 16</span>
)`,wrap:!1}}),we=new y({props:{code:"dHJhaW5pbmdfYXJncyUyMCUzRCUyMFRyYWluaW5nQXJndW1lbnRzKCUwQSUyMCUyMCUyMCUyMCUyMnRlc3QtdHJhaW5lciUyMiUyQyUwQSUyMCUyMCUyMCUyMGV2YWxfc3RyYXRlZ3klM0QlMjJlcG9jaCUyMiUyQyUwQSUyMCUyMCUyMCUyMGxlYXJuaW5nX3JhdGUlM0QyZS01JTJDJTBBJTIwJTIwJTIwJTIwbHJfc2NoZWR1bGVyX3R5cGUlM0QlMjJjb3NpbmUlMjIlMkMlMjAlMjAlMjMlMjAlRUIlOEIlQTQlRUIlQTUlQjglMjAlRUMlOEElQTQlRUMlQkMlODAlRUMlQTQlODQlRUIlOUYlQUMlMjAlRUMlOEIlOUMlRUIlOEYlODQlMEEp",highlighted:`training_args = TrainingArguments(
<span class="hljs-string">&quot;test-trainer&quot;</span>,
eval_strategy=<span class="hljs-string">&quot;epoch&quot;</span>,
learning_rate=<span class="hljs-number">2e-5</span>,
lr_scheduler_type=<span class="hljs-string">&quot;cosine&quot;</span>, <span class="hljs-comment"># ๋‹ค๋ฅธ ์Šค์ผ€์ค„๋Ÿฌ ์‹œ๋„</span>
)`,wrap:!1}}),k=new Xe({props:{$$slots:{default:[sn]},$$scope:{ctx:J}}}),R=new Xe({props:{$$slots:{default:[an]},$$scope:{ctx:J}}}),_e=new h({props:{title:"์„น์…˜ ํ€ด์ฆˆ",local:"section-quiz",headingTag:"h2"}}),Ce=new h({props:{title:"1. Trainer ์—์„œ <code> processing_class </code> ๋งค๊ฐœ๋ณ€์ˆ˜์˜ ๋ชฉ์ ์€ ๋ฌด์—‡์ธ๊ฐ€์š”?",local:"1-trainer-์—์„œ-code-processingclass-code-๋งค๊ฐœ๋ณ€์ˆ˜์˜-๋ชฉ์ ์€-๋ฌด์—‡์ธ๊ฐ€์š”",headingTag:"h3"}}),ve=new Ye({props:{choices:[{text:"์‚ฌ์šฉํ•  ๋ชจ๋ธ ์•„ํ‚คํ…์ฒ˜๋ฅผ ์ง€์ •ํ•ฉ๋‹ˆ๋‹ค.",explain:"๋ชจ๋ธ ์•„ํ‚คํ…์ฒ˜๋Š” ๋ชจ๋ธ์„ ๋กœ๋“œํ•  ๋•Œ ์ง€์ •๋˜๋ฉฐ, Trainer์—์„œ ์ง€์ •ํ•˜์ง€ ์•Š์Šต๋‹ˆ๋‹ค."},{text:"๋ฐ์ดํ„ฐ ์ฒ˜๋ฆฌ์— ์‚ฌ์šฉํ•  ํ† ํฌ๋‚˜์ด์ €๋ฅผ Trainer์— ์•Œ๋ ค์ค๋‹ˆ๋‹ค.",explain:"processing_class ๋งค๊ฐœ๋ณ€์ˆ˜๋Š” ์‚ฌ์šฉํ•  ํ† ํฌ๋‚˜์ด์ €๋ฅผ Trainer๊ฐ€ ์•Œ ์ˆ˜ ์žˆ๋„๋ก ๋„์™€์ฃผ๋Š” ์ตœ์‹  ์ถ”๊ฐ€ ์‚ฌํ•ญ์ž…๋‹ˆ๋‹ค.",correct:!0},{text:"ํ›ˆ๋ จ์„ ์œ„ํ•œ ๋ฐฐ์น˜ ํฌ๊ธฐ๋ฅผ ๊ฒฐ์ •ํ•ฉ๋‹ˆ๋‹ค.",explain:"๋ฐฐ์น˜ ํฌ๊ธฐ๋Š” processing_class๊ฐ€ ์•„๋‹Œ TrainingArguments์—์„œ ์„ค์ •๋ฉ๋‹ˆ๋‹ค."},{text:"ํ‰๊ฐ€ ๋นˆ๋„๋ฅผ ์ œ์–ดํ•ฉ๋‹ˆ๋‹ค.",explain:"ํ‰๊ฐ€ ๋นˆ๋„๋Š” TrainingArguments์˜ eval_strategy๋กœ ์ œ์–ด๋ฉ๋‹ˆ๋‹ค."}]}}),ke=new h({props:{title:"2. ํ›ˆ๋ จ ์ค‘ ํ‰๊ฐ€๊ฐ€ ์–ผ๋งˆ๋‚˜ ์ž์ฃผ ๋ฐœ์ƒํ•˜๋Š”์ง€๋ฅผ ์ œ์–ดํ•˜๋Š” TrainingArguments ๋งค๊ฐœ๋ณ€์ˆ˜๋Š” ๋ฌด์—‡์ธ๊ฐ€์š”?",local:"2-ํ›ˆ๋ จ-์ค‘-ํ‰๊ฐ€๊ฐ€-์–ผ๋งˆ๋‚˜-์ž์ฃผ-๋ฐœ์ƒํ•˜๋Š”์ง€๋ฅผ-์ œ์–ดํ•˜๋Š”-trainingarguments-๋งค๊ฐœ๋ณ€์ˆ˜๋Š”-๋ฌด์—‡์ธ๊ฐ€์š”",headingTag:"h3"}}),Re=new Ye({props:{choices:[{text:"eval_frequency",explain:"TrainingArguments์—๋Š” eval_frequency ๋งค๊ฐœ๋ณ€์ˆ˜๊ฐ€ ์—†์Šต๋‹ˆ๋‹ค."},{text:"eval_strategy",explain:"eval_strategy๋Š” ํ‰๊ฐ€ ํƒ€์ด๋ฐ์„ ์ œ์–ดํ•˜๊ธฐ ์œ„ํ•ด 'epoch', 'steps', ๋˜๋Š” 'no'๋กœ ์„ค์ •ํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค.",correct:!0},{text:"evaluation_steps",explain:"eval_steps๋Š” ํ‰๊ฐ€ ์‚ฌ์ด์˜ ๋‹จ๊ณ„ ์ˆ˜๋ฅผ ์„ค์ •ํ•˜์ง€๋งŒ, eval_strategy๊ฐ€ ํ‰๊ฐ€ ๋ฐœ์ƒ ์—ฌ๋ถ€/์‹œ๊ธฐ๋ฅผ ๊ฒฐ์ •ํ•ฉ๋‹ˆ๋‹ค."},{text:"do_eval",explain:"์ตœ์‹  TrainingArguments์—๋Š” do_eval ๋งค๊ฐœ๋ณ€์ˆ˜๊ฐ€ ์—†์Šต๋‹ˆ๋‹ค."}]}}),xe=new h({props:{title:"3. TrainingArguments์—์„œ <code> fp16=True </code> ๋Š” ๋ฌด์—‡์„ ํ™œ์„ฑํ™”ํ•˜๋‚˜์š”?",local:"3-trainingarguments์—์„œ-code-fp16true-code-๋Š”-๋ฌด์—‡์„-ํ™œ์„ฑํ™”ํ•˜๋‚˜์š”",headingTag:"h3"}}),He=new Ye({props:{choices:[{text:"๋” ๋น ๋ฅธ ํ›ˆ๋ จ์„ ์œ„ํ•œ 16๋น„ํŠธ ์ •์ˆ˜ ์ •๋ฐ€๋„",explain:"fp16์€ ์ •์ˆ˜ ์ •๋ฐ€๋„๊ฐ€ ์•„๋‹Œ ๋ถ€๋™์†Œ์ˆ˜์  ์ •๋ฐ€๋„๋ฅผ ์˜๋ฏธํ•ฉ๋‹ˆ๋‹ค."},{text:"๋” ๋น ๋ฅธ ํ›ˆ๋ จ๊ณผ ๋ฉ”๋ชจ๋ฆฌ ์‚ฌ์šฉ๋Ÿ‰ ๊ฐ์†Œ๋ฅผ ์œ„ํ•œ 16๋น„ํŠธ ๋ถ€๋™์†Œ์ˆ˜์  ์ˆ˜๋ฅผ ์‚ฌ์šฉํ•œ ํ˜ผํ•ฉ ์ •๋ฐ€๋„ ํ›ˆ๋ จ",explain:"ํ˜ผํ•ฉ ์ •๋ฐ€๋„ ํ›ˆ๋ จ์€ ์ˆœ์ „ํŒŒ์—๋Š” 16๋น„ํŠธ ํ”Œ๋กœํŠธ๋ฅผ, ๊ทธ๋ ˆ์ด๋””์–ธํŠธ์—๋Š” 32๋น„ํŠธ๋ฅผ ์‚ฌ์šฉํ•˜์—ฌ ์†๋„๋ฅผ ํ–ฅ์ƒ์‹œํ‚ค๊ณ  ๋ฉ”๋ชจ๋ฆฌ ์‚ฌ์šฉ๋Ÿ‰์„ ์ค„์ž…๋‹ˆ๋‹ค.",correct:!0},{text:"์ •ํ™•ํžˆ 16 ์—ํฌํฌ ๋™์•ˆ ํ›ˆ๋ จ",explain:"fp16์€ ์—ํฌํฌ ์ˆ˜์™€ ๊ด€๋ จ์ด ์—†์Šต๋‹ˆ๋‹ค."},{text:"๋ถ„์‚ฐ ํ›ˆ๋ จ์„ ์œ„ํ•œ 16๊ฐœ GPU ์‚ฌ์šฉ",explain:"GPU ์ˆ˜๋Š” fp16 ๋งค๊ฐœ๋ณ€์ˆ˜๋กœ ์ œ์–ด๋˜์ง€ ์•Š์Šต๋‹ˆ๋‹ค."}]}}),We=new h({props:{title:"4. Trainer์—์„œ <code> compute_metrics </code> ํ•จ์ˆ˜์˜ ์—ญํ• ์€ ๋ฌด์—‡์ธ๊ฐ€์š”?",local:"4-trainer์—์„œ-code-computemetrics-code-ํ•จ์ˆ˜์˜-์—ญํ• ์€-๋ฌด์—‡์ธ๊ฐ€์š”",headingTag:"h3"}}),Ge=new Ye({props:{choices:[{text:"ํ›ˆ๋ จ ์ค‘ ์†์‹ค์„ ๊ณ„์‚ฐํ•ฉ๋‹ˆ๋‹ค.",explain:"์†์‹ค ๊ณ„์‚ฐ์€ compute_metrics๊ฐ€ ์•„๋‹Œ ๋ชจ๋ธ์—์„œ ์ž๋™์œผ๋กœ ์ฒ˜๋ฆฌ๋ฉ๋‹ˆ๋‹ค."},{text:"๋กœ์ง“์„ ์˜ˆ์ธก์œผ๋กœ ๋ณ€ํ™˜ํ•˜๊ณ  ์ •ํ™•๋„ ๋ฐ F1๊ณผ ๊ฐ™์€ ํ‰๊ฐ€ ๋ฉ”ํŠธ๋ฆญ์„ ๊ณ„์‚ฐํ•ฉ๋‹ˆ๋‹ค.",explain:"compute_metrics๋Š” ์˜ˆ์ธก๊ณผ ๋ผ๋ฒจ์„ ๋ฐ›์•„์„œ ํ‰๊ฐ€๋ฅผ ์œ„ํ•œ ๋ฉ”ํŠธ๋ฆญ์„ ๋ฐ˜ํ™˜ํ•ฉ๋‹ˆ๋‹ค.",correct:!0},{text:"์‚ฌ์šฉํ•  ์˜ตํ‹ฐ๋งˆ์ด์ €๋ฅผ ๊ฒฐ์ •ํ•ฉ๋‹ˆ๋‹ค.",explain:"์˜ตํ‹ฐ๋งˆ์ด์ € ์„ ํƒ์€ compute_metrics๋กœ ์ฒ˜๋ฆฌ๋˜์ง€ ์•Š์Šต๋‹ˆ๋‹ค."},{text:"ํ›ˆ๋ จ ๋ฐ์ดํ„ฐ๋ฅผ ์ „์ฒ˜๋ฆฌํ•ฉ๋‹ˆ๋‹ค.",explain:"๋ฐ์ดํ„ฐ ์ „์ฒ˜๋ฆฌ๋Š” ํ›ˆ๋ จ ์ „์— ์ˆ˜ํ–‰๋˜๋ฉฐ, ํ‰๊ฐ€ ์ค‘ compute_metrics๋กœ ์ˆ˜ํ–‰๋˜์ง€ ์•Š์Šต๋‹ˆ๋‹ค."}]}}),Ie=new h({props:{title:"5. Trainer์— <code> eval_dataset </code> ์„ ์ œ๊ณตํ•˜์ง€ ์•Š์œผ๋ฉด ์–ด๋–ป๊ฒŒ ๋˜๋‚˜์š”?",local:"5-trainer์—-code-evaldataset-code-์„-์ œ๊ณตํ•˜์ง€-์•Š์œผ๋ฉด-์–ด๋–ป๊ฒŒ-๋˜๋‚˜์š”",headingTag:"h3"}}),Ze=new Ye({props:{choices:[{text:"ํ›ˆ๋ จ์ด ์˜ค๋ฅ˜์™€ ํ•จ๊ป˜ ์‹คํŒจํ•ฉ๋‹ˆ๋‹ค.",explain:"eval_dataset ์—†์ด๋„ ํ›ˆ๋ จ์„ ์ง„ํ–‰ํ•  ์ˆ˜ ์žˆ์ง€๋งŒ, ํ‰๊ฐ€ ๋ฉ”ํŠธ๋ฆญ์€ ์–ป์„ ์ˆ˜ ์—†์Šต๋‹ˆ๋‹ค."},{text:"Trainer๊ฐ€ ์ž๋™์œผ๋กœ ํ›ˆ๋ จ ๋ฐ์ดํ„ฐ๋ฅผ ํ‰๊ฐ€์šฉ์œผ๋กœ ๋ถ„ํ• ํ•ฉ๋‹ˆ๋‹ค.",explain:"Trainer๋Š” ์ž๋™์œผ๋กœ ๊ฒ€์ฆ ๋ถ„ํ• ์„ ์ƒ์„ฑํ•˜์ง€ ์•Š์Šต๋‹ˆ๋‹ค."},{text:"ํ›ˆ๋ จ ์ค‘ ํ‰๊ฐ€ ๋ฉ”ํŠธ๋ฆญ์„ ์–ป์„ ์ˆ˜ ์—†์ง€๋งŒ ํ›ˆ๋ จ์€ ์—ฌ์ „ํžˆ ์ž‘๋™ํ•ฉ๋‹ˆ๋‹ค.",explain:"ํ‰๊ฐ€๋Š” ์„ ํƒ์‚ฌํ•ญ์ž…๋‹ˆ๋‹ค - ํ‰๊ฐ€ ์—†์ด๋„ ํ›ˆ๋ จํ•  ์ˆ˜ ์žˆ์ง€๋งŒ ๊ฒ€์ฆ ๋ฉ”ํŠธ๋ฆญ์€ ๋ณผ ์ˆ˜ ์—†์Šต๋‹ˆ๋‹ค.",correct:!0},{text:"๋ชจ๋ธ์ด ํ‰๊ฐ€๋ฅผ ์œ„ํ•ด ํ›ˆ๋ จ ๋ฐ์ดํ„ฐ๋ฅผ ์‚ฌ์šฉํ•ฉ๋‹ˆ๋‹ค.",explain:"Trainer๋Š” ์ž๋™์œผ๋กœ ํ‰๊ฐ€๋ฅผ ์œ„ํ•ด ํ›ˆ๋ จ ๋ฐ์ดํ„ฐ๋ฅผ ์‚ฌ์šฉํ•˜์ง€ ์•Š์Šต๋‹ˆ๋‹ค - ๋‹จ์ˆœํžˆ ํ‰๊ฐ€ํ•˜์ง€ ์•Š์Šต๋‹ˆ๋‹ค."}]}}),Ee=new h({props:{title:"6. ๊ทธ๋ ˆ์ด๋””์–ธํŠธ ๋ˆ„์ ์ด๋ž€ ๋ฌด์—‡์ด๋ฉฐ ์–ด๋–ป๊ฒŒ ํ™œ์„ฑํ™”ํ•˜๋‚˜์š”?",local:"6-๊ทธ๋ ˆ์ด๋””์–ธํŠธ-๋ˆ„์ ์ด๋ž€-๋ฌด์—‡์ด๋ฉฐ-์–ด๋–ป๊ฒŒ-ํ™œ์„ฑํ™”ํ•˜๋‚˜์š”",headingTag:"h3"}}),Qe=new Ye({props:{choices:[{text:"๊ทธ๋ ˆ์ด๋””์–ธํŠธ๋ฅผ ๋””์Šคํฌ์— ์ €์žฅํ•˜๋Š” ๊ฒƒ์œผ๋กœ, save_gradients=True๋กœ ํ™œ์„ฑํ™”๋ฉ๋‹ˆ๋‹ค.",explain:"๊ทธ๋ ˆ์ด๋””์–ธํŠธ ๋ˆ„์ ์€ ๊ทธ๋ ˆ์ด๋””์–ธํŠธ๋ฅผ ๋””์Šคํฌ์— ์ €์žฅํ•˜๋Š” ๊ฒƒ๊ณผ ๊ด€๋ จ์ด ์—†์Šต๋‹ˆ๋‹ค."},{text:"์—…๋ฐ์ดํŠธ ์ „์— ์—ฌ๋Ÿฌ ๋ฐฐ์น˜์— ๊ฑธ์ณ ๊ทธ๋ ˆ์ด๋””์–ธํŠธ๋ฅผ ๋ˆ„์ ํ•˜๋Š” ๊ฒƒ์œผ๋กœ, gradient_accumulation_steps๋กœ ํ™œ์„ฑํ™”๋ฉ๋‹ˆ๋‹ค.",explain:"์ด๋ฅผ ํ†ตํ•ด ์—ฌ๋Ÿฌ ์ˆœ์ „ํŒŒ์— ๊ฑธ์ณ ๊ทธ๋ ˆ์ด๋””์–ธํŠธ๋ฅผ ๋ˆ„์ ํ•˜์—ฌ ๋” ํฐ ๋ฐฐ์น˜ ํฌ๊ธฐ๋ฅผ ์‹œ๋ฎฌ๋ ˆ์ด์…˜ํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค.",correct:!0},{text:"๊ทธ๋ ˆ์ด๋””์–ธํŠธ ๊ณ„์‚ฐ์„ ๊ฐ€์†ํ™”ํ•˜๋Š” ๊ฒƒ์œผ๋กœ, fp16๊ณผ ํ•จ๊ป˜ ์ž๋™์œผ๋กœ ํ™œ์„ฑํ™”๋ฉ๋‹ˆ๋‹ค.",explain:"fp16์ด ํ›ˆ๋ จ์„ ๊ฐ€์†ํ™”ํ•  ์ˆ˜ ์žˆ์ง€๋งŒ, ๊ทธ๋ ˆ์ด๋””์–ธํŠธ ๋ˆ„์ ์€ ๋ณ„๋„์˜ ๊ธฐ์ˆ ์ž…๋‹ˆ๋‹ค."},{text:"๊ทธ๋ ˆ์ด๋””์–ธํŠธ ์˜ค๋ฒ„ํ”Œ๋กœ์šฐ๋ฅผ ๋ฐฉ์ง€ํ•˜๋Š” ๊ฒƒ์œผ๋กœ, gradient_clipping=True๋กœ ํ™œ์„ฑํ™”๋ฉ๋‹ˆ๋‹ค.",explain:"์ด๋Š” ๊ทธ๋ ˆ์ด๋””์–ธํŠธ ๋ˆ„์ ์ด ์•„๋‹Œ ๊ทธ๋ ˆ์ด๋””์–ธํŠธ ํด๋ฆฌํ•‘์„ ์„ค๋ช…ํ•ฉ๋‹ˆ๋‹ค."}]}}),x=new Xe({props:{$$slots:{default:[rn]},$$scope:{ctx:J}}}),Ve=new Ol({props:{source:"https://github.com/huggingface/course/blob/main/chapters/ko/chapter3/3.mdx"}}),{c(){r=M("meta"),T=s(),i=M("p"),g=s(),p(w.$$.fragment),U=s(),p(b.$$.fragment),Ae=s(),p(H.$$.fragment),Be=s(),p(W.$$.fragment),qe=s(),G=M("p"),G.innerHTML=il,Le=s(),p(_.$$.fragment),Ne=s(),I=M("p"),I.textContent=pl,Pe=s(),p(Z.$$.fragment),Se=s(),p(E.$$.fragment),De=s(),Q=M("p"),Q.innerHTML=ol,Ke=s(),p(V.$$.fragment),Oe=s(),X=M("p"),X.innerHTML=cl,et=s(),p(j.$$.fragment),tt=s(),z=M("p"),z.innerHTML=ml,lt=s(),p(Y.$$.fragment),nt=s(),F=M("p"),F.innerHTML=fl,st=s(),A=M("p"),A.innerHTML=$l,at=s(),p(B.$$.fragment),rt=s(),q=M("p"),q.innerHTML=Ml,it=s(),p(C.$$.fragment),pt=s(),L=M("p"),L.innerHTML=ul,ot=s(),p(N.$$.fragment),ct=s(),P=M("p"),P.textContent=dl,mt=s(),S=M("ol"),S.innerHTML=Tl,ft=s(),p(D.$$.fragment),$t=s(),K=M("p"),K.innerHTML=gl,Mt=s(),p(O.$$.fragment),ut=s(),p(ee.$$.fragment),dt=s(),te=M("p"),te.innerHTML=Jl,Tt=s(),le=M("p"),le.innerHTML=yl,gt=s(),p(ne.$$.fragment),Jt=s(),se=M("p"),se.innerHTML=Ul,yt=s(),p(ae.$$.fragment),Ut=s(),p(re.$$.fragment),wt=s(),p(v.$$.fragment),bt=s(),ie=M("p"),ie.innerHTML=wl,ht=s(),pe=M("p"),pe.innerHTML=bl,_t=s(),p(oe.$$.fragment),jt=s(),ce=M("p"),ce.innerHTML=hl,Ct=s(),p(me.$$.fragment),vt=s(),fe=M("p"),fe.innerHTML=_l,kt=s(),p($e.$$.fragment),Rt=s(),Me=M("p"),Me.textContent=jl,xt=s(),p(ue.$$.fragment),Ht=s(),de=M("p"),de.innerHTML=Cl,Wt=s(),Te=M("p"),Te.innerHTML=vl,Gt=s(),p(ge.$$.fragment),It=s(),Je=M("p"),Je.innerHTML=kl,Zt=s(),p(ye.$$.fragment),Et=s(),Ue=M("p"),Ue.innerHTML=Rl,Qt=s(),p(we.$$.fragment),Vt=s(),p(k.$$.fragment),Xt=s(),be=M("p"),be.innerHTML=xl,zt=s(),he=M("p"),he.innerHTML=Hl,Yt=s(),p(R.$$.fragment),Ft=s(),p(_e.$$.fragment),At=s(),je=M("p"),je.textContent=Wl,Bt=s(),p(Ce.$$.fragment),qt=s(),p(ve.$$.fragment),Lt=s(),p(ke.$$.fragment),Nt=s(),p(Re.$$.fragment),Pt=s(),p(xe.$$.fragment),St=s(),p(He.$$.fragment),Dt=s(),p(We.$$.fragment),Kt=s(),p(Ge.$$.fragment),Ot=s(),p(Ie.$$.fragment),el=s(),p(Ze.$$.fragment),tl=s(),p(Ee.$$.fragment),ll=s(),p(Qe.$$.fragment),nl=s(),p(x.$$.fragment),sl=s(),p(Ve.$$.fragment),al=s(),Fe=M("p"),this.h()},l(e){const t=Nl("svelte-u9bgzb",document.head);r=u(t,"META",{name:!0,content:!0}),t.forEach(l),T=a(e),i=u(e,"P",{}),Yl(i).forEach(l),g=a(e),o(w.$$.fragment,e),U=a(e),o(b.$$.fragment,e),Ae=a(e),o(H.$$.fragment,e),Be=a(e),o(W.$$.fragment,e),qe=a(e),G=u(e,"P",{"data-svelte-h":!0}),d(G)!=="svelte-knkc89"&&(G.innerHTML=il),Le=a(e),o(_.$$.fragment,e),Ne=a(e),I=u(e,"P",{"data-svelte-h":!0}),d(I)!=="svelte-hs8a7l"&&(I.textContent=pl),Pe=a(e),o(Z.$$.fragment,e),Se=a(e),o(E.$$.fragment,e),De=a(e),Q=u(e,"P",{"data-svelte-h":!0}),d(Q)!=="svelte-1enyha7"&&(Q.innerHTML=ol),Ke=a(e),o(V.$$.fragment,e),Oe=a(e),X=u(e,"P",{"data-svelte-h":!0}),d(X)!=="svelte-18au6nv"&&(X.innerHTML=cl),et=a(e),o(j.$$.fragment,e),tt=a(e),z=u(e,"P",{"data-svelte-h":!0}),d(z)!=="svelte-nt9c4b"&&(z.innerHTML=ml),lt=a(e),o(Y.$$.fragment,e),nt=a(e),F=u(e,"P",{"data-svelte-h":!0}),d(F)!=="svelte-s3sck9"&&(F.innerHTML=fl),st=a(e),A=u(e,"P",{"data-svelte-h":!0}),d(A)!=="svelte-4ai6qh"&&(A.innerHTML=$l),at=a(e),o(B.$$.fragment,e),rt=a(e),q=u(e,"P",{"data-svelte-h":!0}),d(q)!=="svelte-1m2yas3"&&(q.innerHTML=Ml),it=a(e),o(C.$$.fragment,e),pt=a(e),L=u(e,"P",{"data-svelte-h":!0}),d(L)!=="svelte-13y4n8x"&&(L.innerHTML=ul),ot=a(e),o(N.$$.fragment,e),ct=a(e),P=u(e,"P",{"data-svelte-h":!0}),d(P)!=="svelte-1vb1ztl"&&(P.textContent=dl),mt=a(e),S=u(e,"OL",{"data-svelte-h":!0}),d(S)!=="svelte-1kijd9m"&&(S.innerHTML=Tl),ft=a(e),o(D.$$.fragment,e),$t=a(e),K=u(e,"P",{"data-svelte-h":!0}),d(K)!=="svelte-1kov8l9"&&(K.innerHTML=gl),Mt=a(e),o(O.$$.fragment,e),ut=a(e),o(ee.$$.fragment,e),dt=a(e),te=u(e,"P",{"data-svelte-h":!0}),d(te)!=="svelte-44hwg3"&&(te.innerHTML=Jl),Tt=a(e),le=u(e,"P",{"data-svelte-h":!0}),d(le)!=="svelte-1f3lia8"&&(le.innerHTML=yl),gt=a(e),o(ne.$$.fragment,e),Jt=a(e),se=u(e,"P",{"data-svelte-h":!0}),d(se)!=="svelte-4of9x9"&&(se.innerHTML=Ul),yt=a(e),o(ae.$$.fragment,e),Ut=a(e),o(re.$$.fragment,e),wt=a(e),o(v.$$.fragment,e),bt=a(e),ie=u(e,"P",{"data-svelte-h":!0}),d(ie)!=="svelte-1ylr8sj"&&(ie.innerHTML=wl),ht=a(e),pe=u(e,"P",{"data-svelte-h":!0}),d(pe)!=="svelte-2jb62l"&&(pe.innerHTML=bl),_t=a(e),o(oe.$$.fragment,e),jt=a(e),ce=u(e,"P",{"data-svelte-h":!0}),d(ce)!=="svelte-vtoh1f"&&(ce.innerHTML=hl),Ct=a(e),o(me.$$.fragment,e),vt=a(e),fe=u(e,"P",{"data-svelte-h":!0}),d(fe)!=="svelte-14c26ht"&&(fe.innerHTML=_l),kt=a(e),o($e.$$.fragment,e),Rt=a(e),Me=u(e,"P",{"data-svelte-h":!0}),d(Me)!=="svelte-1yytiyu"&&(Me.textContent=jl),xt=a(e),o(ue.$$.fragment,e),Ht=a(e),de=u(e,"P",{"data-svelte-h":!0}),d(de)!=="svelte-1lmwzzc"&&(de.innerHTML=Cl),Wt=a(e),Te=u(e,"P",{"data-svelte-h":!0}),d(Te)!=="svelte-1h0qf0f"&&(Te.innerHTML=vl),Gt=a(e),o(ge.$$.fragment,e),It=a(e),Je=u(e,"P",{"data-svelte-h":!0}),d(Je)!=="svelte-pmu9yq"&&(Je.innerHTML=kl),Zt=a(e),o(ye.$$.fragment,e),Et=a(e),Ue=u(e,"P",{"data-svelte-h":!0}),d(Ue)!=="svelte-umpq8u"&&(Ue.innerHTML=Rl),Qt=a(e),o(we.$$.fragment,e),Vt=a(e),o(k.$$.fragment,e),Xt=a(e),be=u(e,"P",{"data-svelte-h":!0}),d(be)!=="svelte-kboajh"&&(be.innerHTML=xl),zt=a(e),he=u(e,"P",{"data-svelte-h":!0}),d(he)!=="svelte-1p27re0"&&(he.innerHTML=Hl),Yt=a(e),o(R.$$.fragment,e),Ft=a(e),o(_e.$$.fragment,e),At=a(e),je=u(e,"P",{"data-svelte-h":!0}),d(je)!=="svelte-1f5akmu"&&(je.textContent=Wl),Bt=a(e),o(Ce.$$.fragment,e),qt=a(e),o(ve.$$.fragment,e),Lt=a(e),o(ke.$$.fragment,e),Nt=a(e),o(Re.$$.fragment,e),Pt=a(e),o(xe.$$.fragment,e),St=a(e),o(He.$$.fragment,e),Dt=a(e),o(We.$$.fragment,e),Kt=a(e),o(Ge.$$.fragment,e),Ot=a(e),o(Ie.$$.fragment,e),el=a(e),o(Ze.$$.fragment,e),tl=a(e),o(Ee.$$.fragment,e),ll=a(e),o(Qe.$$.fragment,e),nl=a(e),o(x.$$.fragment,e),sl=a(e),o(Ve.$$.fragment,e),al=a(e),Fe=u(e,"P",{}),Yl(Fe).forEach(l),this.h()},h(){Fl(r,"name","hf:doc:metadata"),Fl(r,"content",on)},m(e,t){Pl(document.head,r),n(e,T,t),n(e,i,t),n(e,g,t),c(w,e,t),n(e,U,t),c(b,e,t),n(e,Ae,t),c(H,e,t),n(e,Be,t),c(W,e,t),n(e,qe,t),n(e,G,t),n(e,Le,t),c(_,e,t),n(e,Ne,t),n(e,I,t),n(e,Pe,t),c(Z,e,t),n(e,Se,t),c(E,e,t),n(e,De,t),n(e,Q,t),n(e,Ke,t),c(V,e,t),n(e,Oe,t),n(e,X,t),n(e,et,t),c(j,e,t),n(e,tt,t),n(e,z,t),n(e,lt,t),c(Y,e,t),n(e,nt,t),n(e,F,t),n(e,st,t),n(e,A,t),n(e,at,t),c(B,e,t),n(e,rt,t),n(e,q,t),n(e,it,t),c(C,e,t),n(e,pt,t),n(e,L,t),n(e,ot,t),c(N,e,t),n(e,ct,t),n(e,P,t),n(e,mt,t),n(e,S,t),n(e,ft,t),c(D,e,t),n(e,$t,t),n(e,K,t),n(e,Mt,t),c(O,e,t),n(e,ut,t),c(ee,e,t),n(e,dt,t),n(e,te,t),n(e,Tt,t),n(e,le,t),n(e,gt,t),c(ne,e,t),n(e,Jt,t),n(e,se,t),n(e,yt,t),c(ae,e,t),n(e,Ut,t),c(re,e,t),n(e,wt,t),c(v,e,t),n(e,bt,t),n(e,ie,t),n(e,ht,t),n(e,pe,t),n(e,_t,t),c(oe,e,t),n(e,jt,t),n(e,ce,t),n(e,Ct,t),c(me,e,t),n(e,vt,t),n(e,fe,t),n(e,kt,t),c($e,e,t),n(e,Rt,t),n(e,Me,t),n(e,xt,t),c(ue,e,t),n(e,Ht,t),n(e,de,t),n(e,Wt,t),n(e,Te,t),n(e,Gt,t),c(ge,e,t),n(e,It,t),n(e,Je,t),n(e,Zt,t),c(ye,e,t),n(e,Et,t),n(e,Ue,t),n(e,Qt,t),c(we,e,t),n(e,Vt,t),c(k,e,t),n(e,Xt,t),n(e,be,t),n(e,zt,t),n(e,he,t),n(e,Yt,t),c(R,e,t),n(e,Ft,t),c(_e,e,t),n(e,At,t),n(e,je,t),n(e,Bt,t),c(Ce,e,t),n(e,qt,t),c(ve,e,t),n(e,Lt,t),c(ke,e,t),n(e,Nt,t),c(Re,e,t),n(e,Pt,t),c(xe,e,t),n(e,St,t),c(He,e,t),n(e,Dt,t),c(We,e,t),n(e,Kt,t),c(Ge,e,t),n(e,Ot,t),c(Ie,e,t),n(e,el,t),c(Ze,e,t),n(e,tl,t),c(Ee,e,t),n(e,ll,t),c(Qe,e,t),n(e,nl,t),c(x,e,t),n(e,sl,t),c(Ve,e,t),n(e,al,t),n(e,Fe,t),rl=!0},p(e,[t]){const Gl={};t&1&&(Gl.fw=e[0]),w.$set(Gl);const Il={};t&2&&(Il.$$scope={dirty:t,ctx:e}),_.$set(Il);const Zl={};t&2&&(Zl.$$scope={dirty:t,ctx:e}),j.$set(Zl);const El={};t&2&&(El.$$scope={dirty:t,ctx:e}),C.$set(El);const Ql={};t&2&&(Ql.$$scope={dirty:t,ctx:e}),v.$set(Ql);const Vl={};t&2&&(Vl.$$scope={dirty:t,ctx:e}),k.$set(Vl);const Xl={};t&2&&(Xl.$$scope={dirty:t,ctx:e}),R.$set(Xl);const zl={};t&2&&(zl.$$scope={dirty:t,ctx:e}),x.$set(zl)},i(e){rl||(m(w.$$.fragment,e),m(b.$$.fragment,e),m(H.$$.fragment,e),m(W.$$.fragment,e),m(_.$$.fragment,e),m(Z.$$.fragment,e),m(E.$$.fragment,e),m(V.$$.fragment,e),m(j.$$.fragment,e),m(Y.$$.fragment,e),m(B.$$.fragment,e),m(C.$$.fragment,e),m(N.$$.fragment,e),m(D.$$.fragment,e),m(O.$$.fragment,e),m(ee.$$.fragment,e),m(ne.$$.fragment,e),m(ae.$$.fragment,e),m(re.$$.fragment,e),m(v.$$.fragment,e),m(oe.$$.fragment,e),m(me.$$.fragment,e),m($e.$$.fragment,e),m(ue.$$.fragment,e),m(ge.$$.fragment,e),m(ye.$$.fragment,e),m(we.$$.fragment,e),m(k.$$.fragment,e),m(R.$$.fragment,e),m(_e.$$.fragment,e),m(Ce.$$.fragment,e),m(ve.$$.fragment,e),m(ke.$$.fragment,e),m(Re.$$.fragment,e),m(xe.$$.fragment,e),m(He.$$.fragment,e),m(We.$$.fragment,e),m(Ge.$$.fragment,e),m(Ie.$$.fragment,e),m(Ze.$$.fragment,e),m(Ee.$$.fragment,e),m(Qe.$$.fragment,e),m(x.$$.fragment,e),m(Ve.$$.fragment,e),rl=!0)},o(e){f(w.$$.fragment,e),f(b.$$.fragment,e),f(H.$$.fragment,e),f(W.$$.fragment,e),f(_.$$.fragment,e),f(Z.$$.fragment,e),f(E.$$.fragment,e),f(V.$$.fragment,e),f(j.$$.fragment,e),f(Y.$$.fragment,e),f(B.$$.fragment,e),f(C.$$.fragment,e),f(N.$$.fragment,e),f(D.$$.fragment,e),f(O.$$.fragment,e),f(ee.$$.fragment,e),f(ne.$$.fragment,e),f(ae.$$.fragment,e),f(re.$$.fragment,e),f(v.$$.fragment,e),f(oe.$$.fragment,e),f(me.$$.fragment,e),f($e.$$.fragment,e),f(ue.$$.fragment,e),f(ge.$$.fragment,e),f(ye.$$.fragment,e),f(we.$$.fragment,e),f(k.$$.fragment,e),f(R.$$.fragment,e),f(_e.$$.fragment,e),f(Ce.$$.fragment,e),f(ve.$$.fragment,e),f(ke.$$.fragment,e),f(Re.$$.fragment,e),f(xe.$$.fragment,e),f(He.$$.fragment,e),f(We.$$.fragment,e),f(Ge.$$.fragment,e),f(Ie.$$.fragment,e),f(Ze.$$.fragment,e),f(Ee.$$.fragment,e),f(Qe.$$.fragment,e),f(x.$$.fragment,e),f(Ve.$$.fragment,e),rl=!1},d(e){e&&(l(T),l(i),l(g),l(U),l(Ae),l(Be),l(qe),l(G),l(Le),l(Ne),l(I),l(Pe),l(Se),l(De),l(Q),l(Ke),l(Oe),l(X),l(et),l(tt),l(z),l(lt),l(nt),l(F),l(st),l(A),l(at),l(rt),l(q),l(it),l(pt),l(L),l(ot),l(ct),l(P),l(mt),l(S),l(ft),l($t),l(K),l(Mt),l(ut),l(dt),l(te),l(Tt),l(le),l(gt),l(Jt),l(se),l(yt),l(Ut),l(wt),l(bt),l(ie),l(ht),l(pe),l(_t),l(jt),l(ce),l(Ct),l(vt),l(fe),l(kt),l(Rt),l(Me),l(xt),l(Ht),l(de),l(Wt),l(Te),l(Gt),l(It),l(Je),l(Zt),l(Et),l(Ue),l(Qt),l(Vt),l(Xt),l(be),l(zt),l(he),l(Yt),l(Ft),l(At),l(je),l(Bt),l(qt),l(Lt),l(Nt),l(Pt),l(St),l(Dt),l(Kt),l(Ot),l(el),l(tl),l(ll),l(nl),l(sl),l(al),l(Fe)),l(r),$(w,e),$(b,e),$(H,e),$(W,e),$(_,e),$(Z,e),$(E,e),$(V,e),$(j,e),$(Y,e),$(B,e),$(C,e),$(N,e),$(D,e),$(O,e),$(ee,e),$(ne,e),$(ae,e),$(re,e),$(v,e),$(oe,e),$(me,e),$($e,e),$(ue,e),$(ge,e),$(ye,e),$(we,e),$(k,e),$(R,e),$(_e,e),$(Ce,e),$(ve,e),$(ke,e),$(Re,e),$(xe,e),$(He,e),$(We,e),$(Ge,e),$(Ie,e),$(Ze,e),$(Ee,e),$(Qe,e),$(x,e),$(Ve,e)}}}const on='{"title":"Trainer API๋กœ ๋ชจ๋ธ ๋ฏธ์„ธ ์กฐ์ •ํ•˜๊ธฐ","local":"fine-tuning-a-model-with-the-trainer-api","sections":[{"title":"ํ›ˆ๋ จ","local":"training","sections":[],"depth":3},{"title":"ํ‰๊ฐ€","local":"evaluation","sections":[],"depth":3},{"title":"๊ณ ๊ธ‰ ํ›ˆ๋ จ ๊ธฐ๋Šฅ","local":"advanced-training-features","sections":[],"depth":3},{"title":"์„น์…˜ ํ€ด์ฆˆ","local":"section-quiz","sections":[{"title":"1. Trainer ์—์„œ <code> processing_class </code> ๋งค๊ฐœ๋ณ€์ˆ˜์˜ ๋ชฉ์ ์€ ๋ฌด์—‡์ธ๊ฐ€์š”?","local":"1-trainer-์—์„œ-code-processingclass-code-๋งค๊ฐœ๋ณ€์ˆ˜์˜-๋ชฉ์ ์€-๋ฌด์—‡์ธ๊ฐ€์š”","sections":[],"depth":3},{"title":"2. ํ›ˆ๋ จ ์ค‘ ํ‰๊ฐ€๊ฐ€ ์–ผ๋งˆ๋‚˜ ์ž์ฃผ ๋ฐœ์ƒํ•˜๋Š”์ง€๋ฅผ ์ œ์–ดํ•˜๋Š” TrainingArguments ๋งค๊ฐœ๋ณ€์ˆ˜๋Š” ๋ฌด์—‡์ธ๊ฐ€์š”?","local":"2-ํ›ˆ๋ จ-์ค‘-ํ‰๊ฐ€๊ฐ€-์–ผ๋งˆ๋‚˜-์ž์ฃผ-๋ฐœ์ƒํ•˜๋Š”์ง€๋ฅผ-์ œ์–ดํ•˜๋Š”-trainingarguments-๋งค๊ฐœ๋ณ€์ˆ˜๋Š”-๋ฌด์—‡์ธ๊ฐ€์š”","sections":[],"depth":3},{"title":"3. TrainingArguments์—์„œ <code> fp16=True </code> ๋Š” ๋ฌด์—‡์„ ํ™œ์„ฑํ™”ํ•˜๋‚˜์š”?","local":"3-trainingarguments์—์„œ-code-fp16true-code-๋Š”-๋ฌด์—‡์„-ํ™œ์„ฑํ™”ํ•˜๋‚˜์š”","sections":[],"depth":3},{"title":"4. Trainer์—์„œ <code> compute_metrics </code> ํ•จ์ˆ˜์˜ ์—ญํ• ์€ ๋ฌด์—‡์ธ๊ฐ€์š”?","local":"4-trainer์—์„œ-code-computemetrics-code-ํ•จ์ˆ˜์˜-์—ญํ• ์€-๋ฌด์—‡์ธ๊ฐ€์š”","sections":[],"depth":3},{"title":"5. Trainer์— <code> eval_dataset </code> ์„ ์ œ๊ณตํ•˜์ง€ ์•Š์œผ๋ฉด ์–ด๋–ป๊ฒŒ ๋˜๋‚˜์š”?","local":"5-trainer์—-code-evaldataset-code-์„-์ œ๊ณตํ•˜์ง€-์•Š์œผ๋ฉด-์–ด๋–ป๊ฒŒ-๋˜๋‚˜์š”","sections":[],"depth":3},{"title":"6. ๊ทธ๋ ˆ์ด๋””์–ธํŠธ ๋ˆ„์ ์ด๋ž€ ๋ฌด์—‡์ด๋ฉฐ ์–ด๋–ป๊ฒŒ ํ™œ์„ฑํ™”ํ•˜๋‚˜์š”?","local":"6-๊ทธ๋ ˆ์ด๋””์–ธํŠธ-๋ˆ„์ ์ด๋ž€-๋ฌด์—‡์ด๋ฉฐ-์–ด๋–ป๊ฒŒ-ํ™œ์„ฑํ™”ํ•˜๋‚˜์š”","sections":[],"depth":3}],"depth":2}],"depth":1}';function cn(J,r,T){let i="pt";return Bl(()=>{const g=new URLSearchParams(window.location.search);T(0,i=g.get("fw")||"pt")}),[i]}class yn extends ql{constructor(r){super(),Ll(this,r,cn,pn,Al,{})}}export{yn as component};

Xet Storage Details

Size:
45 kB
ยท
Xet hash:
9e2b3ce8a3d0cf2bfbf37d75f66cf57f741ca6503112f7b33bc25b9870b0db87

Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.