Buckets:

rtrm's picture
download
raw
43.6 kB
import{s as ql,o as Bl}from"../chunks/scheduler.505acc25.js";import{S as Al,i as Ll,e as M,s,c as i,h as Nl,a as f,d as l,b as a,f as Fl,g as r,j as d,k as y,l as Pl,m as n,n as p,t as o,o as c,p as m}from"../chunks/index.821724d0.js";import{C as Sl,H as T,E as Dl}from"../chunks/MermaidChart.svelte_svelte_type_style_lang.cee6bd49.js";import{Y as Ol}from"../chunks/Youtube.c5effbdd.js";import{C as u}from"../chunks/CodeBlock.9ca76b2e.js";import{C as Kl}from"../chunks/CourseFloatingBanner.415ffed3.js";import{Q as Xe}from"../chunks/Question.33cf0d1a.js";import{F as en}from"../chunks/FrameworkSwitchCourse.fd0863d0.js";function tn(rl){let $,Qe,g,Ve,J,Ye,k,Fe,v,qe,x,Be,R,Ae,H,pl='๐Ÿค— Transformers๋Š” <code>Trainer</code> ํด๋ž˜์Šค๋ฅผ ์ œ๊ณตํ•ฉ๋‹ˆ๋‹ค. ์ด ํด๋ž˜์Šค๋ฅผ ์‚ฌ์šฉํ•˜๋ฉด ์‚ฌ์ „ ํ•™์Šต๋œ ๋ชจ๋ธ์„ ์—ฌ๋Ÿฌ๋ถ„์˜ ๋ฐ์ดํ„ฐ์…‹์— ๋งž์ถฐ ์ตœ์‹  ๊ธฐ๋ฒ•์œผ๋กœ ์‰ฝ๊ฒŒ ๋ฏธ์„ธ ์กฐ์ •ํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค. ์ด์ „ ์„น์…˜์—์„œ ๋ฐ์ดํ„ฐ ์ „์ฒ˜๋ฆฌ ์ž‘์—…์„ ๋ชจ๋‘ ๋งˆ์ณค๋‹ค๋ฉด ์ด์ œ ๋ช‡ ๋‹จ๊ณ„๋งŒ ๊ฑฐ์น˜๋ฉด <code>Trainer</code>๋ฅผ ์ •์˜ํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค. ๊ฐ€์žฅ ์–ด๋ ค์šด ๋ถ€๋ถ„์€ <code>Trainer.train()</code>์„ ์‹คํ–‰ํ•  ํ™˜๊ฒฝ์„ ์ค€๋น„ํ•˜๋Š” ๊ณผ์ •์ผ ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค. ์ด ์ž‘์—…์€ CPU์—์„œ ๋งค์šฐ ๋А๋ฆฌ๊ฒŒ ์‹คํ–‰๋˜๊ธฐ ๋•Œ๋ฌธ์ž…๋‹ˆ๋‹ค. ๋งŒ์•ฝ GPU๊ฐ€ ์—†๋‹ค๋ฉด <a href="https://colab.research.google.com/" rel="nofollow">Google Colab</a>์—์„œ ๋ฌด๋ฃŒ๋กœ ์ œ๊ณตํ•˜๋Š” GPU๋‚˜ TPU๋ฅผ ์ด์šฉํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค.',Le,U,ol='<p>๐Ÿ“š <strong>ํ›ˆ๋ จ ๋ฆฌ์†Œ์Šค</strong>: ํ›ˆ๋ จ์„ ์‹œ์ž‘ํ•˜๊ธฐ ์ „์— ํฌ๊ด„์ ์ธ <a href="https://huggingface.co/docs/transformers/main/en/training" rel="nofollow">๐Ÿค— Transformers ํ›ˆ๋ จ ๊ฐ€์ด๋“œ</a>๋ฅผ ์ˆ™์ง€ํ•˜๊ณ  <a href="https://huggingface.co/learn/cookbook/en/fine_tuning_code_llm_on_single_gpu" rel="nofollow">๋ฏธ์„ธ ์กฐ์ • ์ฟก๋ถ</a>์˜ ์‹ค์šฉ์ ์ธ ์˜ˆ์ œ๋ฅผ ์‚ดํŽด๋ณด์„ธ์š”.</p>',Ne,W,cl="์•„๋ž˜ ์ฝ”๋“œ ์˜ˆ์‹œ๋Š” ์ด์ „ ์„น์…˜์˜ ์ฝ”๋“œ๋ฅผ ๋ชจ๋‘ ์‹คํ–‰ํ–ˆ๋‹ค๋Š” ๊ฐ€์ •ํ•˜์— ์ž‘๋™ํ•ฉ๋‹ˆ๋‹ค. ์ฆ‰, ๋‹ค์Œ ์‚ฌํ•ญ๋“ค์ด ํ•„์š”ํ•ฉ๋‹ˆ๋‹ค.",Pe,G,Se,I,De,Z,ml="<code>Trainer</code>๋ฅผ ์ •์˜ํ•˜๊ธฐ ์ „ ์ฒซ ๋ฒˆ์งธ ๋‹จ๊ณ„๋Š” <code>Trainer</code>๊ฐ€ ํ›ˆ๋ จ ๋ฐ ํ‰๊ฐ€์— ์‚ฌ์šฉํ•  ๋ชจ๋“  ํ•˜์ดํผํŒŒ๋ผ๋ฏธํ„ฐ๋ฅผ ๋‹ด์„<code>TrainingArguments</code> ํด๋ž˜์Šค๋ฅผ ์ •์˜ํ•˜๋Š” ๊ฒƒ์ž…๋‹ˆ๋‹ค. ํ•„์ˆ˜๋กœ ์ œ๊ณตํ•ด์•ผ ํ•˜๋Š” ์œ ์ผํ•œ ์ธ์ˆ˜๋Š” ํ›ˆ๋ จ๋œ ๋ชจ๋ธ๊ณผ ์ค‘๊ฐ„ ์ฒดํฌํฌ์ธํŠธ๊ฐ€ ์ €์žฅ๋  ๋””๋ ‰ํ† ๋ฆฌ์ž…๋‹ˆ๋‹ค. ๋‚˜๋จธ์ง€๋Š” ๊ธฐ๋ณธ๊ฐ’์œผ๋กœ ๋‘˜ ์ˆ˜ ์žˆ์œผ๋ฉฐ, ๊ธฐ๋ณธ์ ์ธ ๋ฏธ์„ธ ์กฐ์ • ์ž‘์—…์—๋Š” ์ถฉ๋ถ„ํ•œ ์„ค์ •์ž…๋‹ˆ๋‹ค.",Oe,E,Ke,Q,Ml='ํ›ˆ๋ จ ์ค‘์— ๋ชจ๋ธ์„ Hub์— ์ž๋™์œผ๋กœ ์—…๋กœ๋“œํ•˜๋ ค๋ฉด <code>TrainingArguments</code>์—์„œ <code>push_to_hub=True</code>๋ฅผ ์ „๋‹ฌํ•˜์„ธ์š”. ์ด ๊ธฐ๋Šฅ์— ๋Œ€ํ•ด์„œ๋Š” <a href="/course/chapter4/3">Chapter 4</a>์—์„œ ์ž์„ธํžˆ ์•Œ์•„๋ณด๊ฒ ์Šต๋‹ˆ๋‹ค.',et,b,fl='<p>๐Ÿš€ <strong>๊ณ ๊ธ‰ ์„ค์ •</strong>: ์‚ฌ์šฉ ๊ฐ€๋Šฅํ•œ ๋ชจ๋“  ํ›ˆ๋ จ ์ธ์ˆ˜์™€ ์ตœ์ ํ™” ์ „๋žต์— ๋Œ€ํ•œ ์ž์„ธํ•œ ์ •๋ณด๋Š” <a href="https://huggingface.co/docs/transformers/main/en/main_classes/trainer#transformers.TrainingArguments" rel="nofollow">TrainingArguments ๋ฌธ์„œ</a>์™€ <a href="https://huggingface.co/learn/cookbook/en/fine_tuning_code_llm_on_single_gpu" rel="nofollow">ํ›ˆ๋ จ ๊ตฌ์„ฑ ์ฟก๋ถ</a>์„ ์ฐธ๊ณ ํ•˜์„ธ์š”.</p>',tt,V,dl='๋‘ ๋ฒˆ์งธ ๋‹จ๊ณ„๋Š” ๋ชจ๋ธ์„ ์ •์˜ํ•˜๋Š” ๊ฒƒ์ž…๋‹ˆ๋‹ค. <a href="/course/chapter2">์ด์ „ ์ฑ•ํ„ฐ</a>์—์„œ์™€ ๊ฐ™์ด ๋‘ ๊ฐœ์˜ ๋ผ๋ฒจ๊ณผ ํ•จ๊ป˜ <code>AutoModelForSequenceClassification</code> ํด๋ž˜์Šค๋ฅผ ์‚ฌ์šฉํ•˜๊ฒ ์Šต๋‹ˆ๋‹ค.',lt,X,nt,z,ul='<a href="/course/chapter2">Chapter 2</a>์™€ ๋‹ฌ๋ฆฌ ์ด ์‚ฌ์ „ ํ›ˆ๋ จ๋œ ๋ชจ๋ธ์„ ์ธ์Šคํ„ด์Šคํ™”ํ•˜๋ฉด ๊ฒฝ๊ณ  ๋ฉ”์‹œ์ง€๊ฐ€ ๋‚˜ํƒ€๋‚˜๋Š” ๊ฒƒ์„ ํ™•์ธํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค. ์ด๋Š” BERT๊ฐ€ ๋ฌธ์žฅ ์Œ ๋ถ„๋ฅ˜๋ฅผ ์œ„ํ•ด ์‚ฌ์ „ ํ›ˆ๋ จ๋˜์ง€ ์•Š์•˜๊ธฐ ๋•Œ๋ฌธ์—, ์‚ฌ์ „ ํ›ˆ๋ จ๋œ ๋ชจ๋ธ์˜ ํ—ค๋“œ๊ฐ€ ์ œ๊ฑฐ๋˜๊ณ  ์‹œํ€€์Šค ๋ถ„๋ฅ˜์— ์ ํ•ฉํ•œ ์ƒˆ๋กœ์šด ํ—ค๋“œ๊ฐ€ ์ถ”๊ฐ€๋˜์—ˆ๊ธฐ ๋•Œ๋ฌธ์ž…๋‹ˆ๋‹ค. ๊ฒฝ๊ณ ๋Š” ์ผ๋ถ€ ๊ฐ€์ค‘์น˜(์ œ๊ฑฐ๋œ ์‚ฌ์ „ ํ›ˆ๋ จ ํ—ค๋“œ์— ํ•ด๋‹นํ•˜๋Š” ๊ฐ€์ค‘์น˜)๊ฐ€ ์‚ฌ์šฉ๋˜์ง€ ์•Š์•˜๊ณ , ์ผ๋ถ€ ๋‹ค๋ฅธ ๊ฐ€์ค‘์น˜(์ƒˆ๋กœ์šด ํ—ค๋“œ์šฉ)๊ฐ€ ๋ฌด์ž‘์œ„๋กœ ์ดˆ๊ธฐํ™”๋˜์—ˆ๋‹ค๋Š” ๊ฒƒ์„ ๋‚˜ํƒ€๋ƒ…๋‹ˆ๋‹ค. ๋งˆ์ง€๋ง‰์œผ๋กœ ๋ชจ๋ธ์„ ํ›ˆ๋ จ์‹œํ‚ค๋ผ๋Š” ๋ฉ”์‹œ์ง€๊ฐ€ ๋‚˜์˜ค๋Š”๋ฐ, ๋ฐ”๋กœ ์ง€๊ธˆ๋ถ€ํ„ฐ ๊ทธ ์ž‘์—…์„ ์‹œ์ž‘ํ•˜๊ฒ ์Šต๋‹ˆ๋‹ค.',st,Y,Tl="๋ชจ๋ธ์ด ์ค€๋น„๋˜๋ฉด, ์ง€๊ธˆ๊นŒ์ง€ ๊ตฌ์„ฑํ•œ ๋ชจ๋“  ๊ฐ์ฒด(<code>model</code>, <code>training_args</code>, ํ›ˆ๋ จ ๋ฐ ๊ฒ€์ฆ ๋ฐ์ดํ„ฐ์…‹, <code>data_collator</code>, <code>processing_class</code>)๋ฅผ ์ „๋‹ฌํ•˜์—ฌ <code>Trainer</code>๋ฅผ ์ •์˜ํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค. <code>processing_class</code> ๋งค๊ฐœ๋ณ€์ˆ˜๋Š” ๋น„๊ต์  ์ตœ๊ทผ์— ์ถ”๊ฐ€๋œ ๊ธฐ๋Šฅ์œผ๋กœ, <code>Trainer</code>์—๊ฒŒ ์–ด๋–ค ํ† ํฌ๋‚˜์ด์ €๋ฅผ ์‚ฌ์šฉํ•ด ๋ฐ์ดํ„ฐ๋ฅผ ์ฒ˜๋ฆฌํ• ์ง€ ์•Œ๋ ค์ค๋‹ˆ๋‹ค.",at,F,it,q,$l="<code>processing_class</code>์— ํ† ํฌ๋‚˜์ด์ €๋ฅผ ์ „๋‹ฌํ•˜๋ฉด, <code>Trainer</code>๊ฐ€ ๊ธฐ๋ณธ์ ์œผ๋กœ <code>DataCollatorWithPadding</code>์„ <code>data_collator</code>๋กœ ์‚ฌ์šฉํ•ฉ๋‹ˆ๋‹ค. ๋”ฐ๋ผ์„œ ์ด ๊ฒฝ์šฐ์—๋Š” <code>data_collator=data_collator</code> ์ค„์„ ์ƒ๋žตํ•  ์ˆ˜ ์žˆ์ง€๋งŒ, ๋ฐ์ดํ„ฐ ์ฒ˜๋ฆฌ ํŒŒ์ดํ”„๋ผ์ธ์˜ ์ค‘์š”ํ•œ ๋ถ€๋ถ„์„ ๋ณด์—ฌ๋“œ๋ฆฌ๊ธฐ ์œ„ํ•ด ์ฝ”๋“œ์— ํฌํ•จํ–ˆ์Šต๋‹ˆ๋‹ค.",rt,w,yl='<p>๐Ÿ“– <strong>๋” ์ž์„ธํžˆ ์•Œ์•„๋ณด๊ธฐ</strong>: Trainer ํด๋ž˜์Šค์™€ ๊ทธ ๋งค๊ฐœ๋ณ€์ˆ˜์— ๋Œ€ํ•œ ์ž์„ธํ•œ ๋‚ด์šฉ์€ <a href="https://huggingface.co/docs/transformers/main/en/main_classes/trainer" rel="nofollow">Trainer API ๋ฌธ์„œ</a>๋ฅผ ๋ฐฉ๋ฌธํ•˜๊ณ  <a href="https://huggingface.co/learn/cookbook/en/fine_tuning_code_llm_on_single_gpu" rel="nofollow">ํ›ˆ๋ จ ์ฟก๋ถ ๋ ˆ์‹œํ”ผ</a>์—์„œ ๊ณ ๊ธ‰ ์‚ฌ์šฉ ํŒจํ„ด์„ ์‚ดํŽด๋ณด์„ธ์š”.</p>',pt,B,gl="๋ฐ์ดํ„ฐ์…‹์—์„œ ๋ชจ๋ธ์„ ๋ฏธ์„ธ ์กฐ์ •ํ•˜๋ ค๋ฉด <code>Trainer</code>์˜ <code>train()</code> ๋ฉ”์†Œ๋“œ๋ฅผ ํ˜ธ์ถœํ•˜๊ธฐ๋งŒ ํ•˜๋ฉด ๋ฉ๋‹ˆ๋‹ค.",ot,A,ct,L,Jl="์ด๋ ‡๊ฒŒ ํ•˜๋ฉด ๋ฏธ์„ธ ์กฐ์ •์ด ์‹œ์ž‘๋ฉ๋‹ˆ๋‹ค(GPU์—์„œ๋Š” ๋ช‡ ๋ถ„ ์ •๋„ ์†Œ์š”๋ฉ๋‹ˆ๋‹ค). 500๋‹จ๊ณ„๋งˆ๋‹ค ํ›ˆ๋ จ ์†์‹ค์ด ์ถœ๋ ฅ๋˜์ง€๋งŒ, ๋ชจ๋ธ์˜ ์„ฑ๋Šฅ์ด ์–ผ๋งˆ๋‚˜ ์ข‹์€์ง€(๋˜๋Š” ๋‚˜์œ์ง€)๋Š” ์•Œ๋ ค์ฃผ์ง€ ์•Š์Šต๋‹ˆ๋‹ค. ๊ทธ ์ด์œ ๋Š” ๋‹ค์Œ๊ณผ ๊ฐ™์Šต๋‹ˆ๋‹ค.",mt,N,Ul="<li><code>TrainingArguments</code>์—์„œ <code>eval_strategy</code>๋ฅผ <code>&quot;steps&quot;</code> (๋งค <code>eval_steps</code>๋งˆ๋‹ค ํ‰๊ฐ€) ๋˜๋Š” <code>&quot;epoch&quot;</code> (๊ฐ ์—ํฌํฌ ์ข…๋ฃŒ ์‹œ ํ‰๊ฐ€)๋กœ ์„ค์ •ํ•˜์ง€ ์•Š์•˜์Šต๋‹ˆ๋‹ค.</li> <li>ํ‰๊ฐ€ ์ค‘์— ๋ฉ”ํŠธ๋ฆญ์„ ๊ณ„์‚ฐํ•˜๊ธฐ ์œ„ํ•œ <code>compute_metrics()</code> ํ•จ์ˆ˜๋ฅผ <code>Trainer</code>์— ์ œ๊ณตํ•˜์ง€ ์•Š์•˜์Šต๋‹ˆ๋‹ค. ์ด ํ•จ์ˆ˜๊ฐ€ ์—†์œผ๋ฉด ํ‰๊ฐ€์—์„œ ์†์‹ค ๊ฐ’๋งŒ ์ถœ๋ ฅ๋˜๋Š”๋ฐ, ์ด ๊ฐ’๋งŒ์œผ๋กœ๋Š” ์„ฑ๋Šฅ์„ ํŒŒ์•…ํ•˜๊ธฐ ์–ด๋ ต์Šต๋‹ˆ๋‹ค.</li>",Mt,P,ft,S,bl="์ด์ œ ์œ ์šฉํ•œ <code>compute_metrics()</code> ํ•จ์ˆ˜๋ฅผ ์–ด๋–ป๊ฒŒ ๋งŒ๋“ค๊ณ  ๋‹ค์Œ ํ›ˆ๋ จ ์‹œ ์‚ฌ์šฉํ•  ์ˆ˜ ์žˆ๋Š”์ง€ ์•Œ์•„๋ณด๊ฒ ์Šต๋‹ˆ๋‹ค. ์ด ํ•จ์ˆ˜๋Š” <code>EvalPrediction</code> ๊ฐ์ฒด(<code>predictions</code> ํ•„๋“œ์™€ <code>label_ids</code> ํ•„๋“œ๋ฅผ ๊ฐ–๋Š” ๋ช…๋ช…๋œ ํŠœํ”Œ)๋ฅผ ์ž…๋ ฅ๋ฐ›์Šต๋‹ˆ๋‹ค. ๊ทธ๋ฆฌ๊ณ  ๊ฐ ๋ฉ”ํŠธ๋ฆญ์˜ ์ด๋ฆ„์„ ํ‚ค(๋ฌธ์ž์—ด)๋กœ, ์„ฑ๋Šฅ์„ ๊ฐ’(๋ถ€๋™์†Œ์ˆ˜์ )์œผ๋กœ ๊ฐ–๋Š” ๋”•์…”๋„ˆ๋ฆฌ๋ฅผ ๋ฐ˜ํ™˜ํ•ด์•ผ ํ•ฉ๋‹ˆ๋‹ค. ๋ชจ๋ธ์˜ ์˜ˆ์ธก๊ฐ’์„ ์–ป๊ธฐ ์œ„ํ•ด <code>Trainer.predict()</code>๋ฅผ ์‚ฌ์šฉํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค.",dt,D,ut,O,Tt,K,wl="<code>predict()</code> ๋ฉ”์†Œ๋“œ์˜ ์ถœ๋ ฅ์€ <code>predictions</code>, <code>label_ids</code>, <code>metrics</code> ์„ธ ๊ฐœ์˜ ํ•„๋“œ๊ฐ€ ์žˆ๋Š” ๋˜ ๋‹ค๋ฅธ ๋ช…๋ช…๋œ ํŠœํ”Œ์ž…๋‹ˆ๋‹ค. <code>metrics</code> ํ•„๋“œ์—๋Š” ์ „๋‹ฌ๋œ ๋ฐ์ดํ„ฐ์…‹์— ๋Œ€ํ•œ ์†์‹ค ๊ฐ’๊ณผ ์‹œ๊ฐ„ ๊ด€๋ จ ๋ฉ”ํŠธ๋ฆญ(์ด ์˜ˆ์ธก ์‹œ๊ฐ„, ํ‰๊ท  ์˜ˆ์ธก ์‹œ๊ฐ„)๋งŒ ํฌํ•จ๋ฉ๋‹ˆ๋‹ค. ํ•˜์ง€๋งŒ <code>compute_metrics()</code> ํ•จ์ˆ˜๋ฅผ ์™„์„ฑํ•˜์—ฌ <code>Trainer</code>์— ์ „๋‹ฌํ•˜๋ฉด, ์ด ํ•„๋“œ์— <code>compute_metrics()</code>๊ฐ€ ๋ฐ˜ํ™˜ํ•˜๋Š” ๋ฉ”ํŠธ๋ฆญ๋“ค๋„ ํ•จ๊ป˜ ํฌํ•จ๋ฉ๋‹ˆ๋‹ค.",$t,ee,hl='๋ณด์‹œ๋‹ค์‹œํ”ผ, <code>predictions</code>๋Š” 408 x 2 ๋ชจ์–‘์˜ 2์ฐจ์› ๋ฐฐ์—ด์ž…๋‹ˆ๋‹ค (408์€ predict()์— ์ „๋‹ฌํ•œ ๋ฐ์ดํ„ฐ์…‹์˜ ์ƒ˜ํ”Œ ๊ฐœ์ˆ˜์ž…๋‹ˆ๋‹ค). ์ด ๊ฐ’๋“ค์€ <code>predict()</code>์— ์ „๋‹ฌํ•œ ๋ฐ์ดํ„ฐ์…‹์˜ ๊ฐ ์ƒ˜ํ”Œ์— ๋Œ€ํ•œ ๋กœ์ง“์ž…๋‹ˆ๋‹ค (<a href="/course/chapter2">์ด์ „ ์ฑ•ํ„ฐ</a>์—์„œ ๋ณด์•˜๋“ฏ์ด ๋ชจ๋“  Transformer ๋ชจ๋ธ์€ ๋กœ์ง“์„ ๋ฐ˜ํ™˜ํ•ฉ๋‹ˆ๋‹ค). ์ด ๋กœ์ง“์„ ์šฐ๋ฆฌ๊ฐ€ ๊ฐ€์ง„ ๋ ˆ์ด๋ธ”๊ณผ ๋น„๊ตํ•  ์ˆ˜ ์žˆ๋Š” ์˜ˆ์ธก๊ฐ’์œผ๋กœ ๋ณ€ํ™˜ํ•˜๋ ค๋ฉด, ๋‘ ๋ฒˆ์งธ ์ถ•์—์„œ ์ตœ๋Œ“๊ฐ’์„ ๊ฐ€์ง„ ์ธ๋ฑ์Šค๋ฅผ ๊ตฌํ•ด์•ผ ํ•ฉ๋‹ˆ๋‹ค.',yt,te,gt,le,jl='์ด์ œ ์ด <code>preds</code>๋ฅผ ๋ผ๋ฒจ๊ณผ ๋น„๊ตํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค. <code>compute_metric()</code> ํ•จ์ˆ˜๋ฅผ ๋นŒ๋“œํ•˜๊ธฐ ์œ„ํ•ด ๐Ÿค— <a href="https://github.com/huggingface/evaluate/" rel="nofollow">Evaluate</a> ๋ผ์ด๋ธŒ๋Ÿฌ๋ฆฌ์˜ ๋ฉ”ํŠธ๋ฆญ์„ ํ™œ์šฉํ•˜๊ฒ ์Šต๋‹ˆ๋‹ค. ๋ฐ์ดํ„ฐ์…‹์„ ๋กœ๋“œํ–ˆ๋˜ ๊ฒƒ์ฒ˜๋Ÿผ, MRPC ๋ฐ์ดํ„ฐ์…‹๊ณผ ๊ด€๋ จ๋œ ๋ฉ”ํŠธ๋ฆญ๋„ <code>evaluate.load()</code> ํ•จ์ˆ˜๋กœ ์‰ฝ๊ฒŒ ๋กœ๋“œํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค. ๋ฐ˜ํ™˜๋œ ๊ฐ์ฒด์˜ <code>compute()</code> ๋ฉ”์„œ๋“œ๋ฅผ ์‚ฌ์šฉํ•ด ๋ฉ”ํŠธ๋ฆญ์„ ๊ณ„์‚ฐํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค.',Jt,ne,Ut,se,bt,h,_l='<p>๋‹ค์–‘ํ•œ ํ‰๊ฐ€ ๋ฉ”ํŠธ๋ฆญ๊ณผ ์ „๋žต์— ๋Œ€ํ•ด ์•Œ์•„๋ณด๋ ค๋ฉด <a href="https://huggingface.co/docs/evaluate/" rel="nofollow">๐Ÿค— Evaluate ๋ฌธ์„œ</a>๋ฅผ ์ฐธ๊ณ ํ•˜์„ธ์š”.</p>',wt,ae,Cl='๋ชจ๋ธ ํ—ค๋“œ์˜ ๊ฐ€์ค‘์น˜๊ฐ€ ๋ฌด์ž‘์œ„๋กœ ์ดˆ๊ธฐํ™”๋˜๊ธฐ ๋•Œ๋ฌธ์— ์–ป๊ฒŒ ๋˜๋Š” ๊ฒฐ๊ณผ๋Š” ์กฐ๊ธˆ์”ฉ ๋‹ค๋ฅผ ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค. ๊ฒฐ๊ณผ๋ฅผ ๋ณด๋ฉด ์šฐ๋ฆฌ ๋ชจ๋ธ์ด ๊ฒ€์ฆ ์„ธํŠธ์—์„œ 85.78%์˜ ์ •ํ™•๋„์™€ 89.97%์˜ F1 ์ ์ˆ˜๋ฅผ ๋‹ฌ์„ฑํ–ˆ์Œ์„ ๋ณผ ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค. ์ด ๋‘ ๊ฐ€์ง€๋Š” GLUE ๋ฒค์น˜๋งˆํฌ์˜ MRPC ๋ฐ์ดํ„ฐ์…‹์—์„œ ๊ฒฐ๊ณผ๋ฅผ ํ‰๊ฐ€ํ•˜๋Š” ๋ฐ ์‚ฌ์šฉ๋˜๋Š” ๋ฉ”ํŠธ๋ฆญ์ž…๋‹ˆ๋‹ค. <a href="https://arxiv.org/pdf/1810.04805.pdf" rel="nofollow">BERT ๋…ผ๋ฌธ</a>์—์„œ๋Š” ๊ธฐ๋ณธ ๋ชจ๋ธ์˜ F1 ์ ์ˆ˜๋ฅผ 88.9๋กœ ๋ณด๊ณ ํ•˜์˜€์Šต๋‹ˆ๋‹ค. ๋‹น์‹œ์—๋Š” <code>uncased</code> ๋ชจ๋ธ์„ ์‚ฌ์šฉํ–ˆ์ง€๋งŒ, ์šฐ๋ฆฌ๋Š” ํ˜„์žฌ <code>cased</code> ๋ชจ๋ธ์„ ์‚ฌ์šฉํ•˜๊ณ  ์žˆ๊ธฐ ๋•Œ๋ฌธ์— ๋” ๋‚˜์€ ๊ฒฐ๊ณผ๊ฐ€ ๋‚˜์˜จ ๊ฒƒ์ž…๋‹ˆ๋‹ค.',ht,ie,kl="์ด ๋ชจ๋“  ๊ฒƒ์„ ์ข…ํ•ฉํ•˜๋ฉด, ๋‹ค์Œ์ฒ˜๋Ÿผ <code>compute_metrics()</code> ํ•จ์ˆ˜๋ฅผ ๋‹ค์Œ๊ณผ ๊ฐ™์ด ์ •์˜ํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค.",jt,re,_t,pe,vl="๊ฐ ์—ํญ์ด ๋๋‚  ๋•Œ๋งˆ๋‹ค ๋ฉ”ํŠธ๋ฆญ์ด ์ถœ๋ ฅ๋˜๋„๋ก, ์ด <code>compute_metrics()</code> ํ•จ์ˆ˜๊ฐ€ ํฌํ•จํ•˜์—ฌ <code>Trainer</code>๋ฅผ ์ƒˆ๋กœ ์ •์˜ํ•ด ๋ณด๊ฒ ์Šต๋‹ˆ๋‹ค.",Ct,oe,kt,ce,xl="์ฐธ๊ณ ๋กœ, ์šฐ๋ฆฌ๋Š” <code>eval_strategy</code>๋ฅผ <code>&quot;epoch&quot;</code>์œผ๋กœ ์„ค์ •ํ•œ ์ƒˆ๋กœ์šด <code>TrainingArguments</code>์™€ ์ƒˆ๋กœ์šด ๋ชจ๋ธ์„ ์ƒ์„ฑํ•ฉ๋‹ˆ๋‹ค. ์ด๋ ‡๊ฒŒ ํ•˜์ง€ ์•Š์œผ๋ฉด ์ด๋ฏธ ํ›ˆ๋ จ๋œ ๋ชจ๋ธ์˜ ํ›ˆ๋ จ์„ ๊ณ„์†ํ•˜๊ฒŒ ๋  ๊ฒ๋‹ˆ๋‹ค. ์ƒˆ๋กœ์šด ํ›ˆ๋ จ์„ ์‹œ์ž‘ํ•˜๋ ค๋ฉด ๋‹ค์Œ์„ ์‹คํ–‰ํ•˜์„ธ์š”.",vt,me,xt,Me,Rl="์ด๋ฒˆ์—๋Š” ํ›ˆ๋ จ ์†์‹ค ์™ธ์—๋„ ๊ฐ ์—ํญ์ด ๋๋‚  ๋•Œ๋งˆ๋‹ค ๊ฒ€์ฆ ์†์‹ค๊ณผ ๋ฉ”ํŠธ๋ฆญ์ด ํ•จ๊ป˜ ์ถœ๋ ฅ๋  ๊ฒ๋‹ˆ๋‹ค. ์•ž์„œ ๋งํ–ˆ๋“ฏ์ด ๋ชจ๋ธ ํ—ค๋“œ์˜ ๋ฌด์ž‘์œ„ ์ดˆ๊ธฐํ™” ๋•Œ๋ฌธ์— ์—ฌ๋Ÿฌ๋ถ„์ด ์–ป๋Š” ์ •ํ™•๋„/F1 ์ ์ˆ˜๋Š” ์šฐ๋ฆฌ๊ฐ€ ์–ป์€ ๊ฒฐ๊ณผ์™€ ์•ฝ๊ฐ„ ๋‹ค๋ฅผ ์ˆ˜ ์žˆ์ง€๋งŒ, ๋น„์Šทํ•œ ๋ฒ”์œ„์— ์žˆ์„ ๊ฒ๋‹ˆ๋‹ค.",Rt,fe,Ht,de,Hl="<code>Trainer</code>๋Š” ํ˜„๋Œ€ ๋”ฅ๋Ÿฌ๋‹์˜ ๋ชจ๋ฒ” ์‚ฌ๋ก€๋“ค์„ ์‰ฝ๊ฒŒ ํ™œ์šฉํ•  ์ˆ˜ ์žˆ๋„๋ก ๋‹ค์–‘ํ•œ ๋‚ด์žฅ ๊ธฐ๋Šฅ์„ ์ œ๊ณตํ•ฉ๋‹ˆ๋‹ค.",Wt,ue,Wl="<strong>ํ˜ผํ•ฉ ์ •๋ฐ€๋„ ํ›ˆ๋ จ</strong>: ๋” ๋น ๋ฅธ ํ›ˆ๋ จ๊ณผ ๋ฉ”๋ชจ๋ฆฌ ์‚ฌ์šฉ๋Ÿ‰ ๊ฐ์†Œ๋ฅผ ์œ„ํ•ด ํ›ˆ๋ จ ์ธ์ˆ˜์—์„œ <code>fp16=True</code>๋ฅผ ์„ค์ •ํ•˜์„ธ์š”.",Gt,Te,It,$e,Gl="<strong>๊ทธ๋ ˆ์ด๋””์–ธํŠธ ๋ˆ„์ </strong>: GPU ๋ฉ”๋ชจ๋ฆฌ๊ฐ€ ๋ถ€์กฑํ•  ๋•Œ ๋” ํฐ ๋ฐฐ์น˜ ํฌ๊ธฐ๋กœ ํ•™์Šตํ•˜๋Š” ํšจ๊ณผ๋ฅผ ๋‚ผ ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค.",Zt,ye,Et,ge,Il="<strong>ํ•™์Šต๋ฅ  ์Šค์ผ€์ค„๋ง</strong>: Trainer๋Š” ๊ธฐ๋ณธ์ ์œผ๋กœ ์„ ํ˜• ๊ฐ์†Œ ๋ฐฉ์‹์„ ์‚ฌ์šฉํ•˜์ง€๋งŒ, ์‚ฌ์šฉ์ž ๋งž์ถค ์„ค์ •์ด ๊ฐ€๋Šฅํ•ฉ๋‹ˆ๋‹ค.",Qt,Je,Vt,j,Zl='<p>๐ŸŽฏ <strong>์„ฑ๋Šฅ ์ตœ์ ํ™”</strong>: ๋ถ„์‚ฐ ํ›ˆ๋ จ, ๋ฉ”๋ชจ๋ฆฌ ์ตœ์ ํ™”, ํ•˜๋“œ์›จ์–ด๋ณ„ ์ตœ์ ํ™”๋ฅผ ํฌํ•จํ•œ ๊ณ ๊ธ‰ ํ›ˆ๋ จ ๊ธฐ์ˆ ์— ๋Œ€ํ•ด์„œ๋Š” <a href="https://huggingface.co/docs/transformers/main/en/performance" rel="nofollow">๐Ÿค— Transformers ์„ฑ๋Šฅ ๊ฐ€์ด๋“œ</a>๋ฅผ ์‚ดํŽด๋ณด์„ธ์š”.</p>',Xt,Ue,El="<code>Trainer</code>๋Š” ์—ฌ๋Ÿฌ GPU ๋˜๋Š” TPU์—์„œ ์ฆ‰์‹œ ์ž‘๋™ํ•˜๋ฉฐ ๋ถ„์‚ฐ ํ›ˆ๋ จ์„ ์œ„ํ•œ ๋งŽ์€ ์˜ต์…˜์„ ์ œ๊ณตํ•ฉ๋‹ˆ๋‹ค. ์ด์™€ ๊ด€๋ จ๋œ ๋ชจ๋“  ๋‚ด์šฉ์€ Chapter 10์—์„œ ๋‹ค๋ฃจ๊ฒ ์Šต๋‹ˆ๋‹ค.",zt,be,Ql='์ด๊ฒƒ์œผ๋กœ <code>Trainer</code> API๋ฅผ ์‚ฌ์šฉํ•œ ๋ฏธ์„ธ ์กฐ์ • ์†Œ๊ฐœ๋ฅผ ๋งˆ์นฉ๋‹ˆ๋‹ค. ๋Œ€๋ถ€๋ถ„์˜ ์ผ๋ฐ˜์ ์ธ NLP ์ž‘์—…์— ๋Œ€ํ•œ ์˜ˆ์ œ๋Š” <a href="/course/chapter7">Chapter 7</a>์—์„œ ๋‹ค๋ฃฐ ์˜ˆ์ •์ด๋ฉฐ, ๋‹ค์Œ์œผ๋กœ๋Š” ์ˆœ์ˆ˜ PyTorch ์ฝ”๋“œ๋กœ ๋™์ผํ•œ ์ž‘์—…์„ ์ˆ˜ํ–‰ํ•˜๋Š” ๋ฐฉ๋ฒ•์„ ์‚ดํŽด๋ณด๊ฒ ์Šต๋‹ˆ๋‹ค.',Yt,_,Vl='<p>๐Ÿ“ <strong>๋” ๋งŽ์€ ์˜ˆ์ œ</strong>: <a href="https://huggingface.co/docs/transformers/main/en/notebooks" rel="nofollow">๐Ÿค— Transformers ๋…ธํŠธ๋ถ</a>์— ์žˆ๋Š” ๋ฐฉ๋Œ€ํ•œ ์ž๋ฃŒ๋ฅผ ํ™•์ธํ•ด ๋ณด์„ธ์š”.</p>',Ft,we,qt,he,Xl="Trainer API์™€ ๋ฏธ์„ธ ์กฐ์ • ๊ฐœ๋…์— ๋Œ€ํ•œ ์ดํ•ด๋ฅผ ํ…Œ์ŠคํŠธํ•ด๋ณด์„ธ์š”.",Bt,je,At,_e,Lt,Ce,Nt,ke,Pt,ve,St,xe,Dt,Re,Ot,He,Kt,We,el,Ge,tl,Ie,ll,Ze,nl,C,zl="<p>๐Ÿ’ก <strong>ํ•ต์‹ฌ ์š”์ :</strong></p> <ul><li><code>Trainer</code> API๋Š” ๋Œ€๋ถ€๋ถ„์˜ ํ›ˆ๋ จ ๋ณต์žก์„ฑ์„ ์ฒ˜๋ฆฌํ•˜๋Š” ๋†’์€ ์ˆ˜์ค€์˜ ์ธํ„ฐํŽ˜์ด์Šค๋ฅผ ์ œ๊ณตํ•ฉ๋‹ˆ๋‹ค.</li> <li><code>processing_class</code>๋Š” ์ ์ ˆํ•œ ๋ฐ์ดํ„ฐ ์ฒ˜๋ฆฌ๋ฅผ ์œ„ํ•ด ํ† ํฌ๋‚˜์ด์ €๋ฅผ ์ €์žฅํ•˜๋Š” ๋ฐ ์‚ฌ์šฉ๋ฉ๋‹ˆ๋‹ค.</li> <li><code>TrainingArguments</code>๋Š” ํ•™์Šต๋ฅ , ๋ฐฐ์น˜ ํฌ๊ธฐ, ํ‰๊ฐ€ ์ „๋žต, ์ตœ์ ํ™” ๋“ฑ ํ›ˆ๋ จ์˜ ๋ชจ๋“  ์ธก๋ฉด์„ ์ œ์–ดํ•ฉ๋‹ˆ๋‹ค.</li> <li><code>compute_metrics</code>๋ฅผ ์‚ฌ์šฉํ•˜๋ฉด ํ›ˆ๋ จ ์†์‹ค ์™ธ์— ์‚ฌ์šฉ์ž ์ •์˜ ํ‰๊ฐ€ ๋ฉ”ํŠธ๋ฆญ์„ ํ™œ์šฉํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค.</li> <li>ํ˜ผํ•ฉ ์ •๋ฐ€๋„(<code>fp16=True</code>)์™€ ๊ทธ๋ ˆ์ด๋””์–ธํŠธ ๋ˆ„์ ๊ณผ ๊ฐ™์€ ์ตœ์‹  ๊ธฐ๋Šฅ์€ ํ›ˆ๋ จ ํšจ์œจ์„ฑ์„ ํฌ๊ฒŒ ํ–ฅ์ƒ์‹œํ‚ฌ ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค.</li></ul>",sl,Ee,al,ze,il;return J=new en({props:{fw:rl[0]}}),k=new Sl({props:{containerStyle:"float: right; margin-left: 10px; display: inline-flex; position: relative; z-index: 10;"}}),v=new T({props:{title:"Trainer API๋กœ ๋ชจ๋ธ ๋ฏธ์„ธ ์กฐ์ •ํ•˜๊ธฐ",local:"fine-tuning-a-model-with-the-trainer-api",headingTag:"h1"}}),x=new Kl({props:{chapter:3,classNames:"absolute z-10 right-0 top-0",notebooks:[{label:"Google Colab",value:"https://colab.research.google.com/github/huggingface/notebooks/blob/master/course/ko/chapter3/section3.ipynb"},{label:"Aws Studio",value:"https://studiolab.sagemaker.aws/import/github/huggingface/notebooks/blob/master/course/ko/chapter3/section3.ipynb"}]}}),R=new Ol({props:{id:"nvBXf7s7vTI"}}),G=new u({props:{code:"ZnJvbSUyMGRhdGFzZXRzJTIwaW1wb3J0JTIwbG9hZF9kYXRhc2V0JTBBZnJvbSUyMHRyYW5zZm9ybWVycyUyMGltcG9ydCUyMEF1dG9Ub2tlbml6ZXIlMkMlMjBEYXRhQ29sbGF0b3JXaXRoUGFkZGluZyUwQSUwQXJhd19kYXRhc2V0cyUyMCUzRCUyMGxvYWRfZGF0YXNldCglMjJnbHVlJTIyJTJDJTIwJTIybXJwYyUyMiklMEFjaGVja3BvaW50JTIwJTNEJTIwJTIyYmVydC1iYXNlLXVuY2FzZWQlMjIlMEF0b2tlbml6ZXIlMjAlM0QlMjBBdXRvVG9rZW5pemVyLmZyb21fcHJldHJhaW5lZChjaGVja3BvaW50KSUwQSUwQSUwQWRlZiUyMHRva2VuaXplX2Z1bmN0aW9uKGV4YW1wbGUpJTNBJTBBJTIwJTIwJTIwJTIwcmV0dXJuJTIwdG9rZW5pemVyKGV4YW1wbGUlNUIlMjJzZW50ZW5jZTElMjIlNUQlMkMlMjBleGFtcGxlJTVCJTIyc2VudGVuY2UyJTIyJTVEJTJDJTIwdHJ1bmNhdGlvbiUzRFRydWUpJTBBJTBBJTBBdG9rZW5pemVkX2RhdGFzZXRzJTIwJTNEJTIwcmF3X2RhdGFzZXRzLm1hcCh0b2tlbml6ZV9mdW5jdGlvbiUyQyUyMGJhdGNoZWQlM0RUcnVlKSUwQWRhdGFfY29sbGF0b3IlMjAlM0QlMjBEYXRhQ29sbGF0b3JXaXRoUGFkZGluZyh0b2tlbml6ZXIlM0R0b2tlbml6ZXIp",highlighted:`<span class="hljs-keyword">from</span> datasets <span class="hljs-keyword">import</span> load_dataset
<span class="hljs-keyword">from</span> transformers <span class="hljs-keyword">import</span> AutoTokenizer, DataCollatorWithPadding
raw_datasets = load_dataset(<span class="hljs-string">&quot;glue&quot;</span>, <span class="hljs-string">&quot;mrpc&quot;</span>)
checkpoint = <span class="hljs-string">&quot;bert-base-uncased&quot;</span>
tokenizer = AutoTokenizer.from_pretrained(checkpoint)
<span class="hljs-keyword">def</span> <span class="hljs-title function_">tokenize_function</span>(<span class="hljs-params">example</span>):
<span class="hljs-keyword">return</span> tokenizer(example[<span class="hljs-string">&quot;sentence1&quot;</span>], example[<span class="hljs-string">&quot;sentence2&quot;</span>], truncation=<span class="hljs-literal">True</span>)
tokenized_datasets = raw_datasets.<span class="hljs-built_in">map</span>(tokenize_function, batched=<span class="hljs-literal">True</span>)
data_collator = DataCollatorWithPadding(tokenizer=tokenizer)`,wrap:!1}}),I=new T({props:{title:"ํ›ˆ๋ จ",local:"training",headingTag:"h3"}}),E=new u({props:{code:"ZnJvbSUyMHRyYW5zZm9ybWVycyUyMGltcG9ydCUyMFRyYWluaW5nQXJndW1lbnRzJTBBJTBBdHJhaW5pbmdfYXJncyUyMCUzRCUyMFRyYWluaW5nQXJndW1lbnRzKCUyMnRlc3QtdHJhaW5lciUyMik=",highlighted:`<span class="hljs-keyword">from</span> transformers <span class="hljs-keyword">import</span> TrainingArguments
training_args = TrainingArguments(<span class="hljs-string">&quot;test-trainer&quot;</span>)`,wrap:!1}}),X=new u({props:{code:"ZnJvbSUyMHRyYW5zZm9ybWVycyUyMGltcG9ydCUyMEF1dG9Nb2RlbEZvclNlcXVlbmNlQ2xhc3NpZmljYXRpb24lMEElMEFtb2RlbCUyMCUzRCUyMEF1dG9Nb2RlbEZvclNlcXVlbmNlQ2xhc3NpZmljYXRpb24uZnJvbV9wcmV0cmFpbmVkKGNoZWNrcG9pbnQlMkMlMjBudW1fbGFiZWxzJTNEMik=",highlighted:`<span class="hljs-keyword">from</span> transformers <span class="hljs-keyword">import</span> AutoModelForSequenceClassification
model = AutoModelForSequenceClassification.from_pretrained(checkpoint, num_labels=<span class="hljs-number">2</span>)`,wrap:!1}}),F=new u({props:{code:"ZnJvbSUyMHRyYW5zZm9ybWVycyUyMGltcG9ydCUyMFRyYWluZXIlMEElMEF0cmFpbmVyJTIwJTNEJTIwVHJhaW5lciglMEElMjAlMjAlMjAlMjBtb2RlbCUyQyUwQSUyMCUyMCUyMCUyMHRyYWluaW5nX2FyZ3MlMkMlMEElMjAlMjAlMjAlMjB0cmFpbl9kYXRhc2V0JTNEdG9rZW5pemVkX2RhdGFzZXRzJTVCJTIydHJhaW4lMjIlNUQlMkMlMEElMjAlMjAlMjAlMjBldmFsX2RhdGFzZXQlM0R0b2tlbml6ZWRfZGF0YXNldHMlNUIlMjJ2YWxpZGF0aW9uJTIyJTVEJTJDJTBBJTIwJTIwJTIwJTIwZGF0YV9jb2xsYXRvciUzRGRhdGFfY29sbGF0b3IlMkMlMEElMjAlMjAlMjAlMjBwcm9jZXNzaW5nX2NsYXNzJTNEdG9rZW5pemVyJTJDJTBBKQ==",highlighted:`<span class="hljs-keyword">from</span> transformers <span class="hljs-keyword">import</span> Trainer
trainer = Trainer(
model,
training_args,
train_dataset=tokenized_datasets[<span class="hljs-string">&quot;train&quot;</span>],
eval_dataset=tokenized_datasets[<span class="hljs-string">&quot;validation&quot;</span>],
data_collator=data_collator,
processing_class=tokenizer,
)`,wrap:!1}}),A=new u({props:{code:"dHJhaW5lci50cmFpbigp",highlighted:"trainer.train()",wrap:!1}}),P=new T({props:{title:"ํ‰๊ฐ€",local:"evaluation",headingTag:"h3"}}),D=new u({props:{code:"cHJlZGljdGlvbnMlMjAlM0QlMjB0cmFpbmVyLnByZWRpY3QodG9rZW5pemVkX2RhdGFzZXRzJTVCJTIydmFsaWRhdGlvbiUyMiU1RCklMEFwcmludChwcmVkaWN0aW9ucy5wcmVkaWN0aW9ucy5zaGFwZSUyQyUyMHByZWRpY3Rpb25zLmxhYmVsX2lkcy5zaGFwZSk=",highlighted:`predictions = trainer.predict(tokenized_datasets[<span class="hljs-string">&quot;validation&quot;</span>])
<span class="hljs-built_in">print</span>(predictions.predictions.shape, predictions.label_ids.shape)`,wrap:!1}}),O=new u({props:{code:"KDQwOCUyQyUyMDIpJTIwKDQwOCUyQyk=",highlighted:'(<span class="hljs-number">408</span>, <span class="hljs-number">2</span>) (<span class="hljs-number">408</span>,)',wrap:!1}}),te=new u({props:{code:"aW1wb3J0JTIwbnVtcHklMjBhcyUyMG5wJTBBJTBBcHJlZHMlMjAlM0QlMjBucC5hcmdtYXgocHJlZGljdGlvbnMucHJlZGljdGlvbnMlMkMlMjBheGlzJTNELTEp",highlighted:`<span class="hljs-keyword">import</span> numpy <span class="hljs-keyword">as</span> np
preds = np.argmax(predictions.predictions, axis=-<span class="hljs-number">1</span>)`,wrap:!1}}),ne=new u({props:{code:"aW1wb3J0JTIwZXZhbHVhdGUlMEElMEFtZXRyaWMlMjAlM0QlMjBldmFsdWF0ZS5sb2FkKCUyMmdsdWUlMjIlMkMlMjAlMjJtcnBjJTIyKSUwQW1ldHJpYy5jb21wdXRlKHByZWRpY3Rpb25zJTNEcHJlZHMlMkMlMjByZWZlcmVuY2VzJTNEcHJlZGljdGlvbnMubGFiZWxfaWRzKQ==",highlighted:`<span class="hljs-keyword">import</span> evaluate
metric = evaluate.load(<span class="hljs-string">&quot;glue&quot;</span>, <span class="hljs-string">&quot;mrpc&quot;</span>)
metric.compute(predictions=preds, references=predictions.label_ids)`,wrap:!1}}),se=new u({props:{code:"JTdCJ2FjY3VyYWN5JyUzQSUyMDAuODU3ODQzMTM3MjU0OTAxOSUyQyUyMCdmMSclM0ElMjAwLjg5OTY1Mzk3OTIzODc1NDIlN0Q=",highlighted:'{<span class="hljs-string">&#x27;accuracy&#x27;</span>: <span class="hljs-number">0.8578431372549019</span>, <span class="hljs-string">&#x27;f1&#x27;</span>: <span class="hljs-number">0.8996539792387542</span>}',wrap:!1}}),re=new u({props:{code:"ZGVmJTIwY29tcHV0ZV9tZXRyaWNzKGV2YWxfcHJlZHMpJTNBJTBBJTIwJTIwJTIwJTIwbWV0cmljJTIwJTNEJTIwZXZhbHVhdGUubG9hZCglMjJnbHVlJTIyJTJDJTIwJTIybXJwYyUyMiklMEElMjAlMjAlMjAlMjBsb2dpdHMlMkMlMjBsYWJlbHMlMjAlM0QlMjBldmFsX3ByZWRzJTBBJTIwJTIwJTIwJTIwcHJlZGljdGlvbnMlMjAlM0QlMjBucC5hcmdtYXgobG9naXRzJTJDJTIwYXhpcyUzRC0xKSUwQSUyMCUyMCUyMCUyMHJldHVybiUyMG1ldHJpYy5jb21wdXRlKHByZWRpY3Rpb25zJTNEcHJlZGljdGlvbnMlMkMlMjByZWZlcmVuY2VzJTNEbGFiZWxzKQ==",highlighted:`<span class="hljs-keyword">def</span> <span class="hljs-title function_">compute_metrics</span>(<span class="hljs-params">eval_preds</span>):
metric = evaluate.load(<span class="hljs-string">&quot;glue&quot;</span>, <span class="hljs-string">&quot;mrpc&quot;</span>)
logits, labels = eval_preds
predictions = np.argmax(logits, axis=-<span class="hljs-number">1</span>)
<span class="hljs-keyword">return</span> metric.compute(predictions=predictions, references=labels)`,wrap:!1}}),oe=new u({props:{code:"dHJhaW5pbmdfYXJncyUyMCUzRCUyMFRyYWluaW5nQXJndW1lbnRzKCUyMnRlc3QtdHJhaW5lciUyMiUyQyUyMGV2YWxfc3RyYXRlZ3klM0QlMjJlcG9jaCUyMiklMEFtb2RlbCUyMCUzRCUyMEF1dG9Nb2RlbEZvclNlcXVlbmNlQ2xhc3NpZmljYXRpb24uZnJvbV9wcmV0cmFpbmVkKGNoZWNrcG9pbnQlMkMlMjBudW1fbGFiZWxzJTNEMiklMEElMEF0cmFpbmVyJTIwJTNEJTIwVHJhaW5lciglMEElMjAlMjAlMjAlMjBtb2RlbCUyQyUwQSUyMCUyMCUyMCUyMHRyYWluaW5nX2FyZ3MlMkMlMEElMjAlMjAlMjAlMjB0cmFpbl9kYXRhc2V0JTNEdG9rZW5pemVkX2RhdGFzZXRzJTVCJTIydHJhaW4lMjIlNUQlMkMlMEElMjAlMjAlMjAlMjBldmFsX2RhdGFzZXQlM0R0b2tlbml6ZWRfZGF0YXNldHMlNUIlMjJ2YWxpZGF0aW9uJTIyJTVEJTJDJTBBJTIwJTIwJTIwJTIwZGF0YV9jb2xsYXRvciUzRGRhdGFfY29sbGF0b3IlMkMlMEElMjAlMjAlMjAlMjBwcm9jZXNzaW5nX2NsYXNzJTNEdG9rZW5pemVyJTJDJTBBJTIwJTIwJTIwJTIwY29tcHV0ZV9tZXRyaWNzJTNEY29tcHV0ZV9tZXRyaWNzJTJDJTBBKQ==",highlighted:`training_args = TrainingArguments(<span class="hljs-string">&quot;test-trainer&quot;</span>, eval_strategy=<span class="hljs-string">&quot;epoch&quot;</span>)
model = AutoModelForSequenceClassification.from_pretrained(checkpoint, num_labels=<span class="hljs-number">2</span>)
trainer = Trainer(
model,
training_args,
train_dataset=tokenized_datasets[<span class="hljs-string">&quot;train&quot;</span>],
eval_dataset=tokenized_datasets[<span class="hljs-string">&quot;validation&quot;</span>],
data_collator=data_collator,
processing_class=tokenizer,
compute_metrics=compute_metrics,
)`,wrap:!1}}),me=new u({props:{code:"dHJhaW5lci50cmFpbigp",highlighted:"trainer.train()",wrap:!1}}),fe=new T({props:{title:"๊ณ ๊ธ‰ ํ›ˆ๋ จ ๊ธฐ๋Šฅ",local:"advanced-training-features",headingTag:"h3"}}),Te=new u({props:{code:"dHJhaW5pbmdfYXJncyUyMCUzRCUyMFRyYWluaW5nQXJndW1lbnRzKCUwQSUyMCUyMCUyMCUyMCUyMnRlc3QtdHJhaW5lciUyMiUyQyUwQSUyMCUyMCUyMCUyMGV2YWxfc3RyYXRlZ3klM0QlMjJlcG9jaCUyMiUyQyUwQSUyMCUyMCUyMCUyMGZwMTYlM0RUcnVlJTJDJTIwJTIwJTIzJTIwJUVEJTk4JUJDJUVEJTk1JUE5JTIwJUVDJUEwJTk1JUVCJUIwJTgwJUVCJThGJTg0JTIwJUVEJTk5JTlDJUVDJTg0JUIxJUVEJTk5JTk0JTBBKQ==",highlighted:`training_args = TrainingArguments(
<span class="hljs-string">&quot;test-trainer&quot;</span>,
eval_strategy=<span class="hljs-string">&quot;epoch&quot;</span>,
fp16=<span class="hljs-literal">True</span>, <span class="hljs-comment"># ํ˜ผํ•ฉ ์ •๋ฐ€๋„ ํ™œ์„ฑํ™”</span>
)`,wrap:!1}}),ye=new u({props:{code:"dHJhaW5pbmdfYXJncyUyMCUzRCUyMFRyYWluaW5nQXJndW1lbnRzKCUwQSUyMCUyMCUyMCUyMCUyMnRlc3QtdHJhaW5lciUyMiUyQyUwQSUyMCUyMCUyMCUyMGV2YWxfc3RyYXRlZ3klM0QlMjJlcG9jaCUyMiUyQyUwQSUyMCUyMCUyMCUyMHBlcl9kZXZpY2VfdHJhaW5fYmF0Y2hfc2l6ZSUzRDQlMkMlMEElMjAlMjAlMjAlMjBncmFkaWVudF9hY2N1bXVsYXRpb25fc3RlcHMlM0Q0JTJDJTIwJTIwJTIzJTIwJUVDJTlDJUEwJUVEJTlBJUE4JTIwJUVCJUIwJUIwJUVDJUI5JTk4JTIwJUVEJTgxJUFDJUVBJUI4JUIwJTIwJTNEJTIwNCUyMColMjA0JTIwJTNEJTIwMTYlMEEp",highlighted:`training_args = TrainingArguments(
<span class="hljs-string">&quot;test-trainer&quot;</span>,
eval_strategy=<span class="hljs-string">&quot;epoch&quot;</span>,
per_device_train_batch_size=<span class="hljs-number">4</span>,
gradient_accumulation_steps=<span class="hljs-number">4</span>, <span class="hljs-comment"># ์œ ํšจ ๋ฐฐ์น˜ ํฌ๊ธฐ = 4 * 4 = 16</span>
)`,wrap:!1}}),Je=new u({props:{code:"dHJhaW5pbmdfYXJncyUyMCUzRCUyMFRyYWluaW5nQXJndW1lbnRzKCUwQSUyMCUyMCUyMCUyMCUyMnRlc3QtdHJhaW5lciUyMiUyQyUwQSUyMCUyMCUyMCUyMGV2YWxfc3RyYXRlZ3klM0QlMjJlcG9jaCUyMiUyQyUwQSUyMCUyMCUyMCUyMGxlYXJuaW5nX3JhdGUlM0QyZS01JTJDJTBBJTIwJTIwJTIwJTIwbHJfc2NoZWR1bGVyX3R5cGUlM0QlMjJjb3NpbmUlMjIlMkMlMjAlMjAlMjMlMjAlRUIlOEIlQTQlRUIlQTUlQjglMjAlRUMlOEElQTQlRUMlQkMlODAlRUMlQTQlODQlRUIlOUYlQUMlMjAlRUMlOEIlOUMlRUIlOEYlODQlMEEp",highlighted:`training_args = TrainingArguments(
<span class="hljs-string">&quot;test-trainer&quot;</span>,
eval_strategy=<span class="hljs-string">&quot;epoch&quot;</span>,
learning_rate=<span class="hljs-number">2e-5</span>,
lr_scheduler_type=<span class="hljs-string">&quot;cosine&quot;</span>, <span class="hljs-comment"># ๋‹ค๋ฅธ ์Šค์ผ€์ค„๋Ÿฌ ์‹œ๋„</span>
)`,wrap:!1}}),we=new T({props:{title:"์„น์…˜ ํ€ด์ฆˆ",local:"section-quiz",headingTag:"h2"}}),je=new T({props:{title:"1. Trainer ์—์„œ <code> processing_class </code> ๋งค๊ฐœ๋ณ€์ˆ˜์˜ ๋ชฉ์ ์€ ๋ฌด์—‡์ธ๊ฐ€์š”?",local:"1-trainer-์—์„œ-code-processingclass-code-๋งค๊ฐœ๋ณ€์ˆ˜์˜-๋ชฉ์ ์€-๋ฌด์—‡์ธ๊ฐ€์š”",headingTag:"h3"}}),_e=new Xe({props:{choices:[{text:"์‚ฌ์šฉํ•  ๋ชจ๋ธ ์•„ํ‚คํ…์ฒ˜๋ฅผ ์ง€์ •ํ•ฉ๋‹ˆ๋‹ค.",explain:"๋ชจ๋ธ ์•„ํ‚คํ…์ฒ˜๋Š” ๋ชจ๋ธ์„ ๋กœ๋“œํ•  ๋•Œ ์ง€์ •๋˜๋ฉฐ, Trainer์—์„œ ์ง€์ •ํ•˜์ง€ ์•Š์Šต๋‹ˆ๋‹ค."},{text:"๋ฐ์ดํ„ฐ ์ฒ˜๋ฆฌ์— ์‚ฌ์šฉํ•  ํ† ํฌ๋‚˜์ด์ €๋ฅผ Trainer์— ์•Œ๋ ค์ค๋‹ˆ๋‹ค.",explain:"processing_class ๋งค๊ฐœ๋ณ€์ˆ˜๋Š” ์‚ฌ์šฉํ•  ํ† ํฌ๋‚˜์ด์ €๋ฅผ Trainer๊ฐ€ ์•Œ ์ˆ˜ ์žˆ๋„๋ก ๋„์™€์ฃผ๋Š” ์ตœ์‹  ์ถ”๊ฐ€ ์‚ฌํ•ญ์ž…๋‹ˆ๋‹ค.",correct:!0},{text:"ํ›ˆ๋ จ์„ ์œ„ํ•œ ๋ฐฐ์น˜ ํฌ๊ธฐ๋ฅผ ๊ฒฐ์ •ํ•ฉ๋‹ˆ๋‹ค.",explain:"๋ฐฐ์น˜ ํฌ๊ธฐ๋Š” processing_class๊ฐ€ ์•„๋‹Œ TrainingArguments์—์„œ ์„ค์ •๋ฉ๋‹ˆ๋‹ค."},{text:"ํ‰๊ฐ€ ๋นˆ๋„๋ฅผ ์ œ์–ดํ•ฉ๋‹ˆ๋‹ค.",explain:"ํ‰๊ฐ€ ๋นˆ๋„๋Š” TrainingArguments์˜ eval_strategy๋กœ ์ œ์–ด๋ฉ๋‹ˆ๋‹ค."}]}}),Ce=new T({props:{title:"2. ํ›ˆ๋ จ ์ค‘ ํ‰๊ฐ€๊ฐ€ ์–ผ๋งˆ๋‚˜ ์ž์ฃผ ๋ฐœ์ƒํ•˜๋Š”์ง€๋ฅผ ์ œ์–ดํ•˜๋Š” TrainingArguments ๋งค๊ฐœ๋ณ€์ˆ˜๋Š” ๋ฌด์—‡์ธ๊ฐ€์š”?",local:"2-ํ›ˆ๋ จ-์ค‘-ํ‰๊ฐ€๊ฐ€-์–ผ๋งˆ๋‚˜-์ž์ฃผ-๋ฐœ์ƒํ•˜๋Š”์ง€๋ฅผ-์ œ์–ดํ•˜๋Š”-trainingarguments-๋งค๊ฐœ๋ณ€์ˆ˜๋Š”-๋ฌด์—‡์ธ๊ฐ€์š”",headingTag:"h3"}}),ke=new Xe({props:{choices:[{text:"eval_frequency",explain:"TrainingArguments์—๋Š” eval_frequency ๋งค๊ฐœ๋ณ€์ˆ˜๊ฐ€ ์—†์Šต๋‹ˆ๋‹ค."},{text:"eval_strategy",explain:"eval_strategy๋Š” ํ‰๊ฐ€ ํƒ€์ด๋ฐ์„ ์ œ์–ดํ•˜๊ธฐ ์œ„ํ•ด 'epoch', 'steps', ๋˜๋Š” 'no'๋กœ ์„ค์ •ํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค.",correct:!0},{text:"evaluation_steps",explain:"eval_steps๋Š” ํ‰๊ฐ€ ์‚ฌ์ด์˜ ๋‹จ๊ณ„ ์ˆ˜๋ฅผ ์„ค์ •ํ•˜์ง€๋งŒ, eval_strategy๊ฐ€ ํ‰๊ฐ€ ๋ฐœ์ƒ ์—ฌ๋ถ€/์‹œ๊ธฐ๋ฅผ ๊ฒฐ์ •ํ•ฉ๋‹ˆ๋‹ค."},{text:"do_eval",explain:"์ตœ์‹  TrainingArguments์—๋Š” do_eval ๋งค๊ฐœ๋ณ€์ˆ˜๊ฐ€ ์—†์Šต๋‹ˆ๋‹ค."}]}}),ve=new T({props:{title:"3. TrainingArguments์—์„œ <code> fp16=True </code> ๋Š” ๋ฌด์—‡์„ ํ™œ์„ฑํ™”ํ•˜๋‚˜์š”?",local:"3-trainingarguments์—์„œ-code-fp16true-code-๋Š”-๋ฌด์—‡์„-ํ™œ์„ฑํ™”ํ•˜๋‚˜์š”",headingTag:"h3"}}),xe=new Xe({props:{choices:[{text:"๋” ๋น ๋ฅธ ํ›ˆ๋ จ์„ ์œ„ํ•œ 16๋น„ํŠธ ์ •์ˆ˜ ์ •๋ฐ€๋„",explain:"fp16์€ ์ •์ˆ˜ ์ •๋ฐ€๋„๊ฐ€ ์•„๋‹Œ ๋ถ€๋™์†Œ์ˆ˜์  ์ •๋ฐ€๋„๋ฅผ ์˜๋ฏธํ•ฉ๋‹ˆ๋‹ค."},{text:"๋” ๋น ๋ฅธ ํ›ˆ๋ จ๊ณผ ๋ฉ”๋ชจ๋ฆฌ ์‚ฌ์šฉ๋Ÿ‰ ๊ฐ์†Œ๋ฅผ ์œ„ํ•œ 16๋น„ํŠธ ๋ถ€๋™์†Œ์ˆ˜์  ์ˆ˜๋ฅผ ์‚ฌ์šฉํ•œ ํ˜ผํ•ฉ ์ •๋ฐ€๋„ ํ›ˆ๋ จ",explain:"ํ˜ผํ•ฉ ์ •๋ฐ€๋„ ํ›ˆ๋ จ์€ ์ˆœ์ „ํŒŒ์—๋Š” 16๋น„ํŠธ ํ”Œ๋กœํŠธ๋ฅผ, ๊ทธ๋ ˆ์ด๋””์–ธํŠธ์—๋Š” 32๋น„ํŠธ๋ฅผ ์‚ฌ์šฉํ•˜์—ฌ ์†๋„๋ฅผ ํ–ฅ์ƒ์‹œํ‚ค๊ณ  ๋ฉ”๋ชจ๋ฆฌ ์‚ฌ์šฉ๋Ÿ‰์„ ์ค„์ž…๋‹ˆ๋‹ค.",correct:!0},{text:"์ •ํ™•ํžˆ 16 ์—ํฌํฌ ๋™์•ˆ ํ›ˆ๋ จ",explain:"fp16์€ ์—ํฌํฌ ์ˆ˜์™€ ๊ด€๋ จ์ด ์—†์Šต๋‹ˆ๋‹ค."},{text:"๋ถ„์‚ฐ ํ›ˆ๋ จ์„ ์œ„ํ•œ 16๊ฐœ GPU ์‚ฌ์šฉ",explain:"GPU ์ˆ˜๋Š” fp16 ๋งค๊ฐœ๋ณ€์ˆ˜๋กœ ์ œ์–ด๋˜์ง€ ์•Š์Šต๋‹ˆ๋‹ค."}]}}),Re=new T({props:{title:"4. Trainer์—์„œ <code> compute_metrics </code> ํ•จ์ˆ˜์˜ ์—ญํ• ์€ ๋ฌด์—‡์ธ๊ฐ€์š”?",local:"4-trainer์—์„œ-code-computemetrics-code-ํ•จ์ˆ˜์˜-์—ญํ• ์€-๋ฌด์—‡์ธ๊ฐ€์š”",headingTag:"h3"}}),He=new Xe({props:{choices:[{text:"ํ›ˆ๋ จ ์ค‘ ์†์‹ค์„ ๊ณ„์‚ฐํ•ฉ๋‹ˆ๋‹ค.",explain:"์†์‹ค ๊ณ„์‚ฐ์€ compute_metrics๊ฐ€ ์•„๋‹Œ ๋ชจ๋ธ์—์„œ ์ž๋™์œผ๋กœ ์ฒ˜๋ฆฌ๋ฉ๋‹ˆ๋‹ค."},{text:"๋กœ์ง“์„ ์˜ˆ์ธก์œผ๋กœ ๋ณ€ํ™˜ํ•˜๊ณ  ์ •ํ™•๋„ ๋ฐ F1๊ณผ ๊ฐ™์€ ํ‰๊ฐ€ ๋ฉ”ํŠธ๋ฆญ์„ ๊ณ„์‚ฐํ•ฉ๋‹ˆ๋‹ค.",explain:"compute_metrics๋Š” ์˜ˆ์ธก๊ณผ ๋ผ๋ฒจ์„ ๋ฐ›์•„์„œ ํ‰๊ฐ€๋ฅผ ์œ„ํ•œ ๋ฉ”ํŠธ๋ฆญ์„ ๋ฐ˜ํ™˜ํ•ฉ๋‹ˆ๋‹ค.",correct:!0},{text:"์‚ฌ์šฉํ•  ์˜ตํ‹ฐ๋งˆ์ด์ €๋ฅผ ๊ฒฐ์ •ํ•ฉ๋‹ˆ๋‹ค.",explain:"์˜ตํ‹ฐ๋งˆ์ด์ € ์„ ํƒ์€ compute_metrics๋กœ ์ฒ˜๋ฆฌ๋˜์ง€ ์•Š์Šต๋‹ˆ๋‹ค."},{text:"ํ›ˆ๋ จ ๋ฐ์ดํ„ฐ๋ฅผ ์ „์ฒ˜๋ฆฌํ•ฉ๋‹ˆ๋‹ค.",explain:"๋ฐ์ดํ„ฐ ์ „์ฒ˜๋ฆฌ๋Š” ํ›ˆ๋ จ ์ „์— ์ˆ˜ํ–‰๋˜๋ฉฐ, ํ‰๊ฐ€ ์ค‘ compute_metrics๋กœ ์ˆ˜ํ–‰๋˜์ง€ ์•Š์Šต๋‹ˆ๋‹ค."}]}}),We=new T({props:{title:"5. Trainer์— <code> eval_dataset </code> ์„ ์ œ๊ณตํ•˜์ง€ ์•Š์œผ๋ฉด ์–ด๋–ป๊ฒŒ ๋˜๋‚˜์š”?",local:"5-trainer์—-code-evaldataset-code-์„-์ œ๊ณตํ•˜์ง€-์•Š์œผ๋ฉด-์–ด๋–ป๊ฒŒ-๋˜๋‚˜์š”",headingTag:"h3"}}),Ge=new Xe({props:{choices:[{text:"ํ›ˆ๋ จ์ด ์˜ค๋ฅ˜์™€ ํ•จ๊ป˜ ์‹คํŒจํ•ฉ๋‹ˆ๋‹ค.",explain:"eval_dataset ์—†์ด๋„ ํ›ˆ๋ จ์„ ์ง„ํ–‰ํ•  ์ˆ˜ ์žˆ์ง€๋งŒ, ํ‰๊ฐ€ ๋ฉ”ํŠธ๋ฆญ์€ ์–ป์„ ์ˆ˜ ์—†์Šต๋‹ˆ๋‹ค."},{text:"Trainer๊ฐ€ ์ž๋™์œผ๋กœ ํ›ˆ๋ จ ๋ฐ์ดํ„ฐ๋ฅผ ํ‰๊ฐ€์šฉ์œผ๋กœ ๋ถ„ํ• ํ•ฉ๋‹ˆ๋‹ค.",explain:"Trainer๋Š” ์ž๋™์œผ๋กœ ๊ฒ€์ฆ ๋ถ„ํ• ์„ ์ƒ์„ฑํ•˜์ง€ ์•Š์Šต๋‹ˆ๋‹ค."},{text:"ํ›ˆ๋ จ ์ค‘ ํ‰๊ฐ€ ๋ฉ”ํŠธ๋ฆญ์„ ์–ป์„ ์ˆ˜ ์—†์ง€๋งŒ ํ›ˆ๋ จ์€ ์—ฌ์ „ํžˆ ์ž‘๋™ํ•ฉ๋‹ˆ๋‹ค.",explain:"ํ‰๊ฐ€๋Š” ์„ ํƒ์‚ฌํ•ญ์ž…๋‹ˆ๋‹ค - ํ‰๊ฐ€ ์—†์ด๋„ ํ›ˆ๋ จํ•  ์ˆ˜ ์žˆ์ง€๋งŒ ๊ฒ€์ฆ ๋ฉ”ํŠธ๋ฆญ์€ ๋ณผ ์ˆ˜ ์—†์Šต๋‹ˆ๋‹ค.",correct:!0},{text:"๋ชจ๋ธ์ด ํ‰๊ฐ€๋ฅผ ์œ„ํ•ด ํ›ˆ๋ จ ๋ฐ์ดํ„ฐ๋ฅผ ์‚ฌ์šฉํ•ฉ๋‹ˆ๋‹ค.",explain:"Trainer๋Š” ์ž๋™์œผ๋กœ ํ‰๊ฐ€๋ฅผ ์œ„ํ•ด ํ›ˆ๋ จ ๋ฐ์ดํ„ฐ๋ฅผ ์‚ฌ์šฉํ•˜์ง€ ์•Š์Šต๋‹ˆ๋‹ค - ๋‹จ์ˆœํžˆ ํ‰๊ฐ€ํ•˜์ง€ ์•Š์Šต๋‹ˆ๋‹ค."}]}}),Ie=new T({props:{title:"6. ๊ทธ๋ ˆ์ด๋””์–ธํŠธ ๋ˆ„์ ์ด๋ž€ ๋ฌด์—‡์ด๋ฉฐ ์–ด๋–ป๊ฒŒ ํ™œ์„ฑํ™”ํ•˜๋‚˜์š”?",local:"6-๊ทธ๋ ˆ์ด๋””์–ธํŠธ-๋ˆ„์ ์ด๋ž€-๋ฌด์—‡์ด๋ฉฐ-์–ด๋–ป๊ฒŒ-ํ™œ์„ฑํ™”ํ•˜๋‚˜์š”",headingTag:"h3"}}),Ze=new Xe({props:{choices:[{text:"๊ทธ๋ ˆ์ด๋””์–ธํŠธ๋ฅผ ๋””์Šคํฌ์— ์ €์žฅํ•˜๋Š” ๊ฒƒ์œผ๋กœ, save_gradients=True๋กœ ํ™œ์„ฑํ™”๋ฉ๋‹ˆ๋‹ค.",explain:"๊ทธ๋ ˆ์ด๋””์–ธํŠธ ๋ˆ„์ ์€ ๊ทธ๋ ˆ์ด๋””์–ธํŠธ๋ฅผ ๋””์Šคํฌ์— ์ €์žฅํ•˜๋Š” ๊ฒƒ๊ณผ ๊ด€๋ จ์ด ์—†์Šต๋‹ˆ๋‹ค."},{text:"์—…๋ฐ์ดํŠธ ์ „์— ์—ฌ๋Ÿฌ ๋ฐฐ์น˜์— ๊ฑธ์ณ ๊ทธ๋ ˆ์ด๋””์–ธํŠธ๋ฅผ ๋ˆ„์ ํ•˜๋Š” ๊ฒƒ์œผ๋กœ, gradient_accumulation_steps๋กœ ํ™œ์„ฑํ™”๋ฉ๋‹ˆ๋‹ค.",explain:"์ด๋ฅผ ํ†ตํ•ด ์—ฌ๋Ÿฌ ์ˆœ์ „ํŒŒ์— ๊ฑธ์ณ ๊ทธ๋ ˆ์ด๋””์–ธํŠธ๋ฅผ ๋ˆ„์ ํ•˜์—ฌ ๋” ํฐ ๋ฐฐ์น˜ ํฌ๊ธฐ๋ฅผ ์‹œ๋ฎฌ๋ ˆ์ด์…˜ํ•  ์ˆ˜ ์žˆ์Šต๋‹ˆ๋‹ค.",correct:!0},{text:"๊ทธ๋ ˆ์ด๋””์–ธํŠธ ๊ณ„์‚ฐ์„ ๊ฐ€์†ํ™”ํ•˜๋Š” ๊ฒƒ์œผ๋กœ, fp16๊ณผ ํ•จ๊ป˜ ์ž๋™์œผ๋กœ ํ™œ์„ฑํ™”๋ฉ๋‹ˆ๋‹ค.",explain:"fp16์ด ํ›ˆ๋ จ์„ ๊ฐ€์†ํ™”ํ•  ์ˆ˜ ์žˆ์ง€๋งŒ, ๊ทธ๋ ˆ์ด๋””์–ธํŠธ ๋ˆ„์ ์€ ๋ณ„๋„์˜ ๊ธฐ์ˆ ์ž…๋‹ˆ๋‹ค."},{text:"๊ทธ๋ ˆ์ด๋””์–ธํŠธ ์˜ค๋ฒ„ํ”Œ๋กœ์šฐ๋ฅผ ๋ฐฉ์ง€ํ•˜๋Š” ๊ฒƒ์œผ๋กœ, gradient_clipping=True๋กœ ํ™œ์„ฑํ™”๋ฉ๋‹ˆ๋‹ค.",explain:"์ด๋Š” ๊ทธ๋ ˆ์ด๋””์–ธํŠธ ๋ˆ„์ ์ด ์•„๋‹Œ ๊ทธ๋ ˆ์ด๋””์–ธํŠธ ํด๋ฆฌํ•‘์„ ์„ค๋ช…ํ•ฉ๋‹ˆ๋‹ค."}]}}),Ee=new Dl({props:{source:"https://github.com/huggingface/course/blob/main/chapters/ko/chapter3/3.mdx"}}),{c(){$=M("meta"),Qe=s(),g=M("p"),Ve=s(),i(J.$$.fragment),Ye=s(),i(k.$$.fragment),Fe=s(),i(v.$$.fragment),qe=s(),i(x.$$.fragment),Be=s(),i(R.$$.fragment),Ae=s(),H=M("p"),H.innerHTML=pl,Le=s(),U=M("blockquote"),U.innerHTML=ol,Ne=s(),W=M("p"),W.textContent=cl,Pe=s(),i(G.$$.fragment),Se=s(),i(I.$$.fragment),De=s(),Z=M("p"),Z.innerHTML=ml,Oe=s(),i(E.$$.fragment),Ke=s(),Q=M("p"),Q.innerHTML=Ml,et=s(),b=M("blockquote"),b.innerHTML=fl,tt=s(),V=M("p"),V.innerHTML=dl,lt=s(),i(X.$$.fragment),nt=s(),z=M("p"),z.innerHTML=ul,st=s(),Y=M("p"),Y.innerHTML=Tl,at=s(),i(F.$$.fragment),it=s(),q=M("p"),q.innerHTML=$l,rt=s(),w=M("blockquote"),w.innerHTML=yl,pt=s(),B=M("p"),B.innerHTML=gl,ot=s(),i(A.$$.fragment),ct=s(),L=M("p"),L.textContent=Jl,mt=s(),N=M("ol"),N.innerHTML=Ul,Mt=s(),i(P.$$.fragment),ft=s(),S=M("p"),S.innerHTML=bl,dt=s(),i(D.$$.fragment),ut=s(),i(O.$$.fragment),Tt=s(),K=M("p"),K.innerHTML=wl,$t=s(),ee=M("p"),ee.innerHTML=hl,yt=s(),i(te.$$.fragment),gt=s(),le=M("p"),le.innerHTML=jl,Jt=s(),i(ne.$$.fragment),Ut=s(),i(se.$$.fragment),bt=s(),h=M("blockquote"),h.innerHTML=_l,wt=s(),ae=M("p"),ae.innerHTML=Cl,ht=s(),ie=M("p"),ie.innerHTML=kl,jt=s(),i(re.$$.fragment),_t=s(),pe=M("p"),pe.innerHTML=vl,Ct=s(),i(oe.$$.fragment),kt=s(),ce=M("p"),ce.innerHTML=xl,vt=s(),i(me.$$.fragment),xt=s(),Me=M("p"),Me.textContent=Rl,Rt=s(),i(fe.$$.fragment),Ht=s(),de=M("p"),de.innerHTML=Hl,Wt=s(),ue=M("p"),ue.innerHTML=Wl,Gt=s(),i(Te.$$.fragment),It=s(),$e=M("p"),$e.innerHTML=Gl,Zt=s(),i(ye.$$.fragment),Et=s(),ge=M("p"),ge.innerHTML=Il,Qt=s(),i(Je.$$.fragment),Vt=s(),j=M("blockquote"),j.innerHTML=Zl,Xt=s(),Ue=M("p"),Ue.innerHTML=El,zt=s(),be=M("p"),be.innerHTML=Ql,Yt=s(),_=M("blockquote"),_.innerHTML=Vl,Ft=s(),i(we.$$.fragment),qt=s(),he=M("p"),he.textContent=Xl,Bt=s(),i(je.$$.fragment),At=s(),i(_e.$$.fragment),Lt=s(),i(Ce.$$.fragment),Nt=s(),i(ke.$$.fragment),Pt=s(),i(ve.$$.fragment),St=s(),i(xe.$$.fragment),Dt=s(),i(Re.$$.fragment),Ot=s(),i(He.$$.fragment),Kt=s(),i(We.$$.fragment),el=s(),i(Ge.$$.fragment),tl=s(),i(Ie.$$.fragment),ll=s(),i(Ze.$$.fragment),nl=s(),C=M("blockquote"),C.innerHTML=zl,sl=s(),i(Ee.$$.fragment),al=s(),ze=M("p"),this.h()},l(e){const t=Nl("svelte-u9bgzb",document.head);$=f(t,"META",{name:!0,content:!0}),t.forEach(l),Qe=a(e),g=f(e,"P",{}),Fl(g).forEach(l),Ve=a(e),r(J.$$.fragment,e),Ye=a(e),r(k.$$.fragment,e),Fe=a(e),r(v.$$.fragment,e),qe=a(e),r(x.$$.fragment,e),Be=a(e),r(R.$$.fragment,e),Ae=a(e),H=f(e,"P",{"data-svelte-h":!0}),d(H)!=="svelte-knkc89"&&(H.innerHTML=pl),Le=a(e),U=f(e,"BLOCKQUOTE",{class:!0,"data-svelte-h":!0}),d(U)!=="svelte-1v6278y"&&(U.innerHTML=ol),Ne=a(e),W=f(e,"P",{"data-svelte-h":!0}),d(W)!=="svelte-hs8a7l"&&(W.textContent=cl),Pe=a(e),r(G.$$.fragment,e),Se=a(e),r(I.$$.fragment,e),De=a(e),Z=f(e,"P",{"data-svelte-h":!0}),d(Z)!=="svelte-1enyha7"&&(Z.innerHTML=ml),Oe=a(e),r(E.$$.fragment,e),Ke=a(e),Q=f(e,"P",{"data-svelte-h":!0}),d(Q)!=="svelte-18au6nv"&&(Q.innerHTML=Ml),et=a(e),b=f(e,"BLOCKQUOTE",{class:!0,"data-svelte-h":!0}),d(b)!=="svelte-1poujc4"&&(b.innerHTML=fl),tt=a(e),V=f(e,"P",{"data-svelte-h":!0}),d(V)!=="svelte-nt9c4b"&&(V.innerHTML=dl),lt=a(e),r(X.$$.fragment,e),nt=a(e),z=f(e,"P",{"data-svelte-h":!0}),d(z)!=="svelte-s3sck9"&&(z.innerHTML=ul),st=a(e),Y=f(e,"P",{"data-svelte-h":!0}),d(Y)!=="svelte-4ai6qh"&&(Y.innerHTML=Tl),at=a(e),r(F.$$.fragment,e),it=a(e),q=f(e,"P",{"data-svelte-h":!0}),d(q)!=="svelte-1m2yas3"&&(q.innerHTML=$l),rt=a(e),w=f(e,"BLOCKQUOTE",{class:!0,"data-svelte-h":!0}),d(w)!=="svelte-8phhlb"&&(w.innerHTML=yl),pt=a(e),B=f(e,"P",{"data-svelte-h":!0}),d(B)!=="svelte-13y4n8x"&&(B.innerHTML=gl),ot=a(e),r(A.$$.fragment,e),ct=a(e),L=f(e,"P",{"data-svelte-h":!0}),d(L)!=="svelte-1vb1ztl"&&(L.textContent=Jl),mt=a(e),N=f(e,"OL",{"data-svelte-h":!0}),d(N)!=="svelte-1kijd9m"&&(N.innerHTML=Ul),Mt=a(e),r(P.$$.fragment,e),ft=a(e),S=f(e,"P",{"data-svelte-h":!0}),d(S)!=="svelte-1kov8l9"&&(S.innerHTML=bl),dt=a(e),r(D.$$.fragment,e),ut=a(e),r(O.$$.fragment,e),Tt=a(e),K=f(e,"P",{"data-svelte-h":!0}),d(K)!=="svelte-44hwg3"&&(K.innerHTML=wl),$t=a(e),ee=f(e,"P",{"data-svelte-h":!0}),d(ee)!=="svelte-1f3lia8"&&(ee.innerHTML=hl),yt=a(e),r(te.$$.fragment,e),gt=a(e),le=f(e,"P",{"data-svelte-h":!0}),d(le)!=="svelte-4of9x9"&&(le.innerHTML=jl),Jt=a(e),r(ne.$$.fragment,e),Ut=a(e),r(se.$$.fragment,e),bt=a(e),h=f(e,"BLOCKQUOTE",{class:!0,"data-svelte-h":!0}),d(h)!=="svelte-4q6lfi"&&(h.innerHTML=_l),wt=a(e),ae=f(e,"P",{"data-svelte-h":!0}),d(ae)!=="svelte-1ylr8sj"&&(ae.innerHTML=Cl),ht=a(e),ie=f(e,"P",{"data-svelte-h":!0}),d(ie)!=="svelte-2jb62l"&&(ie.innerHTML=kl),jt=a(e),r(re.$$.fragment,e),_t=a(e),pe=f(e,"P",{"data-svelte-h":!0}),d(pe)!=="svelte-vtoh1f"&&(pe.innerHTML=vl),Ct=a(e),r(oe.$$.fragment,e),kt=a(e),ce=f(e,"P",{"data-svelte-h":!0}),d(ce)!=="svelte-14c26ht"&&(ce.innerHTML=xl),vt=a(e),r(me.$$.fragment,e),xt=a(e),Me=f(e,"P",{"data-svelte-h":!0}),d(Me)!=="svelte-1yytiyu"&&(Me.textContent=Rl),Rt=a(e),r(fe.$$.fragment,e),Ht=a(e),de=f(e,"P",{"data-svelte-h":!0}),d(de)!=="svelte-1lmwzzc"&&(de.innerHTML=Hl),Wt=a(e),ue=f(e,"P",{"data-svelte-h":!0}),d(ue)!=="svelte-1h0qf0f"&&(ue.innerHTML=Wl),Gt=a(e),r(Te.$$.fragment,e),It=a(e),$e=f(e,"P",{"data-svelte-h":!0}),d($e)!=="svelte-pmu9yq"&&($e.innerHTML=Gl),Zt=a(e),r(ye.$$.fragment,e),Et=a(e),ge=f(e,"P",{"data-svelte-h":!0}),d(ge)!=="svelte-umpq8u"&&(ge.innerHTML=Il),Qt=a(e),r(Je.$$.fragment,e),Vt=a(e),j=f(e,"BLOCKQUOTE",{class:!0,"data-svelte-h":!0}),d(j)!=="svelte-2zhea"&&(j.innerHTML=Zl),Xt=a(e),Ue=f(e,"P",{"data-svelte-h":!0}),d(Ue)!=="svelte-kboajh"&&(Ue.innerHTML=El),zt=a(e),be=f(e,"P",{"data-svelte-h":!0}),d(be)!=="svelte-1p27re0"&&(be.innerHTML=Ql),Yt=a(e),_=f(e,"BLOCKQUOTE",{class:!0,"data-svelte-h":!0}),d(_)!=="svelte-1vkb1bk"&&(_.innerHTML=Vl),Ft=a(e),r(we.$$.fragment,e),qt=a(e),he=f(e,"P",{"data-svelte-h":!0}),d(he)!=="svelte-1f5akmu"&&(he.textContent=Xl),Bt=a(e),r(je.$$.fragment,e),At=a(e),r(_e.$$.fragment,e),Lt=a(e),r(Ce.$$.fragment,e),Nt=a(e),r(ke.$$.fragment,e),Pt=a(e),r(ve.$$.fragment,e),St=a(e),r(xe.$$.fragment,e),Dt=a(e),r(Re.$$.fragment,e),Ot=a(e),r(He.$$.fragment,e),Kt=a(e),r(We.$$.fragment,e),el=a(e),r(Ge.$$.fragment,e),tl=a(e),r(Ie.$$.fragment,e),ll=a(e),r(Ze.$$.fragment,e),nl=a(e),C=f(e,"BLOCKQUOTE",{class:!0,"data-svelte-h":!0}),d(C)!=="svelte-1a04z6w"&&(C.innerHTML=zl),sl=a(e),r(Ee.$$.fragment,e),al=a(e),ze=f(e,"P",{}),Fl(ze).forEach(l),this.h()},h(){y($,"name","hf:doc:metadata"),y($,"content",ln),y(U,"class","tip"),y(b,"class","tip"),y(w,"class","tip"),y(h,"class","tip"),y(j,"class","tip"),y(_,"class","tip"),y(C,"class","tip")},m(e,t){Pl(document.head,$),n(e,Qe,t),n(e,g,t),n(e,Ve,t),p(J,e,t),n(e,Ye,t),p(k,e,t),n(e,Fe,t),p(v,e,t),n(e,qe,t),p(x,e,t),n(e,Be,t),p(R,e,t),n(e,Ae,t),n(e,H,t),n(e,Le,t),n(e,U,t),n(e,Ne,t),n(e,W,t),n(e,Pe,t),p(G,e,t),n(e,Se,t),p(I,e,t),n(e,De,t),n(e,Z,t),n(e,Oe,t),p(E,e,t),n(e,Ke,t),n(e,Q,t),n(e,et,t),n(e,b,t),n(e,tt,t),n(e,V,t),n(e,lt,t),p(X,e,t),n(e,nt,t),n(e,z,t),n(e,st,t),n(e,Y,t),n(e,at,t),p(F,e,t),n(e,it,t),n(e,q,t),n(e,rt,t),n(e,w,t),n(e,pt,t),n(e,B,t),n(e,ot,t),p(A,e,t),n(e,ct,t),n(e,L,t),n(e,mt,t),n(e,N,t),n(e,Mt,t),p(P,e,t),n(e,ft,t),n(e,S,t),n(e,dt,t),p(D,e,t),n(e,ut,t),p(O,e,t),n(e,Tt,t),n(e,K,t),n(e,$t,t),n(e,ee,t),n(e,yt,t),p(te,e,t),n(e,gt,t),n(e,le,t),n(e,Jt,t),p(ne,e,t),n(e,Ut,t),p(se,e,t),n(e,bt,t),n(e,h,t),n(e,wt,t),n(e,ae,t),n(e,ht,t),n(e,ie,t),n(e,jt,t),p(re,e,t),n(e,_t,t),n(e,pe,t),n(e,Ct,t),p(oe,e,t),n(e,kt,t),n(e,ce,t),n(e,vt,t),p(me,e,t),n(e,xt,t),n(e,Me,t),n(e,Rt,t),p(fe,e,t),n(e,Ht,t),n(e,de,t),n(e,Wt,t),n(e,ue,t),n(e,Gt,t),p(Te,e,t),n(e,It,t),n(e,$e,t),n(e,Zt,t),p(ye,e,t),n(e,Et,t),n(e,ge,t),n(e,Qt,t),p(Je,e,t),n(e,Vt,t),n(e,j,t),n(e,Xt,t),n(e,Ue,t),n(e,zt,t),n(e,be,t),n(e,Yt,t),n(e,_,t),n(e,Ft,t),p(we,e,t),n(e,qt,t),n(e,he,t),n(e,Bt,t),p(je,e,t),n(e,At,t),p(_e,e,t),n(e,Lt,t),p(Ce,e,t),n(e,Nt,t),p(ke,e,t),n(e,Pt,t),p(ve,e,t),n(e,St,t),p(xe,e,t),n(e,Dt,t),p(Re,e,t),n(e,Ot,t),p(He,e,t),n(e,Kt,t),p(We,e,t),n(e,el,t),p(Ge,e,t),n(e,tl,t),p(Ie,e,t),n(e,ll,t),p(Ze,e,t),n(e,nl,t),n(e,C,t),n(e,sl,t),p(Ee,e,t),n(e,al,t),n(e,ze,t),il=!0},p(e,[t]){const Yl={};t&1&&(Yl.fw=e[0]),J.$set(Yl)},i(e){il||(o(J.$$.fragment,e),o(k.$$.fragment,e),o(v.$$.fragment,e),o(x.$$.fragment,e),o(R.$$.fragment,e),o(G.$$.fragment,e),o(I.$$.fragment,e),o(E.$$.fragment,e),o(X.$$.fragment,e),o(F.$$.fragment,e),o(A.$$.fragment,e),o(P.$$.fragment,e),o(D.$$.fragment,e),o(O.$$.fragment,e),o(te.$$.fragment,e),o(ne.$$.fragment,e),o(se.$$.fragment,e),o(re.$$.fragment,e),o(oe.$$.fragment,e),o(me.$$.fragment,e),o(fe.$$.fragment,e),o(Te.$$.fragment,e),o(ye.$$.fragment,e),o(Je.$$.fragment,e),o(we.$$.fragment,e),o(je.$$.fragment,e),o(_e.$$.fragment,e),o(Ce.$$.fragment,e),o(ke.$$.fragment,e),o(ve.$$.fragment,e),o(xe.$$.fragment,e),o(Re.$$.fragment,e),o(He.$$.fragment,e),o(We.$$.fragment,e),o(Ge.$$.fragment,e),o(Ie.$$.fragment,e),o(Ze.$$.fragment,e),o(Ee.$$.fragment,e),il=!0)},o(e){c(J.$$.fragment,e),c(k.$$.fragment,e),c(v.$$.fragment,e),c(x.$$.fragment,e),c(R.$$.fragment,e),c(G.$$.fragment,e),c(I.$$.fragment,e),c(E.$$.fragment,e),c(X.$$.fragment,e),c(F.$$.fragment,e),c(A.$$.fragment,e),c(P.$$.fragment,e),c(D.$$.fragment,e),c(O.$$.fragment,e),c(te.$$.fragment,e),c(ne.$$.fragment,e),c(se.$$.fragment,e),c(re.$$.fragment,e),c(oe.$$.fragment,e),c(me.$$.fragment,e),c(fe.$$.fragment,e),c(Te.$$.fragment,e),c(ye.$$.fragment,e),c(Je.$$.fragment,e),c(we.$$.fragment,e),c(je.$$.fragment,e),c(_e.$$.fragment,e),c(Ce.$$.fragment,e),c(ke.$$.fragment,e),c(ve.$$.fragment,e),c(xe.$$.fragment,e),c(Re.$$.fragment,e),c(He.$$.fragment,e),c(We.$$.fragment,e),c(Ge.$$.fragment,e),c(Ie.$$.fragment,e),c(Ze.$$.fragment,e),c(Ee.$$.fragment,e),il=!1},d(e){e&&(l(Qe),l(g),l(Ve),l(Ye),l(Fe),l(qe),l(Be),l(Ae),l(H),l(Le),l(U),l(Ne),l(W),l(Pe),l(Se),l(De),l(Z),l(Oe),l(Ke),l(Q),l(et),l(b),l(tt),l(V),l(lt),l(nt),l(z),l(st),l(Y),l(at),l(it),l(q),l(rt),l(w),l(pt),l(B),l(ot),l(ct),l(L),l(mt),l(N),l(Mt),l(ft),l(S),l(dt),l(ut),l(Tt),l(K),l($t),l(ee),l(yt),l(gt),l(le),l(Jt),l(Ut),l(bt),l(h),l(wt),l(ae),l(ht),l(ie),l(jt),l(_t),l(pe),l(Ct),l(kt),l(ce),l(vt),l(xt),l(Me),l(Rt),l(Ht),l(de),l(Wt),l(ue),l(Gt),l(It),l($e),l(Zt),l(Et),l(ge),l(Qt),l(Vt),l(j),l(Xt),l(Ue),l(zt),l(be),l(Yt),l(_),l(Ft),l(qt),l(he),l(Bt),l(At),l(Lt),l(Nt),l(Pt),l(St),l(Dt),l(Ot),l(Kt),l(el),l(tl),l(ll),l(nl),l(C),l(sl),l(al),l(ze)),l($),m(J,e),m(k,e),m(v,e),m(x,e),m(R,e),m(G,e),m(I,e),m(E,e),m(X,e),m(F,e),m(A,e),m(P,e),m(D,e),m(O,e),m(te,e),m(ne,e),m(se,e),m(re,e),m(oe,e),m(me,e),m(fe,e),m(Te,e),m(ye,e),m(Je,e),m(we,e),m(je,e),m(_e,e),m(Ce,e),m(ke,e),m(ve,e),m(xe,e),m(Re,e),m(He,e),m(We,e),m(Ge,e),m(Ie,e),m(Ze,e),m(Ee,e)}}}const ln='{"title":"Trainer API๋กœ ๋ชจ๋ธ ๋ฏธ์„ธ ์กฐ์ •ํ•˜๊ธฐ","local":"fine-tuning-a-model-with-the-trainer-api","sections":[{"title":"ํ›ˆ๋ จ","local":"training","sections":[],"depth":3},{"title":"ํ‰๊ฐ€","local":"evaluation","sections":[],"depth":3},{"title":"๊ณ ๊ธ‰ ํ›ˆ๋ จ ๊ธฐ๋Šฅ","local":"advanced-training-features","sections":[],"depth":3},{"title":"์„น์…˜ ํ€ด์ฆˆ","local":"section-quiz","sections":[{"title":"1. Trainer ์—์„œ <code> processing_class </code> ๋งค๊ฐœ๋ณ€์ˆ˜์˜ ๋ชฉ์ ์€ ๋ฌด์—‡์ธ๊ฐ€์š”?","local":"1-trainer-์—์„œ-code-processingclass-code-๋งค๊ฐœ๋ณ€์ˆ˜์˜-๋ชฉ์ ์€-๋ฌด์—‡์ธ๊ฐ€์š”","sections":[],"depth":3},{"title":"2. ํ›ˆ๋ จ ์ค‘ ํ‰๊ฐ€๊ฐ€ ์–ผ๋งˆ๋‚˜ ์ž์ฃผ ๋ฐœ์ƒํ•˜๋Š”์ง€๋ฅผ ์ œ์–ดํ•˜๋Š” TrainingArguments ๋งค๊ฐœ๋ณ€์ˆ˜๋Š” ๋ฌด์—‡์ธ๊ฐ€์š”?","local":"2-ํ›ˆ๋ จ-์ค‘-ํ‰๊ฐ€๊ฐ€-์–ผ๋งˆ๋‚˜-์ž์ฃผ-๋ฐœ์ƒํ•˜๋Š”์ง€๋ฅผ-์ œ์–ดํ•˜๋Š”-trainingarguments-๋งค๊ฐœ๋ณ€์ˆ˜๋Š”-๋ฌด์—‡์ธ๊ฐ€์š”","sections":[],"depth":3},{"title":"3. TrainingArguments์—์„œ <code> fp16=True </code> ๋Š” ๋ฌด์—‡์„ ํ™œ์„ฑํ™”ํ•˜๋‚˜์š”?","local":"3-trainingarguments์—์„œ-code-fp16true-code-๋Š”-๋ฌด์—‡์„-ํ™œ์„ฑํ™”ํ•˜๋‚˜์š”","sections":[],"depth":3},{"title":"4. Trainer์—์„œ <code> compute_metrics </code> ํ•จ์ˆ˜์˜ ์—ญํ• ์€ ๋ฌด์—‡์ธ๊ฐ€์š”?","local":"4-trainer์—์„œ-code-computemetrics-code-ํ•จ์ˆ˜์˜-์—ญํ• ์€-๋ฌด์—‡์ธ๊ฐ€์š”","sections":[],"depth":3},{"title":"5. Trainer์— <code> eval_dataset </code> ์„ ์ œ๊ณตํ•˜์ง€ ์•Š์œผ๋ฉด ์–ด๋–ป๊ฒŒ ๋˜๋‚˜์š”?","local":"5-trainer์—-code-evaldataset-code-์„-์ œ๊ณตํ•˜์ง€-์•Š์œผ๋ฉด-์–ด๋–ป๊ฒŒ-๋˜๋‚˜์š”","sections":[],"depth":3},{"title":"6. ๊ทธ๋ ˆ์ด๋””์–ธํŠธ ๋ˆ„์ ์ด๋ž€ ๋ฌด์—‡์ด๋ฉฐ ์–ด๋–ป๊ฒŒ ํ™œ์„ฑํ™”ํ•˜๋‚˜์š”?","local":"6-๊ทธ๋ ˆ์ด๋””์–ธํŠธ-๋ˆ„์ ์ด๋ž€-๋ฌด์—‡์ด๋ฉฐ-์–ด๋–ป๊ฒŒ-ํ™œ์„ฑํ™”ํ•˜๋‚˜์š”","sections":[],"depth":3}],"depth":2}],"depth":1}';function nn(rl,$,Qe){let g="pt";return Bl(()=>{const Ve=new URLSearchParams(window.location.search);Qe(0,g=Ve.get("fw")||"pt")}),[g]}class fn extends Al{constructor($){super(),Ll(this,$,nn,tn,ql,{})}}export{fn as component};

Xet Storage Details

Size:
43.6 kB
ยท
Xet hash:
18d876946752553f436ce62eb3899353e123fdaafcb874f15f5d07917e107fd8

Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.