Buckets:

rtrm's picture
download
raw
90.3 kB
import{s as Ta,o as wa,n as Ce}from"../chunks/scheduler.37c15a92.js";import{S as Ua,i as fa,g as b,s as c,r as h,m as it,H as Ma,A as ja,h as T,f as s,c as r,j as ve,u as M,x as U,n as ct,E as Ja,k as Le,y as I,a,v as J,t as m,b as v,d as o,w as u,p as _}from"../chunks/index.2bf4358c.js";import{T as _e}from"../chunks/Tip.363c041f.js";import{Y as ua}from"../chunks/Youtube.1e50a667.js";import{C as w}from"../chunks/CodeBlock.4e987730.js";import{C as ya}from"../chunks/CourseFloatingBanner.9ff4c771.js";import{F as ga}from"../chunks/FrameworkSwitchCourse.8d4d4ab6.js";import{H as Be,E as ka}from"../chunks/getInferenceSnippets.24b50994.js";function Ia(y){let l,i;return l=new ya({props:{chapter:6,classNames:"absolute z-10 right-0 top-0",notebooks:[{label:"Google Colab",value:"https://colab.research.google.com/github/huggingface/notebooks/blob/master/course/vi/chapter6/section3b_tf.ipynb"},{label:"Aws Studio",value:"https://studiolab.sagemaker.aws/import/github/huggingface/notebooks/blob/master/course/vi/chapter6/section3b_tf.ipynb"}]}}),{c(){h(l.$$.fragment)},l(n){M(l.$$.fragment,n)},m(n,p){J(l,n,p),i=!0},i(n){i||(o(l.$$.fragment,n),i=!0)},o(n){m(l.$$.fragment,n),i=!1},d(n){u(l,n)}}}function va(y){let l,i;return l=new ya({props:{chapter:6,classNames:"absolute z-10 right-0 top-0",notebooks:[{label:"Google Colab",value:"https://colab.research.google.com/github/huggingface/notebooks/blob/master/course/vi/chapter6/section3b_pt.ipynb"},{label:"Aws Studio",value:"https://studiolab.sagemaker.aws/import/github/huggingface/notebooks/blob/master/course/vi/chapter6/section3b_pt.ipynb"}]}}),{c(){h(l.$$.fragment)},l(n){M(l.$$.fragment,n)},m(n,p){J(l,n,p),i=!0},i(n){i||(o(l.$$.fragment,n),i=!0)},o(n){m(l.$$.fragment,n),i=!1},d(n){u(l,n)}}}function _a(y){let l,i;return l=new ua({props:{id:"b3u8RzBCX9Y"}}),{c(){h(l.$$.fragment)},l(n){M(l.$$.fragment,n)},m(n,p){J(l,n,p),i=!0},i(n){i||(o(l.$$.fragment,n),i=!0)},o(n){m(l.$$.fragment,n),i=!1},d(n){u(l,n)}}}function Ba(y){let l,i;return l=new ua({props:{id:"_wxyB3j3mk4"}}),{c(){h(l.$$.fragment)},l(n){M(l.$$.fragment,n)},m(n,p){J(l,n,p),i=!0},i(n){i||(o(l.$$.fragment,n),i=!0)},o(n){m(l.$$.fragment,n),i=!1},d(n){u(l,n)}}}function Ca(y){let l,i;return l=new w({props:{code:"ZnJvbSUyMHRyYW5zZm9ybWVycyUyMGltcG9ydCUyMEF1dG9Ub2tlbml6ZXIlMkMlMjBURkF1dG9Nb2RlbEZvclF1ZXN0aW9uQW5zd2VyaW5nJTBBJTBBbW9kZWxfY2hlY2twb2ludCUyMCUzRCUyMCUyMmRpc3RpbGJlcnQtYmFzZS1jYXNlZC1kaXN0aWxsZWQtc3F1YWQlMjIlMEF0b2tlbml6ZXIlMjAlM0QlMjBBdXRvVG9rZW5pemVyLmZyb21fcHJldHJhaW5lZChtb2RlbF9jaGVja3BvaW50KSUwQW1vZGVsJTIwJTNEJTIwVEZBdXRvTW9kZWxGb3JRdWVzdGlvbkFuc3dlcmluZy5mcm9tX3ByZXRyYWluZWQobW9kZWxfY2hlY2twb2ludCklMEElMEFpbnB1dHMlMjAlM0QlMjB0b2tlbml6ZXIocXVlc3Rpb24lMkMlMjBjb250ZXh0JTJDJTIwcmV0dXJuX3RlbnNvcnMlM0QlMjJ0ZiUyMiklMEFvdXRwdXRzJTIwJTNEJTIwbW9kZWwoKippbnB1dHMp",highlighted:`<span class="hljs-keyword">from</span> transformers <span class="hljs-keyword">import</span> AutoTokenizer, TFAutoModelForQuestionAnswering
model_checkpoint = <span class="hljs-string">&quot;distilbert-base-cased-distilled-squad&quot;</span>
tokenizer = AutoTokenizer.from_pretrained(model_checkpoint)
model = TFAutoModelForQuestionAnswering.from_pretrained(model_checkpoint)
inputs = tokenizer(question, context, return_tensors=<span class="hljs-string">&quot;tf&quot;</span>)
outputs = model(**inputs)`,wrap:!1}}),{c(){h(l.$$.fragment)},l(n){M(l.$$.fragment,n)},m(n,p){J(l,n,p),i=!0},i(n){i||(o(l.$$.fragment,n),i=!0)},o(n){m(l.$$.fragment,n),i=!1},d(n){u(l,n)}}}function $a(y){let l,i;return l=new w({props:{code:"ZnJvbSUyMHRyYW5zZm9ybWVycyUyMGltcG9ydCUyMEF1dG9Ub2tlbml6ZXIlMkMlMjBBdXRvTW9kZWxGb3JRdWVzdGlvbkFuc3dlcmluZyUwQSUwQW1vZGVsX2NoZWNrcG9pbnQlMjAlM0QlMjAlMjJkaXN0aWxiZXJ0LWJhc2UtY2FzZWQtZGlzdGlsbGVkLXNxdWFkJTIyJTBBdG9rZW5pemVyJTIwJTNEJTIwQXV0b1Rva2VuaXplci5mcm9tX3ByZXRyYWluZWQobW9kZWxfY2hlY2twb2ludCklMEFtb2RlbCUyMCUzRCUyMEF1dG9Nb2RlbEZvclF1ZXN0aW9uQW5zd2VyaW5nLmZyb21fcHJldHJhaW5lZChtb2RlbF9jaGVja3BvaW50KSUwQSUwQWlucHV0cyUyMCUzRCUyMHRva2VuaXplcihxdWVzdGlvbiUyQyUyMGNvbnRleHQlMkMlMjByZXR1cm5fdGVuc29ycyUzRCUyMnB0JTIyKSUwQW91dHB1dHMlMjAlM0QlMjBtb2RlbCgqKmlucHV0cyk=",highlighted:`<span class="hljs-keyword">from</span> transformers <span class="hljs-keyword">import</span> AutoTokenizer, AutoModelForQuestionAnswering
model_checkpoint = <span class="hljs-string">&quot;distilbert-base-cased-distilled-squad&quot;</span>
tokenizer = AutoTokenizer.from_pretrained(model_checkpoint)
model = AutoModelForQuestionAnswering.from_pretrained(model_checkpoint)
inputs = tokenizer(question, context, return_tensors=<span class="hljs-string">&quot;pt&quot;</span>)
outputs = model(**inputs)`,wrap:!1}}),{c(){h(l.$$.fragment)},l(n){M(l.$$.fragment,n)},m(n,p){J(l,n,p),i=!0},i(n){i||(o(l.$$.fragment,n),i=!0)},o(n){m(l.$$.fragment,n),i=!1},d(n){u(l,n)}}}function Za(y){let l,i;return l=new w({props:{code:"KDElMkMlMjA2NiklMjAoMSUyQyUyMDY2KQ==",highlighted:'(<span class="hljs-number">1</span>, <span class="hljs-number">66</span>) (<span class="hljs-number">1</span>, <span class="hljs-number">66</span>)',wrap:!1}}),{c(){h(l.$$.fragment)},l(n){M(l.$$.fragment,n)},m(n,p){J(l,n,p),i=!0},i(n){i||(o(l.$$.fragment,n),i=!0)},o(n){m(l.$$.fragment,n),i=!1},d(n){u(l,n)}}}function xa(y){let l,i;return l=new w({props:{code:"dG9yY2guU2l6ZSglNUIxJTJDJTIwNjYlNUQpJTIwdG9yY2guU2l6ZSglNUIxJTJDJTIwNjYlNUQp",highlighted:'torch.Size([<span class="hljs-number">1</span>, <span class="hljs-number">66</span>]) torch.Size([<span class="hljs-number">1</span>, <span class="hljs-number">66</span>])',wrap:!1}}),{c(){h(l.$$.fragment)},l(n){M(l.$$.fragment,n)},m(n,p){J(l,n,p),i=!0},i(n){i||(o(l.$$.fragment,n),i=!0)},o(n){m(l.$$.fragment,n),i=!1},d(n){u(l,n)}}}function Ga(y){let l,i;return l=new w({props:{code:"aW1wb3J0JTIwdGVuc29yZmxvdyUyMGFzJTIwdGYlMEElMEFzZXF1ZW5jZV9pZHMlMjAlM0QlMjBpbnB1dHMuc2VxdWVuY2VfaWRzKCklMEElMjMlMjBDaGUlMjB0JUUxJUJBJUE1dCUyMGMlRTElQkElQTMlMjBtJUUxJUJCJThEaSUyMHRoJUUxJUJCJUE5JTIwdHIlRTElQkIlQUIlMjB0b2tlbiUyMGMlRTElQkIlQTdhJTIwbmclRTElQkIlQUYlMjBjJUUxJUJBJUEzbmglMEFtYXNrJTIwJTNEJTIwJTVCaSUyMCElM0QlMjAxJTIwZm9yJTIwaSUyMGluJTIwc2VxdWVuY2VfaWRzJTVEJTBBJTIzJTIwSGklRTElQkIlODNuJTIwdGglRTElQkIlOEIlMjB0b2tlbiUyMCU1QkNMUyU1RCUwQW1hc2slNUIwJTVEJTIwJTNEJTIwRmFsc2UlMEFtYXNrJTIwJTNEJTIwdGYuY29uc3RhbnQobWFzayklNUJOb25lJTVEJTBBJTBBc3RhcnRfbG9naXRzJTIwJTNEJTIwdGYud2hlcmUobWFzayUyQyUyMC0xMDAwMCUyQyUyMHN0YXJ0X2xvZ2l0cyklMEFlbmRfbG9naXRzJTIwJTNEJTIwdGYud2hlcmUobWFzayUyQyUyMC0xMDAwMCUyQyUyMGVuZF9sb2dpdHMp",highlighted:`<span class="hljs-keyword">import</span> tensorflow <span class="hljs-keyword">as</span> tf
sequence_ids = inputs.sequence_ids()
<span class="hljs-comment"># Che tất cả mọi thứ trừ token của ngữ cảnh</span>
mask = [i != <span class="hljs-number">1</span> <span class="hljs-keyword">for</span> i <span class="hljs-keyword">in</span> sequence_ids]
<span class="hljs-comment"># Hiển thị token [CLS]</span>
mask[<span class="hljs-number">0</span>] = <span class="hljs-literal">False</span>
mask = tf.constant(mask)[<span class="hljs-literal">None</span>]
start_logits = tf.where(mask, -<span class="hljs-number">10000</span>, start_logits)
end_logits = tf.where(mask, -<span class="hljs-number">10000</span>, end_logits)`,wrap:!1}}),{c(){h(l.$$.fragment)},l(n){M(l.$$.fragment,n)},m(n,p){J(l,n,p),i=!0},i(n){i||(o(l.$$.fragment,n),i=!0)},o(n){m(l.$$.fragment,n),i=!1},d(n){u(l,n)}}}function Va(y){let l,i;return l=new w({props:{code:"aW1wb3J0JTIwdG9yY2glMEElMEFzZXF1ZW5jZV9pZHMlMjAlM0QlMjBpbnB1dHMuc2VxdWVuY2VfaWRzKCklMEElMjMlMjBDaGUlMjB0JUUxJUJBJUE1dCUyMGMlRTElQkElQTMlMjBtJUUxJUJCJThEaSUyMHRoJUUxJUJCJUE5JTIwdHIlRTElQkIlQUIlMjB0b2tlbiUyMGMlRTElQkIlQTdhJTIwbmclRTElQkIlQUYlMjBjJUUxJUJBJUEzbmglMEFtYXNrJTIwJTNEJTIwJTVCaSUyMCElM0QlMjAxJTIwZm9yJTIwaSUyMGluJTIwc2VxdWVuY2VfaWRzJTVEJTBBJTIzJTIwSGklRTElQkIlODNuJTIwdGglRTElQkIlOEIlMjB0b2tlbiUyMCU1QkNMUyU1RCUwQW1hc2slNUIwJTVEJTIwJTNEJTIwRmFsc2UlMEFtYXNrJTIwJTNEJTIwdG9yY2gudGVuc29yKG1hc2spJTVCTm9uZSU1RCUwQSUwQXN0YXJ0X2xvZ2l0cyU1Qm1hc2slNUQlMjAlM0QlMjAtMTAwMDAlMEFlbmRfbG9naXRzJTVCbWFzayU1RCUyMCUzRCUyMC0xMDAwMA==",highlighted:`<span class="hljs-keyword">import</span> torch
sequence_ids = inputs.sequence_ids()
<span class="hljs-comment"># Che tất cả mọi thứ trừ token của ngữ cảnh</span>
mask = [i != <span class="hljs-number">1</span> <span class="hljs-keyword">for</span> i <span class="hljs-keyword">in</span> sequence_ids]
<span class="hljs-comment"># Hiển thị token [CLS]</span>
mask[<span class="hljs-number">0</span>] = <span class="hljs-literal">False</span>
mask = torch.tensor(mask)[<span class="hljs-literal">None</span>]
start_logits[mask] = -<span class="hljs-number">10000</span>
end_logits[mask] = -<span class="hljs-number">10000</span>`,wrap:!1}}),{c(){h(l.$$.fragment)},l(n){M(l.$$.fragment,n)},m(n,p){J(l,n,p),i=!0},i(n){i||(o(l.$$.fragment,n),i=!0)},o(n){m(l.$$.fragment,n),i=!1},d(n){u(l,n)}}}function Na(y){let l,i;return l=new w({props:{code:"c3RhcnRfcHJvYmFiaWxpdGllcyUyMCUzRCUyMHRmLm1hdGguc29mdG1heChzdGFydF9sb2dpdHMlMkMlMjBheGlzJTNELTEpJTVCMCU1RC5udW1weSgpJTBBZW5kX3Byb2JhYmlsaXRpZXMlMjAlM0QlMjB0Zi5tYXRoLnNvZnRtYXgoZW5kX2xvZ2l0cyUyQyUyMGF4aXMlM0QtMSklNUIwJTVELm51bXB5KCk=",highlighted:`start_probabilities = tf.math.softmax(start_logits, axis=-<span class="hljs-number">1</span>)[<span class="hljs-number">0</span>].numpy()
end_probabilities = tf.math.softmax(end_logits, axis=-<span class="hljs-number">1</span>)[<span class="hljs-number">0</span>].numpy()`,wrap:!1}}),{c(){h(l.$$.fragment)},l(n){M(l.$$.fragment,n)},m(n,p){J(l,n,p),i=!0},i(n){i||(o(l.$$.fragment,n),i=!0)},o(n){m(l.$$.fragment,n),i=!1},d(n){u(l,n)}}}function Ra(y){let l,i;return l=new w({props:{code:"c3RhcnRfcHJvYmFiaWxpdGllcyUyMCUzRCUyMHRvcmNoLm5uLmZ1bmN0aW9uYWwuc29mdG1heChzdGFydF9sb2dpdHMlMkMlMjBkaW0lM0QtMSklNUIwJTVEJTBBZW5kX3Byb2JhYmlsaXRpZXMlMjAlM0QlMjB0b3JjaC5ubi5mdW5jdGlvbmFsLnNvZnRtYXgoZW5kX2xvZ2l0cyUyQyUyMGRpbSUzRC0xKSU1QjAlNUQ=",highlighted:`start_probabilities = torch.nn.functional.softmax(start_logits, dim=-<span class="hljs-number">1</span>)[<span class="hljs-number">0</span>]
end_probabilities = torch.nn.functional.softmax(end_logits, dim=-<span class="hljs-number">1</span>)[<span class="hljs-number">0</span>]`,wrap:!1}}),{c(){h(l.$$.fragment)},l(n){M(l.$$.fragment,n)},m(n,p){J(l,n,p),i=!0},i(n){i||(o(l.$$.fragment,n),i=!0)},o(n){m(l.$$.fragment,n),i=!1},d(n){u(l,n)}}}function Wa(y){let l,i="Sau đó, chúng tôi sẽ che các giá trị trong đó <code>start_index &gt; end_index</code> bằng cách đặt chúng thành <code>0</code> (các xác suất khác đều là số dương). Hàm <code>np.triu()</code> trả về phần tam giác phía trên của tensor 2D được truyền dưới dạng tham số, vì vậy nó sẽ thực hiện việc che đó cho chúng ta:",n,p,d;return p=new w({props:{code:"aW1wb3J0JTIwbnVtcHklMjBhcyUyMG5wJTBBJTBBc2NvcmVzJTIwJTNEJTIwbnAudHJpdShzY29yZXMp",highlighted:`<span class="hljs-keyword">import</span> numpy <span class="hljs-keyword">as</span> np
scores = np.triu(scores)`,wrap:!1}}),{c(){l=b("p"),l.innerHTML=i,n=c(),h(p.$$.fragment)},l(f){l=T(f,"P",{"data-svelte-h":!0}),U(l)!=="svelte-1oqxu7v"&&(l.innerHTML=i),n=r(f),M(p.$$.fragment,f)},m(f,j){a(f,l,j),a(f,n,j),J(p,f,j),d=!0},i(f){d||(o(p.$$.fragment,f),d=!0)},o(f){m(p.$$.fragment,f),d=!1},d(f){f&&(s(l),s(n)),u(p,f)}}}function Xa(y){let l,i="Sau đó, chúng tôi sẽ che các giá trị trong đó <code>start_index &gt; end_index</code> bằng cách đặt chúng thành <code>0</code> (các xác suất khác đều là số dương). Hàm <code>torch.triu()</code> trả về phần tam giác phía trên của tensor 2D được truyền dưới dạng tham số, vì vậy nó sẽ thực hiện việc che đó cho chúng ta:",n,p,d;return p=new w({props:{code:"c2NvcmVzJTIwJTNEJTIwdG9yY2gudHJpdShzY29yZXMp",highlighted:"scores = torch.triu(scores)",wrap:!1}}),{c(){l=b("p"),l.innerHTML=i,n=c(),h(p.$$.fragment)},l(f){l=T(f,"P",{"data-svelte-h":!0}),U(l)!=="svelte-1cu0hmx"&&(l.innerHTML=i),n=r(f),M(p.$$.fragment,f)},m(f,j){a(f,l,j),a(f,n,j),J(p,f,j),d=!0},i(f){d||(o(p.$$.fragment,f),d=!0)},o(f){m(p.$$.fragment,f),d=!1},d(f){f&&(s(l),s(n)),u(p,f)}}}function za(y){let l,i="✏️ <strong>Thử nghiệm thôi!</strong> Tính chỉ mục bắt đầu và kết thúc cho năm cấu trả lời đầu tiện.";return{c(){l=b("p"),l.innerHTML=i},l(n){l=T(n,"P",{"data-svelte-h":!0}),U(l)!=="svelte-kp1d7g"&&(l.innerHTML=i)},m(n,p){a(n,l,p)},p:Ce,d(n){n&&s(l)}}}function Qa(y){let l,i="✏️ <strong>Thử nghiệm thôi!</strong> Sử dụng điểm tốt nhất mà bạn đã tính toán trước đó để hiển thị năm câu trả lời có khả năng nhất. Để kiểm tra kết quả của bạn, hãy quay lại đường dẫn đầu tiên và truyền vào <code>top_k=5</code> khi gọi nó.";return{c(){l=b("p"),l.innerHTML=i},l(n){l=T(n,"P",{"data-svelte-h":!0}),U(l)!=="svelte-1y0c4jh"&&(l.innerHTML=i)},m(n,p){a(n,l,p)},p:Ce,d(n){n&&s(l)}}}function Ea(y){let l,i,n,p;return l=new w({props:{code:"XyUyMCUzRCUyMGlucHV0cy5wb3AoJTIyb3ZlcmZsb3dfdG9fc2FtcGxlX21hcHBpbmclMjIpJTBBb2Zmc2V0cyUyMCUzRCUyMGlucHV0cy5wb3AoJTIyb2Zmc2V0X21hcHBpbmclMjIpJTBBJTBBaW5wdXRzJTIwJTNEJTIwaW5wdXRzLmNvbnZlcnRfdG9fdGVuc29ycyglMjJ0ZiUyMiklMEFwcmludChpbnB1dHMlNUIlMjJpbnB1dF9pZHMlMjIlNUQuc2hhcGUp",highlighted:`_ = inputs.pop(<span class="hljs-string">&quot;overflow_to_sample_mapping&quot;</span>)
offsets = inputs.pop(<span class="hljs-string">&quot;offset_mapping&quot;</span>)
inputs = inputs.convert_to_tensors(<span class="hljs-string">&quot;tf&quot;</span>)
<span class="hljs-built_in">print</span>(inputs[<span class="hljs-string">&quot;input_ids&quot;</span>].shape)`,wrap:!1}}),n=new w({props:{code:"KDIlMkMlMjAzODQp",highlighted:'(<span class="hljs-number">2</span>, <span class="hljs-number">384</span>)',wrap:!1}}),{c(){h(l.$$.fragment),i=c(),h(n.$$.fragment)},l(d){M(l.$$.fragment,d),i=r(d),M(n.$$.fragment,d)},m(d,f){J(l,d,f),a(d,i,f),J(n,d,f),p=!0},i(d){p||(o(l.$$.fragment,d),o(n.$$.fragment,d),p=!0)},o(d){m(l.$$.fragment,d),m(n.$$.fragment,d),p=!1},d(d){d&&s(i),u(l,d),u(n,d)}}}function Ha(y){let l,i,n,p;return l=new w({props:{code:"XyUyMCUzRCUyMGlucHV0cy5wb3AoJTIyb3ZlcmZsb3dfdG9fc2FtcGxlX21hcHBpbmclMjIpJTBBb2Zmc2V0cyUyMCUzRCUyMGlucHV0cy5wb3AoJTIyb2Zmc2V0X21hcHBpbmclMjIpJTBBJTBBaW5wdXRzJTIwJTNEJTIwaW5wdXRzLmNvbnZlcnRfdG9fdGVuc29ycyglMjJwdCUyMiklMEFwcmludChpbnB1dHMlNUIlMjJpbnB1dF9pZHMlMjIlNUQuc2hhcGUp",highlighted:`_ = inputs.pop(<span class="hljs-string">&quot;overflow_to_sample_mapping&quot;</span>)
offsets = inputs.pop(<span class="hljs-string">&quot;offset_mapping&quot;</span>)
inputs = inputs.convert_to_tensors(<span class="hljs-string">&quot;pt&quot;</span>)
<span class="hljs-built_in">print</span>(inputs[<span class="hljs-string">&quot;input_ids&quot;</span>].shape)`,wrap:!1}}),n=new w({props:{code:"dG9yY2guU2l6ZSglNUIyJTJDJTIwMzg0JTVEKQ==",highlighted:'torch.Size([<span class="hljs-number">2</span>, <span class="hljs-number">384</span>])',wrap:!1}}),{c(){h(l.$$.fragment),i=c(),h(n.$$.fragment)},l(d){M(l.$$.fragment,d),i=r(d),M(n.$$.fragment,d)},m(d,f){J(l,d,f),a(d,i,f),J(n,d,f),p=!0},i(d){p||(o(l.$$.fragment,d),o(n.$$.fragment,d),p=!0)},o(d){m(l.$$.fragment,d),m(n.$$.fragment,d),p=!1},d(d){d&&s(i),u(l,d),u(n,d)}}}function Fa(y){let l,i;return l=new w({props:{code:"KDIlMkMlMjAzODQpJTIwKDIlMkMlMjAzODQp",highlighted:'(<span class="hljs-number">2</span>, <span class="hljs-number">384</span>) (<span class="hljs-number">2</span>, <span class="hljs-number">384</span>)',wrap:!1}}),{c(){h(l.$$.fragment)},l(n){M(l.$$.fragment,n)},m(n,p){J(l,n,p),i=!0},i(n){i||(o(l.$$.fragment,n),i=!0)},o(n){m(l.$$.fragment,n),i=!1},d(n){u(l,n)}}}function Ya(y){let l,i;return l=new w({props:{code:"dG9yY2guU2l6ZSglNUIyJTJDJTIwMzg0JTVEKSUyMHRvcmNoLlNpemUoJTVCMiUyQyUyMDM4NCU1RCk=",highlighted:'torch.Size([<span class="hljs-number">2</span>, <span class="hljs-number">384</span>]) torch.Size([<span class="hljs-number">2</span>, <span class="hljs-number">384</span>])',wrap:!1}}),{c(){h(l.$$.fragment)},l(n){M(l.$$.fragment,n)},m(n,p){J(l,n,p),i=!0},i(n){i||(o(l.$$.fragment,n),i=!0)},o(n){m(l.$$.fragment,n),i=!1},d(n){u(l,n)}}}function Sa(y){let l,i;return l=new w({props:{code:"c2VxdWVuY2VfaWRzJTIwJTNEJTIwaW5wdXRzLnNlcXVlbmNlX2lkcygpJTBBJTIzJTIwQ2hlJTIwdCVFMSVCQSVBNXQlMjBjJUUxJUJBJUEzJTIwbSVFMSVCQiU4RGklMjB0aCVFMSVCQiVBOSUyMHRyJUUxJUJCJUFCJTIwdG9rZW4lMjBjJUUxJUJCJUE3YSUyMG5nJUUxJUJCJUFGJTIwYyVFMSVCQSVBM25oJTBBbWFzayUyMCUzRCUyMCU1QmklMjAhJTNEJTIwMSUyMGZvciUyMGklMjBpbiUyMHNlcXVlbmNlX2lkcyU1RCUwQSUyMyUyMEhpJUUxJUJCJTgzbiUyMHRoJUUxJUJCJThCJTIwdG9rZW4lMjAlNUJDTFMlNUQlMEFtYXNrJTVCMCU1RCUyMCUzRCUyMEZhbHNlJTBBJTIzJTIwQ2hlJTIwdCVFMSVCQSVBNXQlMjBjJUUxJUJBJUEzJTIwdG9rZW4lMjAlNUJQQUQlNUQlMEFtYXNrJTIwJTNEJTIwdGYubWF0aC5sb2dpY2FsX29yKHRmLmNvbnN0YW50KG1hc2spJTVCTm9uZSU1RCUyQyUyMGlucHV0cyU1QiUyMmF0dGVudGlvbl9tYXNrJTIyJTVEJTIwJTNEJTNEJTIwMCklMEElMEFzdGFydF9sb2dpdHMlMjAlM0QlMjB0Zi53aGVyZShtYXNrJTJDJTIwLTEwMDAwJTJDJTIwc3RhcnRfbG9naXRzKSUwQWVuZF9sb2dpdHMlMjAlM0QlMjB0Zi53aGVyZShtYXNrJTJDJTIwLTEwMDAwJTJDJTIwZW5kX2xvZ2l0cyk=",highlighted:`sequence_ids = inputs.sequence_ids()
<span class="hljs-comment"># Che tất cả mọi thứ trừ token của ngữ cảnh</span>
mask = [i != <span class="hljs-number">1</span> <span class="hljs-keyword">for</span> i <span class="hljs-keyword">in</span> sequence_ids]
<span class="hljs-comment"># Hiển thị token [CLS]</span>
mask[<span class="hljs-number">0</span>] = <span class="hljs-literal">False</span>
<span class="hljs-comment"># Che tất cả token [PAD]</span>
mask = tf.math.logical_or(tf.constant(mask)[<span class="hljs-literal">None</span>], inputs[<span class="hljs-string">&quot;attention_mask&quot;</span>] == <span class="hljs-number">0</span>)
start_logits = tf.where(mask, -<span class="hljs-number">10000</span>, start_logits)
end_logits = tf.where(mask, -<span class="hljs-number">10000</span>, end_logits)`,wrap:!1}}),{c(){h(l.$$.fragment)},l(n){M(l.$$.fragment,n)},m(n,p){J(l,n,p),i=!0},i(n){i||(o(l.$$.fragment,n),i=!0)},o(n){m(l.$$.fragment,n),i=!1},d(n){u(l,n)}}}function Aa(y){let l,i;return l=new w({props:{code:"c2VxdWVuY2VfaWRzJTIwJTNEJTIwaW5wdXRzLnNlcXVlbmNlX2lkcygpJTBBJTIzJTIwQ2hlJTIwdCVFMSVCQSVBNXQlMjBjJUUxJUJBJUEzJTIwbSVFMSVCQiU4RGklMjB0aCVFMSVCQiVBOSUyMHRyJUUxJUJCJUFCJTIwdG9rZW4lMjBjJUUxJUJCJUE3YSUyMG5nJUUxJUJCJUFGJTIwYyVFMSVCQSVBM25oJTBBbWFzayUyMCUzRCUyMCU1QmklMjAhJTNEJTIwMSUyMGZvciUyMGklMjBpbiUyMHNlcXVlbmNlX2lkcyU1RCUwQSUyMyUyMEhpJUUxJUJCJTgzbiUyMHRoJUUxJUJCJThCJTIwdG9rZW4lMjAlNUJDTFMlNUQlMEFtYXNrJTVCMCU1RCUyMCUzRCUyMEZhbHNlJTBBJTIzJTIwQ2hlJTIwdCVFMSVCQSVBNXQlMjBjJUUxJUJBJUEzJTIwdG9rZW4lMjAlNUJQQUQlNUQlMEFtYXNrJTIwJTNEJTIwdG9yY2gubG9naWNhbF9vcih0b3JjaC50ZW5zb3IobWFzayklNUJOb25lJTVEJTJDJTIwKGlucHV0cyU1QiUyMmF0dGVudGlvbl9tYXNrJTIyJTVEJTIwJTNEJTNEJTIwMCkpJTBBJTBBc3RhcnRfbG9naXRzJTVCbWFzayU1RCUyMCUzRCUyMC0xMDAwMCUwQWVuZF9sb2dpdHMlNUJtYXNrJTVEJTIwJTNEJTIwLTEwMDAw",highlighted:`sequence_ids = inputs.sequence_ids()
<span class="hljs-comment"># Che tất cả mọi thứ trừ token của ngữ cảnh</span>
mask = [i != <span class="hljs-number">1</span> <span class="hljs-keyword">for</span> i <span class="hljs-keyword">in</span> sequence_ids]
<span class="hljs-comment"># Hiển thị token [CLS]</span>
mask[<span class="hljs-number">0</span>] = <span class="hljs-literal">False</span>
<span class="hljs-comment"># Che tất cả token [PAD]</span>
mask = torch.logical_or(torch.tensor(mask)[<span class="hljs-literal">None</span>], (inputs[<span class="hljs-string">&quot;attention_mask&quot;</span>] == <span class="hljs-number">0</span>))
start_logits[mask] = -<span class="hljs-number">10000</span>
end_logits[mask] = -<span class="hljs-number">10000</span>`,wrap:!1}}),{c(){h(l.$$.fragment)},l(n){M(l.$$.fragment,n)},m(n,p){J(l,n,p),i=!0},i(n){i||(o(l.$$.fragment,n),i=!0)},o(n){m(l.$$.fragment,n),i=!1},d(n){u(l,n)}}}function qa(y){let l,i;return l=new w({props:{code:"c3RhcnRfcHJvYmFiaWxpdGllcyUyMCUzRCUyMHRmLm1hdGguc29mdG1heChzdGFydF9sb2dpdHMlMkMlMjBheGlzJTNELTEpLm51bXB5KCklMEFlbmRfcHJvYmFiaWxpdGllcyUyMCUzRCUyMHRmLm1hdGguc29mdG1heChlbmRfbG9naXRzJTJDJTIwYXhpcyUzRC0xKS5udW1weSgp",highlighted:`start_probabilities = tf.math.softmax(start_logits, axis=-<span class="hljs-number">1</span>).numpy()
end_probabilities = tf.math.softmax(end_logits, axis=-<span class="hljs-number">1</span>).numpy()`,wrap:!1}}),{c(){h(l.$$.fragment)},l(n){M(l.$$.fragment,n)},m(n,p){J(l,n,p),i=!0},i(n){i||(o(l.$$.fragment,n),i=!0)},o(n){m(l.$$.fragment,n),i=!1},d(n){u(l,n)}}}function La(y){let l,i;return l=new w({props:{code:"c3RhcnRfcHJvYmFiaWxpdGllcyUyMCUzRCUyMHRvcmNoLm5uLmZ1bmN0aW9uYWwuc29mdG1heChzdGFydF9sb2dpdHMlMkMlMjBkaW0lM0QtMSklMEFlbmRfcHJvYmFiaWxpdGllcyUyMCUzRCUyMHRvcmNoLm5uLmZ1bmN0aW9uYWwuc29mdG1heChlbmRfbG9naXRzJTJDJTIwZGltJTNELTEp",highlighted:`start_probabilities = torch.nn.functional.softmax(start_logits, dim=-<span class="hljs-number">1</span>)
end_probabilities = torch.nn.functional.softmax(end_logits, dim=-<span class="hljs-number">1</span>)`,wrap:!1}}),{c(){h(l.$$.fragment)},l(n){M(l.$$.fragment,n)},m(n,p){J(l,n,p),i=!0},i(n){i||(o(l.$$.fragment,n),i=!0)},o(n){m(l.$$.fragment,n),i=!1},d(n){u(l,n)}}}function Da(y){let l,i;return l=new w({props:{code:"Y2FuZGlkYXRlcyUyMCUzRCUyMCU1QiU1RCUwQWZvciUyMHN0YXJ0X3Byb2JzJTJDJTIwZW5kX3Byb2JzJTIwaW4lMjB6aXAoc3RhcnRfcHJvYmFiaWxpdGllcyUyQyUyMGVuZF9wcm9iYWJpbGl0aWVzKSUzQSUwQSUyMCUyMCUyMCUyMHNjb3JlcyUyMCUzRCUyMHN0YXJ0X3Byb2JzJTVCJTNBJTJDJTIwTm9uZSU1RCUyMColMjBlbmRfcHJvYnMlNUJOb25lJTJDJTIwJTNBJTVEJTBBJTIwJTIwJTIwJTIwaWR4JTIwJTNEJTIwbnAudHJpdShzY29yZXMpLmFyZ21heCgpLml0ZW0oKSUwQSUwQSUyMCUyMCUyMCUyMHN0YXJ0X2lkeCUyMCUzRCUyMGlkeCUyMCUyRiUyRiUyMHNjb3Jlcy5zaGFwZSU1QjElNUQlMEElMjAlMjAlMjAlMjBlbmRfaWR4JTIwJTNEJTIwaWR4JTIwJTI1JTIwc2NvcmVzLnNoYXBlJTVCMSU1RCUwQSUyMCUyMCUyMCUyMHNjb3JlJTIwJTNEJTIwc2NvcmVzJTVCc3RhcnRfaWR4JTJDJTIwZW5kX2lkeCU1RC5pdGVtKCklMEElMjAlMjAlMjAlMjBjYW5kaWRhdGVzLmFwcGVuZCgoc3RhcnRfaWR4JTJDJTIwZW5kX2lkeCUyQyUyMHNjb3JlKSklMEElMEFwcmludChjYW5kaWRhdGVzKQ==",highlighted:`candidates = []
<span class="hljs-keyword">for</span> start_probs, end_probs <span class="hljs-keyword">in</span> <span class="hljs-built_in">zip</span>(start_probabilities, end_probabilities):
scores = start_probs[:, <span class="hljs-literal">None</span>] * end_probs[<span class="hljs-literal">None</span>, :]
idx = np.triu(scores).argmax().item()
start_idx = idx // scores.shape[<span class="hljs-number">1</span>]
end_idx = idx % scores.shape[<span class="hljs-number">1</span>]
score = scores[start_idx, end_idx].item()
candidates.append((start_idx, end_idx, score))
<span class="hljs-built_in">print</span>(candidates)`,wrap:!1}}),{c(){h(l.$$.fragment)},l(n){M(l.$$.fragment,n)},m(n,p){J(l,n,p),i=!0},i(n){i||(o(l.$$.fragment,n),i=!0)},o(n){m(l.$$.fragment,n),i=!1},d(n){u(l,n)}}}function Pa(y){let l,i;return l=new w({props:{code:"Y2FuZGlkYXRlcyUyMCUzRCUyMCU1QiU1RCUwQWZvciUyMHN0YXJ0X3Byb2JzJTJDJTIwZW5kX3Byb2JzJTIwaW4lMjB6aXAoc3RhcnRfcHJvYmFiaWxpdGllcyUyQyUyMGVuZF9wcm9iYWJpbGl0aWVzKSUzQSUwQSUyMCUyMCUyMCUyMHNjb3JlcyUyMCUzRCUyMHN0YXJ0X3Byb2JzJTVCJTNBJTJDJTIwTm9uZSU1RCUyMColMjBlbmRfcHJvYnMlNUJOb25lJTJDJTIwJTNBJTVEJTBBJTIwJTIwJTIwJTIwaWR4JTIwJTNEJTIwdG9yY2gudHJpdShzY29yZXMpLmFyZ21heCgpLml0ZW0oKSUwQSUwQSUyMCUyMCUyMCUyMHN0YXJ0X2lkeCUyMCUzRCUyMGlkeCUyMCUyRiUyRiUyMHNjb3Jlcy5zaGFwZSU1QjElNUQlMEElMjAlMjAlMjAlMjBlbmRfaWR4JTIwJTNEJTIwaWR4JTIwJTI1JTIwc2NvcmVzLnNoYXBlJTVCMSU1RCUwQSUyMCUyMCUyMCUyMHNjb3JlJTIwJTNEJTIwc2NvcmVzJTVCc3RhcnRfaWR4JTJDJTIwZW5kX2lkeCU1RC5pdGVtKCklMEElMjAlMjAlMjAlMjBjYW5kaWRhdGVzLmFwcGVuZCgoc3RhcnRfaWR4JTJDJTIwZW5kX2lkeCUyQyUyMHNjb3JlKSklMEElMEFwcmludChjYW5kaWRhdGVzKQ==",highlighted:`candidates = []
<span class="hljs-keyword">for</span> start_probs, end_probs <span class="hljs-keyword">in</span> <span class="hljs-built_in">zip</span>(start_probabilities, end_probabilities):
scores = start_probs[:, <span class="hljs-literal">None</span>] * end_probs[<span class="hljs-literal">None</span>, :]
idx = torch.triu(scores).argmax().item()
start_idx = idx // scores.shape[<span class="hljs-number">1</span>]
end_idx = idx % scores.shape[<span class="hljs-number">1</span>]
score = scores[start_idx, end_idx].item()
candidates.append((start_idx, end_idx, score))
<span class="hljs-built_in">print</span>(candidates)`,wrap:!1}}),{c(){h(l.$$.fragment)},l(n){M(l.$$.fragment,n)},m(n,p){J(l,n,p),i=!0},i(n){i||(o(l.$$.fragment,n),i=!0)},o(n){m(l.$$.fragment,n),i=!1},d(n){u(l,n)}}}function Ka(y){let l,i="✏️ <strong>Thử nghiệm thôi!</strong> Hãy điều chỉnh đoạn mã trên để trả về điểm và khoảng cho năm câu trả lời có nhiều khả năng nhất (tổng cộng, không phải cho mỗi đoạn).";return{c(){l=b("p"),l.innerHTML=i},l(n){l=T(n,"P",{"data-svelte-h":!0}),U(l)!=="svelte-24pghw"&&(l.innerHTML=i)},m(n,p){a(n,l,p)},p:Ce,d(n){n&&s(l)}}}function Oa(y){let l,i="✏️ <strong>Thử nghiệm thôi!</strong> Sử dụng điểm tốt nhất bạn đã tính toán trước đó để hiển thị năm câu trả lời có khả năng xảy ra nhất (cho toàn bộ ngữ cảnh, không phải từng đoạn). Để kiểm tra kết quả của bạn, hãy quay lại pipeline đầu tiên và truyền vào <code>top_k=5</code> khi gọi nó.";return{c(){l=b("p"),l.innerHTML=i},l(n){l=T(n,"P",{"data-svelte-h":!0}),U(l)!=="svelte-497a89"&&(l.innerHTML=i)},m(n,p){a(n,l,p)},p:Ce,d(n){n&&s(l)}}}function ti(y){let l,i,n,p,d,f,j,tl,B,C,Nn,rt,De="Giờ chúng ta sẽ đi sâu vào pipeline <code>question-answering</code> và xem cách tận dụng các offset để lấy câu trả lời cho các câu hỏi dựa theo từ ngữ cảnh, giống như chúng ta đã làm với các thực thể được nhóm trong phần trước. Sau đó, chúng ta sẽ xem làm thế nào có thể đối phó với những ngữ cảnh rất dài mà cuối cùng lại bị cắt bớt. Bạn có thể bỏ qua phần này nếu không quan tâm đến tác vụ hỏi đáp.",nl,$,Z,Rn,mt,ll,ot,Pe='Như đã thấy trong <a href="/course/chapter1">Chương 1</a>, ta có thể sử dụng pipeline <code>question-answering</code> như sau để nhận được câu trả lời cho câu hỏi:',el,pt,sl,ht,al,Mt,Ke="Không như các pipeline khác không thể cắt gọn và chia văn bản dài hơn độ dài tối đa cho phép của mô hình (dẫn đến bỏ lỡ những thông tin ở phần cuối văn bản), pipeline này có thể xử lý tốt với những ngữ cảnh dài và sẽ trả về câu trả lời kể cả khi nó nằm ở cuối văn bản:",il,Jt,cl,ut,rl,yt,Oe="Hãy cùng nhau xem nó làm thế nào!",ml,dt,ol,bt,ts='Như những pipeline khác, ta sẽ bắt đầu với việc tokenize đầu vào và sau đó truyền chúng vào trong mô hình. Mặc định checkpoint được sử dụng cho pipeline <code>question-answering</code> là <a href="https://huggingface.co/distilbert-base-cased-distilled-squad" rel="nofollow"><code>distilbert-base-cased-distilled-squad</code></a> ( “squad” trong tên bắt nguồn từ bộ dữ liệu mà mô hình sử dụng để tinh chỉnh; ta sẽ nói sâu hơn về bộ dữ liệu SQuAD này ở <a href="/course/chapter7/7">Chương 7</a>):',pl,x,G,Wn,Tt,ns="Lưu ý rằng chúng ta tokenize câu hỏi và ngữ cảnh như một cặp, với câu hỏi đứng trước.",hl,nt,ls='<img class="block dark:hidden" src="https://huggingface.co/datasets/huggingface-course/documentation-images/resolve/main/en/chapter6/question_tokens.svg" alt="An example of tokenization of question and context"/> <img class="hidden dark:block" src="https://huggingface.co/datasets/huggingface-course/documentation-images/resolve/main/en/chapter6/question_tokens-dark.svg" alt="An example of tokenization of question and context"/>',Ml,wt,es="Các mô hình hỏi đáp hoạt động hơi khác so với các mô hình mà ta đã thấy cho đến nay. Sử dụng hình trên làm ví dụ, mô hình đã được huấn luyện để dự đoán chỉ mục của token bắt đầu câu trả lời (ở đây là 21) và chỉ mục của token nơi câu trả lời kết thúc (ở đây là 24). Đây là lý do tại sao các mô hình đó không trả về một tensor logit mà là hai: một cho các logit tương ứng với token bắt đầu của câu trả lời và một cho các các logit tương ứng với token kết thúc của câu trả lời. Vì trong trường hợp này, chúng ta chỉ có một đầu vào chứa 66 token, ta nhận được:",Jl,Ut,ul,V,N,Xn,ft,ss="Để chuyển đổi các logit đó thành xác suất, chúng ta sẽ áp dụng một hàm softmax - nhưng trước đó, chúng ta cần đảm bảo rằng chúng ta che dấu các chỉ mục không phải là một phần của ngữ cảnh. Đầu vào của chúng tôi là <code>[CLS] question [SEP] context [SEP]</code>, vì vậy chúng ta cần che dấu các token của câu hỏi cũng như token <code>[SEP]</code>. Tuy nhiên, chúng ta sẽ giữ token <code>[CLS]</code> vì một số mô hình sử dụng nó để chỉ ra rằng câu trả lời không nằm trong ngữ cảnh.",yl,jt,as="Vì chúng ta sẽ áp dụng softmax sau đó, chúng ta chỉ cần thay thế các logit muốn che bằng một số âm lớn. Ở đây, chúng ta sử dụng <code>-10000</code>:",dl,R,W,zn,gt,is="Giờ chúng ta đã che các logit tương ứng với các vị trí mà chúng ta không muốn dự đoán, chúng ta có thể áp dụng softmax:",bl,X,z,Qn,kt,cs="Ở giai đoạn này, chúng ta có thể lấy argmax xác suất bắt đầu và kết thúc - nhưng chúng ta có thể kết thúc với chỉ mục bắt đầu lớn hơn kết thúc, vì vậy chúng ta cần thực hiện thêm một số biện pháp phòng ngừa. Chúng ta sẽ tính toán xác suất của từng <code>start_index</code> và <code>end_index</code> có thể trong đó <code>start_index &lt;= end_index</code>, sau đó lấy <code>(start_index, end_index)</code> với xác suất cao nhất.",Tl,g,$e,En,rs="start_index",Ze,Hn,ms="end_index",xe,Fn,os="start_index",Ge,Yn,ps="end_index",Ve,wl,da='<span class="katex-display"><span class="katex"><span class="katex-mathml"><math xmlns="http://www.w3.org/1998/Math/MathML" display="block"><semantics><mrow><mrow><mi mathvariant="normal">s</mi><mi mathvariant="normal">t</mi><mi mathvariant="normal">a</mi><mi mathvariant="normal">r</mi><mi mathvariant="normal">t</mi><mi mathvariant="normal">_</mi><mi mathvariant="normal">p</mi><mi mathvariant="normal">r</mi><mi mathvariant="normal">o</mi><mi mathvariant="normal">b</mi><mi mathvariant="normal">a</mi><mi mathvariant="normal">b</mi><mi mathvariant="normal">i</mi><mi mathvariant="normal">l</mi><mi mathvariant="normal">i</mi><mi mathvariant="normal">t</mi><mi mathvariant="normal">i</mi><mi mathvariant="normal">e</mi><mi mathvariant="normal">s</mi></mrow><mo stretchy="false">[</mo><mrow><mi mathvariant="normal">s</mi><mi mathvariant="normal">t</mi><mi mathvariant="normal">a</mi><mi mathvariant="normal">r</mi><mi mathvariant="normal">t</mi><mi mathvariant="normal">_</mi><mi mathvariant="normal">i</mi><mi mathvariant="normal">n</mi><mi mathvariant="normal">d</mi><mi mathvariant="normal">e</mi><mi mathvariant="normal">x</mi></mrow><mo stretchy="false">]</mo><mo>×</mo><mrow><mi mathvariant="normal">e</mi><mi mathvariant="normal">n</mi><mi mathvariant="normal">d</mi><mi mathvariant="normal">_</mi><mi mathvariant="normal">p</mi><mi mathvariant="normal">r</mi><mi mathvariant="normal">o</mi><mi mathvariant="normal">b</mi><mi mathvariant="normal">a</mi><mi mathvariant="normal">b</mi><mi mathvariant="normal">i</mi><mi mathvariant="normal">l</mi><mi mathvariant="normal">i</mi><mi mathvariant="normal">t</mi><mi mathvariant="normal">i</mi><mi mathvariant="normal">e</mi><mi mathvariant="normal">s</mi></mrow><mo stretchy="false">[</mo><mrow><mi mathvariant="normal">e</mi><mi mathvariant="normal">n</mi><mi mathvariant="normal">d</mi><mi mathvariant="normal">_</mi><mi mathvariant="normal">i</mi><mi mathvariant="normal">n</mi><mi mathvariant="normal">d</mi><mi mathvariant="normal">e</mi><mi mathvariant="normal">x</mi></mrow><mo stretchy="false">]</mo></mrow><annotation encoding="application/x-tex">\\mathrm{start\\_probabilities}[\\mathrm{start\\_index}] \\times \\mathrm{end\\_probabilities}[\\mathrm{end\\_index}]</annotation></semantics></math></span><span class="katex-html" aria-hidden="true"><span class="base"><span class="strut" style="height:1.06em;vertical-align:-0.31em;"></span><span class="mord"><span class="mord mathrm">start_probabilities</span></span><span class="mopen">[</span><span class="mord"><span class="mord mathrm">start_index</span></span><span class="mclose">]</span><span class="mspace" style="margin-right:0.2222em;"></span><span class="mbin">×</span><span class="mspace" style="margin-right:0.2222em;"></span></span><span class="base"><span class="strut" style="height:1.06em;vertical-align:-0.31em;"></span><span class="mord"><span class="mord mathrm">end_probabilities</span></span><span class="mopen">[</span><span class="mord"><span class="mord mathrm">end_index</span></span><span class="mclose">]</span></span></span></span></span>',Ul,O,Ne,fl,ba='<span class="katex"><span class="katex-mathml"><math xmlns="http://www.w3.org/1998/Math/MathML"><semantics><mrow><mrow><mi mathvariant="normal">s</mi><mi mathvariant="normal">t</mi><mi mathvariant="normal">a</mi><mi mathvariant="normal">r</mi><mi mathvariant="normal">t</mi><mi mathvariant="normal">_</mi><mi mathvariant="normal">p</mi><mi mathvariant="normal">r</mi><mi mathvariant="normal">o</mi><mi mathvariant="normal">b</mi><mi mathvariant="normal">a</mi><mi mathvariant="normal">b</mi><mi mathvariant="normal">i</mi><mi mathvariant="normal">l</mi><mi mathvariant="normal">i</mi><mi mathvariant="normal">t</mi><mi mathvariant="normal">i</mi><mi mathvariant="normal">e</mi><mi mathvariant="normal">s</mi></mrow><mo stretchy="false">[</mo><mrow><mi mathvariant="normal">s</mi><mi mathvariant="normal">t</mi><mi mathvariant="normal">a</mi><mi mathvariant="normal">r</mi><mi mathvariant="normal">t</mi><mi mathvariant="normal">_</mi><mi mathvariant="normal">i</mi><mi mathvariant="normal">n</mi><mi mathvariant="normal">d</mi><mi mathvariant="normal">e</mi><mi mathvariant="normal">x</mi></mrow><mo stretchy="false">]</mo><mo>×</mo><mrow><mi mathvariant="normal">e</mi><mi mathvariant="normal">n</mi><mi mathvariant="normal">d</mi><mi mathvariant="normal">_</mi><mi mathvariant="normal">p</mi><mi mathvariant="normal">r</mi><mi mathvariant="normal">o</mi><mi mathvariant="normal">b</mi><mi mathvariant="normal">a</mi><mi mathvariant="normal">b</mi><mi mathvariant="normal">i</mi><mi mathvariant="normal">l</mi><mi mathvariant="normal">i</mi><mi mathvariant="normal">t</mi><mi mathvariant="normal">i</mi><mi mathvariant="normal">e</mi><mi mathvariant="normal">s</mi></mrow><mo stretchy="false">[</mo><mrow><mi mathvariant="normal">e</mi><mi mathvariant="normal">n</mi><mi mathvariant="normal">d</mi><mi mathvariant="normal">_</mi><mi mathvariant="normal">i</mi><mi mathvariant="normal">n</mi><mi mathvariant="normal">d</mi><mi mathvariant="normal">e</mi><mi mathvariant="normal">x</mi></mrow><mo stretchy="false">]</mo></mrow><annotation encoding="application/x-tex">\\mathrm{start\\_probabilities}[\\mathrm{start\\_index}] \\times \\mathrm{end\\_probabilities}[\\mathrm{end\\_index}]</annotation></semantics></math></span><span class="katex-html" aria-hidden="true"><span class="base"><span class="strut" style="height:1.06em;vertical-align:-0.31em;"></span><span class="mord"><span class="mord mathrm">start_probabilities</span></span><span class="mopen">[</span><span class="mord"><span class="mord mathrm">start_index</span></span><span class="mclose">]</span><span class="mspace" style="margin-right:0.2222em;"></span><span class="mbin">×</span><span class="mspace" style="margin-right:0.2222em;"></span></span><span class="base"><span class="strut" style="height:1.06em;vertical-align:-0.31em;"></span><span class="mord"><span class="mord mathrm">end_probabilities</span></span><span class="mopen">[</span><span class="mord"><span class="mord mathrm">end_index</span></span><span class="mclose">]</span></span></span></span>',jl,Sn,hs="start_index <= end_index",Re,gl,It,Ms="Đầu tiên, hãy tính toán tất cả các đầu ra có thể có:",kl,vt,Il,Q,E,An,_t,Js="Bây giờ chúng ta chỉ cần lấy chỉ mục tối đa. Vì PyTorch sẽ trả về chỉ mục trong tensor phẳng, chúng ta cần sử dụng phép chia làm tròn xuống <code>//</code> và lấy dư <code>%</code> để nhận được <code>start_index</code> và <code>end_index</code>:",vl,Bt,_l,Ct,us="Chúng ta chưa xong đâu, nhưng ít nhất chúng ta đã có điểm chính xác cho câu trả lời (bạn có thể kiểm tra điều này bằng cách so sánh nó với kết quả đầu tiên trong phần trước):",Bl,$t,Cl,lt,$l,Zt,ys="Ta có <code>start_index</code> và <code>end_index</code> của câu trả lời theo token nên ta chỉ cần chuyển đổi các chỉ mục kí tự trong ngữ cảnh. Đấy là nơi offset sẽ cực kì hữu ích. Ta có thể lấy và sử dụng chúng như cách ta làm trong tác vụ phân loại token:",Zl,xt,xl,Gt,ds="Bây giờ chúng ta chỉ cần định dạng mọi thứ để có được kết quả:",Gl,Vt,Vl,Nt,Nl,Rt,bs="Tuyệt quá! Kết quả đó giống như trong ví dụ đầu tiên của chúng ta!",Rl,et,Wl,Wt,Xl,Xt,Ts="Nếu chúng ta cố gắng tokenize các câu hỏi và ngữ cảnh dài ta từng lấy làm ví dụ trước đó, ta sẽ nhận được số token nhiều hơn độ dài tối da sử dụng trong pipeline <code>question-answering</code> (đó là 384):",zl,zt,Ql,Qt,El,Et,ws="Vì vậy, chúng ta sẽ cần phải cắt bớt đầu vào của mình ở độ dài tối đa đó. Có một số cách ta có thể làm điều này, nhưng chúng ta không muốn cắt ngắn câu hỏi, chỉ cắt bỏ ngữ cảnh. Vì ngữ cảnh là câu thứ hai, chúng ta sẽ sử dụng chiến lược cắt ngắn <code>&quot;only_second&quot;</code>. Vấn đề nảy sinh sau đó là câu trả lời cho câu hỏi có thể không nằm trong ngữ cảnh đã bị cắt ngắn. Ví dụ: ở đây, chúng ta đã chọn một câu hỏi trong đó câu trả lời nằm ở cuối ngữ cảnh và khi cắt ngắn câu trả lời đó thì câu trả lời không còn:",Hl,Ht,Fl,Ft,Yl,Yt,Us="Điều này có nghĩa là mô hình sẽ gặp khó khăn trong việc chọn ra câu trả lời chính xác. Để khắc phục điều này, pipeline hỏi đáp cho phép chúng ta chia ngữ cảnh thành các phần nhỏ hơn, chỉ định độ dài tối đa. Để đảm bảo rằng chúng ta không chia bối cảnh chính xác ở vị trí sai để có thể tìm ra câu trả lời, nó cũng bao gồm một số phần trùng lặp giữa các phần.",Sl,St,fs="Chúng ta có thể yêu cầu tokenizer (nhanh hoặc chậm) thực hiện việc này bằng cách thêm <code>return_overflowing_tokens=True</code> và ta có thể chỉ định sự giao thoa mà ta muốn qua than số <code>stride</code>. Đây là một ví dụ, sử dụng một câu nhỏ hơn:",Al,At,ql,qt,Ll,Lt,js="Có thể thấy, câu đã bị chia thành các đoạn sao cho mỗi phần trong <code>inputs[&quot;input_ids&quot;]</code> có nhiều nhất 6 token (ta sẽ cần thêm đệm để đảm bảo chúng có cùng kích thước) và sẽ có sử giao thoa của 2 token giữa các phần.",Dl,Dt,gs="Hãy cùng nhìn kĩ hơn vào kết quả tokenize:",Pl,Pt,Kl,Kt,Ol,Ot,ks="Như dự đoán, ta nhận được ID đầu vào và attention mask.Ở đây, <code>overflow_to_sample_mapping</code> là một phép ánh xạ cho ta biết câu nào trong kết quả liên quan — ta có 7 kết quả dều từ câu mà ta truyền vào tokenizer:",te,tn,ne,nn,le,ln,Is="Điều này hữu ích hơn khi ta tokenize nhiều câu cùng nhau, Ví dụ:",ee,en,se,sn,vs="trả cho ta:",ae,an,ie,cn,_s="nghĩa là câu đầu tiên được chia thành 7 đoạn như phần phía trước, và 4 đoạn tiếp theo đến từ câu thứ hai.",ce,rn,Bs="Bây giờ chúng ta hãy cùng quay trở lại ngữ cảnh dài. Theo mặc định, pipeline `<code>question-answering</code> sử dụng độ dài tối đa là 384, như đã đề cập trước đó và khoảng cách 128, tương ứng với cách mô hình được tinh chỉnh (bạn có thể điều chỉnh các tham số đó bằng cách truyền <code>max_seq_len</code> và <code>stride</code> khi gọi pipeline). Do đó, chúng ta sẽ sử dụng các tham số đó khi tokenize. Chúng ta cũng sẽ thêm phần đệm (để có các mẫu có cùng chiều dài, vì vậy chúng ta có thể tạo ra các tensor) cũng như yêu cầu các offset:",re,mn,me,on,Cs="Các <code>inputs</code> sẽ chứa các ID đầu vào và các attention mask mà mô hình kì vọng, cũng như offset và <code>overflow_to_sample_mapping</code> ta vừa trao đổi ở trên. Vì hai tham số đó không phải là tham số được sử dụng bởi mô hình, chúng ta sẽ đưa chúng ra khỏi <code>inputs</code> (và không lưu trữ ánh xạ, vì nó không hữu ích ở đây) trước khi chuyển đổi nó thành tensor:",oe,H,F,qn,pn,$s="Bối cảnh dài của chúng ta được chia làm hai, đồng nghĩa sau khi nó đi qua mô hình, chúng ta sẽ có hai bộ logit bắt đầu và kết thúc:",pe,hn,he,Y,S,Ln,Mn,Zs="Giống như trước đây, đầu tiên chúng ta che các token không phải là một phần của ngữ cảnh trước khi sử dụng softmax. Chúng ta cũng che tất cả các token đệm (được gắn mác bởi attention mask):",Me,A,q,Dn,Jn,xs="Sau đó, chúng ta có thể sử dụng softmax để chuyển đổi các logit của chúng ta thành xác suất:",Je,L,D,Pn,un,Gs="Bước tiếp theo tương tự như những gì chúng ta đã làm cho bối cảnh nhỏ, nhưng chúng ta lặp lại nó cho mỗi phần trong hai phần của mình. Chúng ta tính điểm cho tất cả các khoảng câu trả lời có thể có, sau đó lấy phần có điểm tốt nhất:",ue,P,K,Kn,yn,ye,dn,Vs="Hai ứng cử viên đó tương ứng với các câu trả lời tốt nhất mà mô hình có thể tìm thấy trong mỗi đoạn. Mô hình chắc chắn hơn rằng câu trả lời đúng nằm ở phần thứ hai (đó là một dấu hiệu tốt!). Bây giờ chúng ta chỉ cần ánh xạ khoảng hai token đó với khoảng các ký tự trong ngữ cảnh (chúng ta chỉ cần lập ánh xạ cái thứ hai để có câu trả lời, nhưng thật thú vị khi xem mô hình đã chọn những gì trong đoạn đầu tiên).",de,st,be,bn,Ns="<code>offsets</code> mà chúng ta đã nắm được trước đó thực sự là một danh sách các offset, với một danh sách trên mỗi đoạn văn bản:",Te,Tn,we,wn,Ue,Un,Rs="Nếu chúng ta bỏ qua kết quả đầu tiên, chúng ta sẽ nhận được kết quả tương tự như pipeline cho ngữ cảnh dài này - yayy!",fe,at,je,fn,Ws="Điều này kết thúc phần đi sâu vào các khả năng của tokenizer. Chúng ta sẽ đưa tất cả những điều này vào thực tế một lần nữa trong chương tiếp theo, khi chúng tôi hướng dẫn bạn cách tinh chỉnh một mô hình về một loạt các tác vụ NLP phổ biến.",ge,jn,ke,On,Ie;d=new ga({props:{fw:y[0]}}),j=new Be({props:{title:"Fast tokenizers in the QA pipeline",local:"fast-tokenizers-in-the-qa-pipeline",headingTag:"h1"}});const Xs=[va,Ia],gn=[];function zs(t,e){return t[0]==="pt"?0:1}B=zs(y),C=gn[B]=Xs[B](y);const Qs=[Ba,_a],kn=[];function Es(t,e){return t[0]==="pt"?0:1}$=Es(y),Z=kn[$]=Qs[$](y),mt=new Be({props:{title:"Sử dụng pipeline question-answering",local:"sử-dụng-pipeline-question-answering",headingTag:"h2"}}),pt=new w({props:{code:"ZnJvbSUyMHRyYW5zZm9ybWVycyUyMGltcG9ydCUyMHBpcGVsaW5lJTBBJTBBcXVlc3Rpb25fYW5zd2VyZXIlMjAlM0QlMjBwaXBlbGluZSglMjJxdWVzdGlvbi1hbnN3ZXJpbmclMjIpJTBBY29udGV4dCUyMCUzRCUyMCUyMiUyMiUyMiUwQSVGMCU5RiVBNCU5NyUyMFRyYW5zZm9ybWVycyUyMGlzJTIwYmFja2VkJTIwYnklMjB0aGUlMjB0aHJlZSUyMG1vc3QlMjBwb3B1bGFyJTIwZGVlcCUyMGxlYXJuaW5nJTIwbGlicmFyaWVzJTIwJUUyJTgwJTk0JTIwSmF4JTJDJTIwUHlUb3JjaCUyQyUyMGFuZCUyMFRlbnNvckZsb3clMjAlRTIlODAlOTQlMjB3aXRoJTIwYSUyMHNlYW1sZXNzJTIwaW50ZWdyYXRpb24lMEFiZXR3ZWVuJTIwdGhlbS4lMjBJdCdzJTIwc3RyYWlnaHRmb3J3YXJkJTIwdG8lMjB0cmFpbiUyMHlvdXIlMjBtb2RlbHMlMjB3aXRoJTIwb25lJTIwYmVmb3JlJTIwbG9hZGluZyUyMHRoZW0lMjBmb3IlMjBpbmZlcmVuY2UlMjB3aXRoJTIwdGhlJTIwb3RoZXIuJTBBJTIyJTIyJTIyJTBBcXVlc3Rpb24lMjAlM0QlMjAlMjJXaGljaCUyMGRlZXAlMjBsZWFybmluZyUyMGxpYnJhcmllcyUyMGJhY2slMjAlRjAlOUYlQTQlOTclMjBUcmFuc2Zvcm1lcnMlM0YlMjIlMEFxdWVzdGlvbl9hbnN3ZXJlcihxdWVzdGlvbiUzRHF1ZXN0aW9uJTJDJTIwY29udGV4dCUzRGNvbnRleHQp",highlighted:`<span class="hljs-keyword">from</span> transformers <span class="hljs-keyword">import</span> pipeline
question_answerer = pipeline(<span class="hljs-string">&quot;question-answering&quot;</span>)
context = <span class="hljs-string">&quot;&quot;&quot;
🤗 Transformers is backed by the three most popular deep learning libraries — Jax, PyTorch, and TensorFlow — with a seamless integration
between them. It&#x27;s straightforward to train your models with one before loading them for inference with the other.
&quot;&quot;&quot;</span>
question = <span class="hljs-string">&quot;Which deep learning libraries back 🤗 Transformers?&quot;</span>
question_answerer(question=question, context=context)`,wrap:!1}}),ht=new w({props:{code:"JTdCJ3Njb3JlJyUzQSUyMDAuOTc3NzMlMkMlMEElMjAnc3RhcnQnJTNBJTIwNzglMkMlMEElMjAnZW5kJyUzQSUyMDEwNSUyQyUwQSUyMCdhbnN3ZXInJTNBJTIwJ0pheCUyQyUyMFB5VG9yY2glMjBhbmQlMjBUZW5zb3JGbG93JyU3RA==",highlighted:`{<span class="hljs-string">&#x27;score&#x27;</span>: <span class="hljs-number">0.97773</span>,
<span class="hljs-string">&#x27;start&#x27;</span>: <span class="hljs-number">78</span>,
<span class="hljs-string">&#x27;end&#x27;</span>: <span class="hljs-number">105</span>,
<span class="hljs-string">&#x27;answer&#x27;</span>: <span class="hljs-string">&#x27;Jax, PyTorch and TensorFlow&#x27;</span>}`,wrap:!1}}),Jt=new w({props:{code:"bG9uZ19jb250ZXh0JTIwJTNEJTIwJTIyJTIyJTIyJTBBJUYwJTlGJUE0JTk3JTIwVHJhbnNmb3JtZXJzJTNBJTIwU3RhdGUlMjBvZiUyMHRoZSUyMEFydCUyME5MUCUwQSUwQSVGMCU5RiVBNCU5NyUyMFRyYW5zZm9ybWVycyUyMHByb3ZpZGVzJTIwdGhvdXNhbmRzJTIwb2YlMjBwcmV0cmFpbmVkJTIwbW9kZWxzJTIwdG8lMjBwZXJmb3JtJTIwdGFza3MlMjBvbiUyMHRleHRzJTIwc3VjaCUyMGFzJTIwY2xhc3NpZmljYXRpb24lMkMlMjBpbmZvcm1hdGlvbiUyMGV4dHJhY3Rpb24lMkMlMEFxdWVzdGlvbiUyMGFuc3dlcmluZyUyQyUyMHN1bW1hcml6YXRpb24lMkMlMjB0cmFuc2xhdGlvbiUyQyUyMHRleHQlMjBnZW5lcmF0aW9uJTIwYW5kJTIwbW9yZSUyMGluJTIwb3ZlciUyMDEwMCUyMGxhbmd1YWdlcy4lMEFJdHMlMjBhaW0lMjBpcyUyMHRvJTIwbWFrZSUyMGN1dHRpbmctZWRnZSUyME5MUCUyMGVhc2llciUyMHRvJTIwdXNlJTIwZm9yJTIwZXZlcnlvbmUuJTBBJTBBJUYwJTlGJUE0JTk3JTIwVHJhbnNmb3JtZXJzJTIwcHJvdmlkZXMlMjBBUElzJTIwdG8lMjBxdWlja2x5JTIwZG93bmxvYWQlMjBhbmQlMjB1c2UlMjB0aG9zZSUyMHByZXRyYWluZWQlMjBtb2RlbHMlMjBvbiUyMGElMjBnaXZlbiUyMHRleHQlMkMlMjBmaW5lLXR1bmUlMjB0aGVtJTIwb24lMjB5b3VyJTIwb3duJTIwZGF0YXNldHMlMjBhbmQlMEF0aGVuJTIwc2hhcmUlMjB0aGVtJTIwd2l0aCUyMHRoZSUyMGNvbW11bml0eSUyMG9uJTIwb3VyJTIwbW9kZWwlMjBodWIuJTIwQXQlMjB0aGUlMjBzYW1lJTIwdGltZSUyQyUyMGVhY2glMjBweXRob24lMjBtb2R1bGUlMjBkZWZpbmluZyUyMGFuJTIwYXJjaGl0ZWN0dXJlJTIwaXMlMjBmdWxseSUyMHN0YW5kYWxvbmUlMjBhbmQlMEFjYW4lMjBiZSUyMG1vZGlmaWVkJTIwdG8lMjBlbmFibGUlMjBxdWljayUyMHJlc2VhcmNoJTIwZXhwZXJpbWVudHMuJTBBJTBBV2h5JTIwc2hvdWxkJTIwSSUyMHVzZSUyMHRyYW5zZm9ybWVycyUzRiUwQSUwQTEuJTIwRWFzeS10by11c2UlMjBzdGF0ZS1vZi10aGUtYXJ0JTIwbW9kZWxzJTNBJTBBJTIwJTIwLSUyMEhpZ2glMjBwZXJmb3JtYW5jZSUyMG9uJTIwTkxVJTIwYW5kJTIwTkxHJTIwdGFza3MuJTBBJTIwJTIwLSUyMExvdyUyMGJhcnJpZXIlMjB0byUyMGVudHJ5JTIwZm9yJTIwZWR1Y2F0b3JzJTIwYW5kJTIwcHJhY3RpdGlvbmVycy4lMEElMjAlMjAtJTIwRmV3JTIwdXNlci1mYWNpbmclMjBhYnN0cmFjdGlvbnMlMjB3aXRoJTIwanVzdCUyMHRocmVlJTIwY2xhc3NlcyUyMHRvJTIwbGVhcm4uJTBBJTIwJTIwLSUyMEElMjB1bmlmaWVkJTIwQVBJJTIwZm9yJTIwdXNpbmclMjBhbGwlMjBvdXIlMjBwcmV0cmFpbmVkJTIwbW9kZWxzLiUwQSUyMCUyMC0lMjBMb3dlciUyMGNvbXB1dGUlMjBjb3N0cyUyQyUyMHNtYWxsZXIlMjBjYXJib24lMjBmb290cHJpbnQlM0ElMEElMEEyLiUyMFJlc2VhcmNoZXJzJTIwY2FuJTIwc2hhcmUlMjB0cmFpbmVkJTIwbW9kZWxzJTIwaW5zdGVhZCUyMG9mJTIwYWx3YXlzJTIwcmV0cmFpbmluZy4lMEElMjAlMjAtJTIwUHJhY3RpdGlvbmVycyUyMGNhbiUyMHJlZHVjZSUyMGNvbXB1dGUlMjB0aW1lJTIwYW5kJTIwcHJvZHVjdGlvbiUyMGNvc3RzLiUwQSUyMCUyMC0lMjBEb3plbnMlMjBvZiUyMGFyY2hpdGVjdHVyZXMlMjB3aXRoJTIwb3ZlciUyMDEwJTJDMDAwJTIwcHJldHJhaW5lZCUyMG1vZGVscyUyQyUyMHNvbWUlMjBpbiUyMG1vcmUlMjB0aGFuJTIwMTAwJTIwbGFuZ3VhZ2VzLiUwQSUwQTMuJTIwQ2hvb3NlJTIwdGhlJTIwcmlnaHQlMjBmcmFtZXdvcmslMjBmb3IlMjBldmVyeSUyMHBhcnQlMjBvZiUyMGElMjBtb2RlbCdzJTIwbGlmZXRpbWUlM0ElMEElMjAlMjAtJTIwVHJhaW4lMjBzdGF0ZS1vZi10aGUtYXJ0JTIwbW9kZWxzJTIwaW4lMjAzJTIwbGluZXMlMjBvZiUyMGNvZGUuJTBBJTIwJTIwLSUyME1vdmUlMjBhJTIwc2luZ2xlJTIwbW9kZWwlMjBiZXR3ZWVuJTIwVEYyLjAlMkZQeVRvcmNoJTIwZnJhbWV3b3JrcyUyMGF0JTIwd2lsbC4lMEElMjAlMjAtJTIwU2VhbWxlc3NseSUyMHBpY2slMjB0aGUlMjByaWdodCUyMGZyYW1ld29yayUyMGZvciUyMHRyYWluaW5nJTJDJTIwZXZhbHVhdGlvbiUyMGFuZCUyMHByb2R1Y3Rpb24uJTBBJTBBNC4lMjBFYXNpbHklMjBjdXN0b21pemUlMjBhJTIwbW9kZWwlMjBvciUyMGFuJTIwZXhhbXBsZSUyMHRvJTIweW91ciUyMG5lZWRzJTNBJTBBJTIwJTIwLSUyMFdlJTIwcHJvdmlkZSUyMGV4YW1wbGVzJTIwZm9yJTIwZWFjaCUyMGFyY2hpdGVjdHVyZSUyMHRvJTIwcmVwcm9kdWNlJTIwdGhlJTIwcmVzdWx0cyUyMHB1Ymxpc2hlZCUyMGJ5JTIwaXRzJTIwb3JpZ2luYWwlMjBhdXRob3JzLiUwQSUyMCUyMC0lMjBNb2RlbCUyMGludGVybmFscyUyMGFyZSUyMGV4cG9zZWQlMjBhcyUyMGNvbnNpc3RlbnRseSUyMGFzJTIwcG9zc2libGUuJTBBJTIwJTIwLSUyME1vZGVsJTIwZmlsZXMlMjBjYW4lMjBiZSUyMHVzZWQlMjBpbmRlcGVuZGVudGx5JTIwb2YlMjB0aGUlMjBsaWJyYXJ5JTIwZm9yJTIwcXVpY2slMjBleHBlcmltZW50cy4lMEElMEElRjAlOUYlQTQlOTclMjBUcmFuc2Zvcm1lcnMlMjBpcyUyMGJhY2tlZCUyMGJ5JTIwdGhlJTIwdGhyZWUlMjBtb3N0JTIwcG9wdWxhciUyMGRlZXAlMjBsZWFybmluZyUyMGxpYnJhcmllcyUyMCVFMiU4MCU5NCUyMEpheCUyQyUyMFB5VG9yY2glMjBhbmQlMjBUZW5zb3JGbG93JTIwJUUyJTgwJTk0JTIwd2l0aCUyMGElMjBzZWFtbGVzcyUyMGludGVncmF0aW9uJTBBYmV0d2VlbiUyMHRoZW0uJTIwSXQncyUyMHN0cmFpZ2h0Zm9yd2FyZCUyMHRvJTIwdHJhaW4lMjB5b3VyJTIwbW9kZWxzJTIwd2l0aCUyMG9uZSUyMGJlZm9yZSUyMGxvYWRpbmclMjB0aGVtJTIwZm9yJTIwaW5mZXJlbmNlJTIwd2l0aCUyMHRoZSUyMG90aGVyLiUwQSUyMiUyMiUyMiUwQXF1ZXN0aW9uX2Fuc3dlcmVyKHF1ZXN0aW9uJTNEcXVlc3Rpb24lMkMlMjBjb250ZXh0JTNEbG9uZ19jb250ZXh0KQ==",highlighted:`long_context = <span class="hljs-string">&quot;&quot;&quot;
🤗 Transformers: State of the Art NLP
🤗 Transformers provides thousands of pretrained models to perform tasks on texts such as classification, information extraction,
question answering, summarization, translation, text generation and more in over 100 languages.
Its aim is to make cutting-edge NLP easier to use for everyone.
🤗 Transformers provides APIs to quickly download and use those pretrained models on a given text, fine-tune them on your own datasets and
then share them with the community on our model hub. At the same time, each python module defining an architecture is fully standalone and
can be modified to enable quick research experiments.
Why should I use transformers?
1. Easy-to-use state-of-the-art models:
- High performance on NLU and NLG tasks.
- Low barrier to entry for educators and practitioners.
- Few user-facing abstractions with just three classes to learn.
- A unified API for using all our pretrained models.
- Lower compute costs, smaller carbon footprint:
2. Researchers can share trained models instead of always retraining.
- Practitioners can reduce compute time and production costs.
- Dozens of architectures with over 10,000 pretrained models, some in more than 100 languages.
3. Choose the right framework for every part of a model&#x27;s lifetime:
- Train state-of-the-art models in 3 lines of code.
- Move a single model between TF2.0/PyTorch frameworks at will.
- Seamlessly pick the right framework for training, evaluation and production.
4. Easily customize a model or an example to your needs:
- We provide examples for each architecture to reproduce the results published by its original authors.
- Model internals are exposed as consistently as possible.
- Model files can be used independently of the library for quick experiments.
🤗 Transformers is backed by the three most popular deep learning libraries — Jax, PyTorch and TensorFlow — with a seamless integration
between them. It&#x27;s straightforward to train your models with one before loading them for inference with the other.
&quot;&quot;&quot;</span>
question_answerer(question=question, context=long_context)`,wrap:!1}}),ut=new w({props:{code:"JTdCJ3Njb3JlJyUzQSUyMDAuOTcxNDklMkMlMEElMjAnc3RhcnQnJTNBJTIwMTg5MiUyQyUwQSUyMCdlbmQnJTNBJTIwMTkxOSUyQyUwQSUyMCdhbnN3ZXInJTNBJTIwJ0pheCUyQyUyMFB5VG9yY2glMjBhbmQlMjBUZW5zb3JGbG93JyU3RA==",highlighted:`{<span class="hljs-string">&#x27;score&#x27;</span>: <span class="hljs-number">0.97149</span>,
<span class="hljs-string">&#x27;start&#x27;</span>: <span class="hljs-number">1892</span>,
<span class="hljs-string">&#x27;end&#x27;</span>: <span class="hljs-number">1919</span>,
<span class="hljs-string">&#x27;answer&#x27;</span>: <span class="hljs-string">&#x27;Jax, PyTorch and TensorFlow&#x27;</span>}`,wrap:!1}}),dt=new Be({props:{title:"Sử dụng mô hình cho tác vụ hỏi đáp",local:"sử-dụng-mô-hình-cho-tác-vụ-hỏi-đáp",headingTag:"h2"}});const Hs=[$a,Ca],In=[];function Fs(t,e){return t[0]==="pt"?0:1}x=Fs(y),G=In[x]=Hs[x](y),Ut=new w({props:{code:"c3RhcnRfbG9naXRzJTIwJTNEJTIwb3V0cHV0cy5zdGFydF9sb2dpdHMlMEFlbmRfbG9naXRzJTIwJTNEJTIwb3V0cHV0cy5lbmRfbG9naXRzJTBBcHJpbnQoc3RhcnRfbG9naXRzLnNoYXBlJTJDJTIwZW5kX2xvZ2l0cy5zaGFwZSk=",highlighted:`start_logits = outputs.start_logits
end_logits = outputs.end_logits
<span class="hljs-built_in">print</span>(start_logits.shape, end_logits.shape)`,wrap:!1}});const Ys=[xa,Za],vn=[];function Ss(t,e){return t[0]==="pt"?0:1}V=Ss(y),N=vn[V]=Ys[V](y);const As=[Va,Ga],_n=[];function qs(t,e){return t[0]==="pt"?0:1}R=qs(y),W=_n[R]=As[R](y);const Ls=[Ra,Na],Bn=[];function Ds(t,e){return t[0]==="pt"?0:1}X=Ds(y),z=Bn[X]=Ls[X](y),vt=new w({props:{code:"c2NvcmVzJTIwJTNEJTIwc3RhcnRfcHJvYmFiaWxpdGllcyU1QiUzQSUyQyUyME5vbmUlNUQlMjAqJTIwZW5kX3Byb2JhYmlsaXRpZXMlNUJOb25lJTJDJTIwJTNBJTVE",highlighted:'scores = start_probabilities[:, <span class="hljs-literal">None</span>] * end_probabilities[<span class="hljs-literal">None</span>, :]',wrap:!1}});const Ps=[Xa,Wa],Cn=[];function Ks(t,e){return t[0]==="pt"?0:1}Q=Ks(y),E=Cn[Q]=Ps[Q](y),Bt=new w({props:{code:"bWF4X2luZGV4JTIwJTNEJTIwc2NvcmVzLmFyZ21heCgpLml0ZW0oKSUwQXN0YXJ0X2luZGV4JTIwJTNEJTIwbWF4X2luZGV4JTIwJTJGJTJGJTIwc2NvcmVzLnNoYXBlJTVCMSU1RCUwQWVuZF9pbmRleCUyMCUzRCUyMG1heF9pbmRleCUyMCUyNSUyMHNjb3Jlcy5zaGFwZSU1QjElNUQlMEFwcmludChzY29yZXMlNUJzdGFydF9pbmRleCUyQyUyMGVuZF9pbmRleCU1RCk=",highlighted:`max_index = scores.argmax().item()
start_index = max_index // scores.shape[<span class="hljs-number">1</span>]
end_index = max_index % scores.shape[<span class="hljs-number">1</span>]
<span class="hljs-built_in">print</span>(scores[start_index, end_index])`,wrap:!1}}),$t=new w({props:{code:"MC45Nzc3Mw==",highlighted:'<span class="hljs-number">0.97773</span>',wrap:!1}}),lt=new _e({props:{$$slots:{default:[za]},$$scope:{ctx:y}}}),xt=new w({props:{code:"aW5wdXRzX3dpdGhfb2Zmc2V0cyUyMCUzRCUyMHRva2VuaXplcihxdWVzdGlvbiUyQyUyMGNvbnRleHQlMkMlMjByZXR1cm5fb2Zmc2V0c19tYXBwaW5nJTNEVHJ1ZSklMEFvZmZzZXRzJTIwJTNEJTIwaW5wdXRzX3dpdGhfb2Zmc2V0cyU1QiUyMm9mZnNldF9tYXBwaW5nJTIyJTVEJTBBJTBBc3RhcnRfY2hhciUyQyUyMF8lMjAlM0QlMjBvZmZzZXRzJTVCc3RhcnRfaW5kZXglNUQlMEFfJTJDJTIwZW5kX2NoYXIlMjAlM0QlMjBvZmZzZXRzJTVCZW5kX2luZGV4JTVEJTBBYW5zd2VyJTIwJTNEJTIwY29udGV4dCU1QnN0YXJ0X2NoYXIlM0FlbmRfY2hhciU1RA==",highlighted:`inputs_with_offsets = tokenizer(question, context, return_offsets_mapping=<span class="hljs-literal">True</span>)
offsets = inputs_with_offsets[<span class="hljs-string">&quot;offset_mapping&quot;</span>]
start_char, _ = offsets[start_index]
_, end_char = offsets[end_index]
answer = context[start_char:end_char]`,wrap:!1}}),Vt=new w({props:{code:"cmVzdWx0JTIwJTNEJTIwJTdCJTBBJTIwJTIwJTIwJTIwJTIyYW5zd2VyJTIyJTNBJTIwYW5zd2VyJTJDJTBBJTIwJTIwJTIwJTIwJTIyc3RhcnQlMjIlM0ElMjBzdGFydF9jaGFyJTJDJTBBJTIwJTIwJTIwJTIwJTIyZW5kJTIyJTNBJTIwZW5kX2NoYXIlMkMlMEElMjAlMjAlMjAlMjAlMjJzY29yZSUyMiUzQSUyMHNjb3JlcyU1QnN0YXJ0X2luZGV4JTJDJTIwZW5kX2luZGV4JTVEJTJDJTBBJTdEJTBBcHJpbnQocmVzdWx0KQ==",highlighted:`result = {
<span class="hljs-string">&quot;answer&quot;</span>: answer,
<span class="hljs-string">&quot;start&quot;</span>: start_char,
<span class="hljs-string">&quot;end&quot;</span>: end_char,
<span class="hljs-string">&quot;score&quot;</span>: scores[start_index, end_index],
}
<span class="hljs-built_in">print</span>(result)`,wrap:!1}}),Nt=new w({props:{code:"JTdCJ2Fuc3dlciclM0ElMjAnSmF4JTJDJTIwUHlUb3JjaCUyMGFuZCUyMFRlbnNvckZsb3cnJTJDJTBBJTIwJ3N0YXJ0JyUzQSUyMDc4JTJDJTBBJTIwJ2VuZCclM0ElMjAxMDUlMkMlMEElMjAnc2NvcmUnJTNBJTIwMC45Nzc3MyU3RA==",highlighted:`{<span class="hljs-string">&#x27;answer&#x27;</span>: <span class="hljs-string">&#x27;Jax, PyTorch and TensorFlow&#x27;</span>,
<span class="hljs-string">&#x27;start&#x27;</span>: <span class="hljs-number">78</span>,
<span class="hljs-string">&#x27;end&#x27;</span>: <span class="hljs-number">105</span>,
<span class="hljs-string">&#x27;score&#x27;</span>: <span class="hljs-number">0.97773</span>}`,wrap:!1}}),et=new _e({props:{$$slots:{default:[Qa]},$$scope:{ctx:y}}}),Wt=new Be({props:{title:"Xử lý các ngữ cảnh dài",local:"xử-lý-các-ngữ-cảnh-dài",headingTag:"h2"}}),zt=new w({props:{code:"aW5wdXRzJTIwJTNEJTIwdG9rZW5pemVyKHF1ZXN0aW9uJTJDJTIwbG9uZ19jb250ZXh0KSUwQXByaW50KGxlbihpbnB1dHMlNUIlMjJpbnB1dF9pZHMlMjIlNUQpKQ==",highlighted:`inputs = tokenizer(question, long_context)
<span class="hljs-built_in">print</span>(<span class="hljs-built_in">len</span>(inputs[<span class="hljs-string">&quot;input_ids&quot;</span>]))`,wrap:!1}}),Qt=new w({props:{code:"NDYx",highlighted:'<span class="hljs-number">461</span>',wrap:!1}}),Ht=new w({props:{code:"aW5wdXRzJTIwJTNEJTIwdG9rZW5pemVyKHF1ZXN0aW9uJTJDJTIwbG9uZ19jb250ZXh0JTJDJTIwbWF4X2xlbmd0aCUzRDM4NCUyQyUyMHRydW5jYXRpb24lM0QlMjJvbmx5X3NlY29uZCUyMiklMEFwcmludCh0b2tlbml6ZXIuZGVjb2RlKGlucHV0cyU1QiUyMmlucHV0X2lkcyUyMiU1RCkp",highlighted:`inputs = tokenizer(question, long_context, max_length=<span class="hljs-number">384</span>, truncation=<span class="hljs-string">&quot;only_second&quot;</span>)
<span class="hljs-built_in">print</span>(tokenizer.decode(inputs[<span class="hljs-string">&quot;input_ids&quot;</span>]))`,wrap:!1}}),Ft=new w({props:{code:"JTIyJTIyJTIyJTBBJTVCQ0xTJTVEJTIwV2hpY2glMjBkZWVwJTIwbGVhcm5pbmclMjBsaWJyYXJpZXMlMjBiYWNrJTIwJTVCVU5LJTVEJTIwVHJhbnNmb3JtZXJzJTNGJTIwJTVCU0VQJTVEJTIwJTVCVU5LJTVEJTIwVHJhbnNmb3JtZXJzJTIwJTNBJTIwU3RhdGUlMjBvZiUyMHRoZSUyMEFydCUyME5MUCUwQSUwQSU1QlVOSyU1RCUyMFRyYW5zZm9ybWVycyUyMHByb3ZpZGVzJTIwdGhvdXNhbmRzJTIwb2YlMjBwcmV0cmFpbmVkJTIwbW9kZWxzJTIwdG8lMjBwZXJmb3JtJTIwdGFza3MlMjBvbiUyMHRleHRzJTIwc3VjaCUyMGFzJTIwY2xhc3NpZmljYXRpb24lMkMlMjBpbmZvcm1hdGlvbiUyMGV4dHJhY3Rpb24lMkMlMEFxdWVzdGlvbiUyMGFuc3dlcmluZyUyQyUyMHN1bW1hcml6YXRpb24lMkMlMjB0cmFuc2xhdGlvbiUyQyUyMHRleHQlMjBnZW5lcmF0aW9uJTIwYW5kJTIwbW9yZSUyMGluJTIwb3ZlciUyMDEwMCUyMGxhbmd1YWdlcy4lMEFJdHMlMjBhaW0lMjBpcyUyMHRvJTIwbWFrZSUyMGN1dHRpbmctZWRnZSUyME5MUCUyMGVhc2llciUyMHRvJTIwdXNlJTIwZm9yJTIwZXZlcnlvbmUuJTBBJTBBJTVCVU5LJTVEJTIwVHJhbnNmb3JtZXJzJTIwcHJvdmlkZXMlMjBBUElzJTIwdG8lMjBxdWlja2x5JTIwZG93bmxvYWQlMjBhbmQlMjB1c2UlMjB0aG9zZSUyMHByZXRyYWluZWQlMjBtb2RlbHMlMjBvbiUyMGElMjBnaXZlbiUyMHRleHQlMkMlMjBmaW5lLXR1bmUlMjB0aGVtJTIwb24lMjB5b3VyJTIwb3duJTIwZGF0YXNldHMlMjBhbmQlMEF0aGVuJTIwc2hhcmUlMjB0aGVtJTIwd2l0aCUyMHRoZSUyMGNvbW11bml0eSUyMG9uJTIwb3VyJTIwbW9kZWwlMjBodWIuJTIwQXQlMjB0aGUlMjBzYW1lJTIwdGltZSUyQyUyMGVhY2glMjBweXRob24lMjBtb2R1bGUlMjBkZWZpbmluZyUyMGFuJTIwYXJjaGl0ZWN0dXJlJTIwaXMlMjBmdWxseSUyMHN0YW5kYWxvbmUlMjBhbmQlMEFjYW4lMjBiZSUyMG1vZGlmaWVkJTIwdG8lMjBlbmFibGUlMjBxdWljayUyMHJlc2VhcmNoJTIwZXhwZXJpbWVudHMuJTBBJTBBV2h5JTIwc2hvdWxkJTIwSSUyMHVzZSUyMHRyYW5zZm9ybWVycyUzRiUwQSUwQTEuJTIwRWFzeS10by11c2UlMjBzdGF0ZS1vZi10aGUtYXJ0JTIwbW9kZWxzJTNBJTBBJTIwJTIwLSUyMEhpZ2glMjBwZXJmb3JtYW5jZSUyMG9uJTIwTkxVJTIwYW5kJTIwTkxHJTIwdGFza3MuJTBBJTIwJTIwLSUyMExvdyUyMGJhcnJpZXIlMjB0byUyMGVudHJ5JTIwZm9yJTIwZWR1Y2F0b3JzJTIwYW5kJTIwcHJhY3RpdGlvbmVycy4lMEElMjAlMjAtJTIwRmV3JTIwdXNlci1mYWNpbmclMjBhYnN0cmFjdGlvbnMlMjB3aXRoJTIwanVzdCUyMHRocmVlJTIwY2xhc3NlcyUyMHRvJTIwbGVhcm4uJTBBJTIwJTIwLSUyMEElMjB1bmlmaWVkJTIwQVBJJTIwZm9yJTIwdXNpbmclMjBhbGwlMjBvdXIlMjBwcmV0cmFpbmVkJTIwbW9kZWxzLiUwQSUyMCUyMC0lMjBMb3dlciUyMGNvbXB1dGUlMjBjb3N0cyUyQyUyMHNtYWxsZXIlMjBjYXJib24lMjBmb290cHJpbnQlM0ElMEElMEEyLiUyMFJlc2VhcmNoZXJzJTIwY2FuJTIwc2hhcmUlMjB0cmFpbmVkJTIwbW9kZWxzJTIwaW5zdGVhZCUyMG9mJTIwYWx3YXlzJTIwcmV0cmFpbmluZy4lMEElMjAlMjAtJTIwUHJhY3RpdGlvbmVycyUyMGNhbiUyMHJlZHVjZSUyMGNvbXB1dGUlMjB0aW1lJTIwYW5kJTIwcHJvZHVjdGlvbiUyMGNvc3RzLiUwQSUyMCUyMC0lMjBEb3plbnMlMjBvZiUyMGFyY2hpdGVjdHVyZXMlMjB3aXRoJTIwb3ZlciUyMDEwJTJDMDAwJTIwcHJldHJhaW5lZCUyMG1vZGVscyUyQyUyMHNvbWUlMjBpbiUyMG1vcmUlMjB0aGFuJTIwMTAwJTIwbGFuZ3VhZ2VzLiUwQSUwQTMuJTIwQ2hvb3NlJTIwdGhlJTIwcmlnaHQlMjBmcmFtZXdvcmslMjBmb3IlMjBldmVyeSUyMHBhcnQlMjBvZiUyMGElMjBtb2RlbCdzJTIwbGlmZXRpbWUlM0ElMEElMjAlMjAtJTIwVHJhaW4lMjBzdGF0ZS1vZi10aGUtYXJ0JTIwbW9kZWxzJTIwaW4lMjAzJTIwbGluZXMlMjBvZiUyMGNvZGUuJTBBJTIwJTIwLSUyME1vdmUlMjBhJTIwc2luZ2xlJTIwbW9kZWwlMjBiZXR3ZWVuJTIwVEYyLjAlMkZQeVRvcmNoJTIwZnJhbWV3b3JrcyUyMGF0JTIwd2lsbC4lMEElMjAlMjAtJTIwU2VhbWxlc3NseSUyMHBpY2slMjB0aGUlMjByaWdodCUyMGZyYW1ld29yayUyMGZvciUyMHRyYWluaW5nJTJDJTIwZXZhbHVhdGlvbiUyMGFuZCUyMHByb2R1Y3Rpb24uJTBBJTBBNC4lMjBFYXNpbHklMjBjdXN0b21pemUlMjBhJTIwbW9kZWwlMjBvciUyMGFuJTIwZXhhbXBsZSUyMHRvJTIweW91ciUyMG5lZWRzJTNBJTBBJTIwJTIwLSUyMFdlJTIwcHJvdmlkZSUyMGV4YW1wbGVzJTIwZm9yJTIwZWFjaCUyMGFyY2hpdGVjdHVyZSUyMHRvJTIwcmVwcm9kdWNlJTIwdGhlJTIwcmVzdWx0cyUyMHB1Ymxpc2hlZCUyMGJ5JTIwaXRzJTIwb3JpZ2luYWwlMjBhdXRob3JzLiUwQSUyMCUyMC0lMjBNb2RlbCUyMGludGVybmFsJTIwJTVCU0VQJTVEJTBBJTIyJTIyJTIy",highlighted:`<span class="hljs-string">&quot;&quot;&quot;
[CLS] Which deep learning libraries back [UNK] Transformers? [SEP] [UNK] Transformers : State of the Art NLP
[UNK] Transformers provides thousands of pretrained models to perform tasks on texts such as classification, information extraction,
question answering, summarization, translation, text generation and more in over 100 languages.
Its aim is to make cutting-edge NLP easier to use for everyone.
[UNK] Transformers provides APIs to quickly download and use those pretrained models on a given text, fine-tune them on your own datasets and
then share them with the community on our model hub. At the same time, each python module defining an architecture is fully standalone and
can be modified to enable quick research experiments.
Why should I use transformers?
1. Easy-to-use state-of-the-art models:
- High performance on NLU and NLG tasks.
- Low barrier to entry for educators and practitioners.
- Few user-facing abstractions with just three classes to learn.
- A unified API for using all our pretrained models.
- Lower compute costs, smaller carbon footprint:
2. Researchers can share trained models instead of always retraining.
- Practitioners can reduce compute time and production costs.
- Dozens of architectures with over 10,000 pretrained models, some in more than 100 languages.
3. Choose the right framework for every part of a model&#x27;s lifetime:
- Train state-of-the-art models in 3 lines of code.
- Move a single model between TF2.0/PyTorch frameworks at will.
- Seamlessly pick the right framework for training, evaluation and production.
4. Easily customize a model or an example to your needs:
- We provide examples for each architecture to reproduce the results published by its original authors.
- Model internal [SEP]
&quot;&quot;&quot;</span>`,wrap:!1}}),At=new w({props:{code:"c2VudGVuY2UlMjAlM0QlMjAlMjJUaGlzJTIwc2VudGVuY2UlMjBpcyUyMG5vdCUyMHRvbyUyMGxvbmclMjBidXQlMjB3ZSUyMGFyZSUyMGdvaW5nJTIwdG8lMjBzcGxpdCUyMGl0JTIwYW55d2F5LiUyMiUwQWlucHV0cyUyMCUzRCUyMHRva2VuaXplciglMEElMjAlMjAlMjAlMjBzZW50ZW5jZSUyQyUyMHRydW5jYXRpb24lM0RUcnVlJTJDJTIwcmV0dXJuX292ZXJmbG93aW5nX3Rva2VucyUzRFRydWUlMkMlMjBtYXhfbGVuZ3RoJTNENiUyQyUyMHN0cmlkZSUzRDIlMEEpJTBBJTBBZm9yJTIwaWRzJTIwaW4lMjBpbnB1dHMlNUIlMjJpbnB1dF9pZHMlMjIlNUQlM0ElMEElMjAlMjAlMjAlMjBwcmludCh0b2tlbml6ZXIuZGVjb2RlKGlkcykp",highlighted:`sentence = <span class="hljs-string">&quot;This sentence is not too long but we are going to split it anyway.&quot;</span>
inputs = tokenizer(
sentence, truncation=<span class="hljs-literal">True</span>, return_overflowing_tokens=<span class="hljs-literal">True</span>, max_length=<span class="hljs-number">6</span>, stride=<span class="hljs-number">2</span>
)
<span class="hljs-keyword">for</span> ids <span class="hljs-keyword">in</span> inputs[<span class="hljs-string">&quot;input_ids&quot;</span>]:
<span class="hljs-built_in">print</span>(tokenizer.decode(ids))`,wrap:!1}}),qt=new w({props:{code:"JyU1QkNMUyU1RCUyMFRoaXMlMjBzZW50ZW5jZSUyMGlzJTIwbm90JTIwJTVCU0VQJTVEJyUwQSclNUJDTFMlNUQlMjBpcyUyMG5vdCUyMHRvbyUyMGxvbmclMjAlNUJTRVAlNUQnJTBBJyU1QkNMUyU1RCUyMHRvbyUyMGxvbmclMjBidXQlMjB3ZSUyMCU1QlNFUCU1RCclMEEnJTVCQ0xTJTVEJTIwYnV0JTIwd2UlMjBhcmUlMjBnb2luZyUyMCU1QlNFUCU1RCclMEEnJTVCQ0xTJTVEJTIwYXJlJTIwZ29pbmclMjB0byUyMHNwbGl0JTIwJTVCU0VQJTVEJyUwQSclNUJDTFMlNUQlMjB0byUyMHNwbGl0JTIwaXQlMjBhbnl3YXklMjAlNUJTRVAlNUQnJTBBJyU1QkNMUyU1RCUyMGl0JTIwYW55d2F5LiUyMCU1QlNFUCU1RCc=",highlighted:`<span class="hljs-string">&#x27;[CLS] This sentence is not [SEP]&#x27;</span>
<span class="hljs-string">&#x27;[CLS] is not too long [SEP]&#x27;</span>
<span class="hljs-string">&#x27;[CLS] too long but we [SEP]&#x27;</span>
<span class="hljs-string">&#x27;[CLS] but we are going [SEP]&#x27;</span>
<span class="hljs-string">&#x27;[CLS] are going to split [SEP]&#x27;</span>
<span class="hljs-string">&#x27;[CLS] to split it anyway [SEP]&#x27;</span>
<span class="hljs-string">&#x27;[CLS] it anyway. [SEP]&#x27;</span>`,wrap:!1}}),Pt=new w({props:{code:"cHJpbnQoaW5wdXRzLmtleXMoKSk=",highlighted:'<span class="hljs-built_in">print</span>(inputs.keys())',wrap:!1}}),Kt=new w({props:{code:"ZGljdF9rZXlzKCU1QidpbnB1dF9pZHMnJTJDJTIwJ2F0dGVudGlvbl9tYXNrJyUyQyUyMCdvdmVyZmxvd190b19zYW1wbGVfbWFwcGluZyclNUQp",highlighted:'dict_keys([<span class="hljs-string">&#x27;input_ids&#x27;</span>, <span class="hljs-string">&#x27;attention_mask&#x27;</span>, <span class="hljs-string">&#x27;overflow_to_sample_mapping&#x27;</span>])',wrap:!1}}),tn=new w({props:{code:"cHJpbnQoaW5wdXRzJTVCJTIyb3ZlcmZsb3dfdG9fc2FtcGxlX21hcHBpbmclMjIlNUQp",highlighted:'<span class="hljs-built_in">print</span>(inputs[<span class="hljs-string">&quot;overflow_to_sample_mapping&quot;</span>])',wrap:!1}}),nn=new w({props:{code:"JTVCMCUyQyUyMDAlMkMlMjAwJTJDJTIwMCUyQyUyMDAlMkMlMjAwJTJDJTIwMCU1RA==",highlighted:'[<span class="hljs-number">0</span>, <span class="hljs-number">0</span>, <span class="hljs-number">0</span>, <span class="hljs-number">0</span>, <span class="hljs-number">0</span>, <span class="hljs-number">0</span>, <span class="hljs-number">0</span>]',wrap:!1}}),en=new w({props:{code:"c2VudGVuY2VzJTIwJTNEJTIwJTVCJTBBJTIwJTIwJTIwJTIwJTIyVGhpcyUyMHNlbnRlbmNlJTIwaXMlMjBub3QlMjB0b28lMjBsb25nJTIwYnV0JTIwd2UlMjBhcmUlMjBnb2luZyUyMHRvJTIwc3BsaXQlMjBpdCUyMGFueXdheS4lMjIlMkMlMEElMjAlMjAlMjAlMjAlMjJUaGlzJTIwc2VudGVuY2UlMjBpcyUyMHNob3J0ZXIlMjBidXQlMjB3aWxsJTIwc3RpbGwlMjBnZXQlMjBzcGxpdC4lMjIlMkMlMEElNUQlMEFpbnB1dHMlMjAlM0QlMjB0b2tlbml6ZXIoJTBBJTIwJTIwJTIwJTIwc2VudGVuY2VzJTJDJTIwdHJ1bmNhdGlvbiUzRFRydWUlMkMlMjByZXR1cm5fb3ZlcmZsb3dpbmdfdG9rZW5zJTNEVHJ1ZSUyQyUyMG1heF9sZW5ndGglM0Q2JTJDJTIwc3RyaWRlJTNEMiUwQSklMEElMEFwcmludChpbnB1dHMlNUIlMjJvdmVyZmxvd190b19zYW1wbGVfbWFwcGluZyUyMiU1RCk=",highlighted:`sentences = [
<span class="hljs-string">&quot;This sentence is not too long but we are going to split it anyway.&quot;</span>,
<span class="hljs-string">&quot;This sentence is shorter but will still get split.&quot;</span>,
]
inputs = tokenizer(
sentences, truncation=<span class="hljs-literal">True</span>, return_overflowing_tokens=<span class="hljs-literal">True</span>, max_length=<span class="hljs-number">6</span>, stride=<span class="hljs-number">2</span>
)
<span class="hljs-built_in">print</span>(inputs[<span class="hljs-string">&quot;overflow_to_sample_mapping&quot;</span>])`,wrap:!1}}),an=new w({props:{code:"JTVCMCUyQyUyMDAlMkMlMjAwJTJDJTIwMCUyQyUyMDAlMkMlMjAwJTJDJTIwMCUyQyUyMDElMkMlMjAxJTJDJTIwMSUyQyUyMDElNUQ=",highlighted:'[<span class="hljs-number">0</span>, <span class="hljs-number">0</span>, <span class="hljs-number">0</span>, <span class="hljs-number">0</span>, <span class="hljs-number">0</span>, <span class="hljs-number">0</span>, <span class="hljs-number">0</span>, <span class="hljs-number">1</span>, <span class="hljs-number">1</span>, <span class="hljs-number">1</span>, <span class="hljs-number">1</span>]',wrap:!1}}),mn=new w({props:{code:"aW5wdXRzJTIwJTNEJTIwdG9rZW5pemVyKCUwQSUyMCUyMCUyMCUyMHF1ZXN0aW9uJTJDJTBBJTIwJTIwJTIwJTIwbG9uZ19jb250ZXh0JTJDJTBBJTIwJTIwJTIwJTIwc3RyaWRlJTNEMTI4JTJDJTBBJTIwJTIwJTIwJTIwbWF4X2xlbmd0aCUzRDM4NCUyQyUwQSUyMCUyMCUyMCUyMHBhZGRpbmclM0QlMjJsb25nZXN0JTIyJTJDJTBBJTIwJTIwJTIwJTIwdHJ1bmNhdGlvbiUzRCUyMm9ubHlfc2Vjb25kJTIyJTJDJTBBJTIwJTIwJTIwJTIwcmV0dXJuX292ZXJmbG93aW5nX3Rva2VucyUzRFRydWUlMkMlMEElMjAlMjAlMjAlMjByZXR1cm5fb2Zmc2V0c19tYXBwaW5nJTNEVHJ1ZSUyQyUwQSk=",highlighted:`inputs = tokenizer(
question,
long_context,
stride=<span class="hljs-number">128</span>,
max_length=<span class="hljs-number">384</span>,
padding=<span class="hljs-string">&quot;longest&quot;</span>,
truncation=<span class="hljs-string">&quot;only_second&quot;</span>,
return_overflowing_tokens=<span class="hljs-literal">True</span>,
return_offsets_mapping=<span class="hljs-literal">True</span>,
)`,wrap:!1}});const Os=[Ha,Ea],$n=[];function ta(t,e){return t[0]==="pt"?0:1}H=ta(y),F=$n[H]=Os[H](y),hn=new w({props:{code:"b3V0cHV0cyUyMCUzRCUyMG1vZGVsKCoqaW5wdXRzKSUwQSUwQXN0YXJ0X2xvZ2l0cyUyMCUzRCUyMG91dHB1dHMuc3RhcnRfbG9naXRzJTBBZW5kX2xvZ2l0cyUyMCUzRCUyMG91dHB1dHMuZW5kX2xvZ2l0cyUwQXByaW50KHN0YXJ0X2xvZ2l0cy5zaGFwZSUyQyUyMGVuZF9sb2dpdHMuc2hhcGUp",highlighted:`outputs = model(**inputs)
start_logits = outputs.start_logits
end_logits = outputs.end_logits
<span class="hljs-built_in">print</span>(start_logits.shape, end_logits.shape)`,wrap:!1}});const na=[Ya,Fa],Zn=[];function la(t,e){return t[0]==="pt"?0:1}Y=la(y),S=Zn[Y]=na[Y](y);const ea=[Aa,Sa],xn=[];function sa(t,e){return t[0]==="pt"?0:1}A=sa(y),q=xn[A]=ea[A](y);const aa=[La,qa],Gn=[];function ia(t,e){return t[0]==="pt"?0:1}L=ia(y),D=Gn[L]=aa[L](y);const ca=[Pa,Da],Vn=[];function ra(t,e){return t[0]==="pt"?0:1}return P=ra(y),K=Vn[P]=ca[P](y),yn=new w({props:{code:"JTVCKDAlMkMlMjAxOCUyQyUyMDAuMzM4NjcpJTJDJTIwKDE3MyUyQyUyMDE4NCUyQyUyMDAuOTcxNDkpJTVE",highlighted:'[(<span class="hljs-number">0</span>, <span class="hljs-number">18</span>, <span class="hljs-number">0.33867</span>), (<span class="hljs-number">173</span>, <span class="hljs-number">184</span>, <span class="hljs-number">0.97149</span>)]',wrap:!1}}),st=new _e({props:{$$slots:{default:[Ka]},$$scope:{ctx:y}}}),Tn=new w({props:{code:"Zm9yJTIwY2FuZGlkYXRlJTJDJTIwb2Zmc2V0JTIwaW4lMjB6aXAoY2FuZGlkYXRlcyUyQyUyMG9mZnNldHMpJTNBJTBBJTIwJTIwJTIwJTIwc3RhcnRfdG9rZW4lMkMlMjBlbmRfdG9rZW4lMkMlMjBzY29yZSUyMCUzRCUyMGNhbmRpZGF0ZSUwQSUyMCUyMCUyMCUyMHN0YXJ0X2NoYXIlMkMlMjBfJTIwJTNEJTIwb2Zmc2V0JTVCc3RhcnRfdG9rZW4lNUQlMEElMjAlMjAlMjAlMjBfJTJDJTIwZW5kX2NoYXIlMjAlM0QlMjBvZmZzZXQlNUJlbmRfdG9rZW4lNUQlMEElMjAlMjAlMjAlMjBhbnN3ZXIlMjAlM0QlMjBsb25nX2NvbnRleHQlNUJzdGFydF9jaGFyJTNBZW5kX2NoYXIlNUQlMEElMjAlMjAlMjAlMjByZXN1bHQlMjAlM0QlMjAlN0IlMjJhbnN3ZXIlMjIlM0ElMjBhbnN3ZXIlMkMlMjAlMjJzdGFydCUyMiUzQSUyMHN0YXJ0X2NoYXIlMkMlMjAlMjJlbmQlMjIlM0ElMjBlbmRfY2hhciUyQyUyMCUyMnNjb3JlJTIyJTNBJTIwc2NvcmUlN0QlMEElMjAlMjAlMjAlMjBwcmludChyZXN1bHQp",highlighted:`<span class="hljs-keyword">for</span> candidate, offset <span class="hljs-keyword">in</span> <span class="hljs-built_in">zip</span>(candidates, offsets):
start_token, end_token, score = candidate
start_char, _ = offset[start_token]
_, end_char = offset[end_token]
answer = long_context[start_char:end_char]
result = {<span class="hljs-string">&quot;answer&quot;</span>: answer, <span class="hljs-string">&quot;start&quot;</span>: start_char, <span class="hljs-string">&quot;end&quot;</span>: end_char, <span class="hljs-string">&quot;score&quot;</span>: score}
<span class="hljs-built_in">print</span>(result)`,wrap:!1}}),wn=new w({props:{code:"JTdCJ2Fuc3dlciclM0ElMjAnJTVDbiVGMCU5RiVBNCU5NyUyMFRyYW5zZm9ybWVycyUzQSUyMFN0YXRlJTIwb2YlMjB0aGUlMjBBcnQlMjBOTFAnJTJDJTIwJ3N0YXJ0JyUzQSUyMDAlMkMlMjAnZW5kJyUzQSUyMDM3JTJDJTIwJ3Njb3JlJyUzQSUyMDAuMzM4NjclN0QlMEElN0InYW5zd2VyJyUzQSUyMCdKYXglMkMlMjBQeVRvcmNoJTIwYW5kJTIwVGVuc29yRmxvdyclMkMlMjAnc3RhcnQnJTNBJTIwMTg5MiUyQyUyMCdlbmQnJTNBJTIwMTkxOSUyQyUyMCdzY29yZSclM0ElMjAwLjk3MTQ5JTdE",highlighted:`{<span class="hljs-string">&#x27;answer&#x27;</span>: <span class="hljs-string">&#x27;\\n🤗 Transformers: State of the Art NLP&#x27;</span>, <span class="hljs-string">&#x27;start&#x27;</span>: <span class="hljs-number">0</span>, <span class="hljs-string">&#x27;end&#x27;</span>: <span class="hljs-number">37</span>, <span class="hljs-string">&#x27;score&#x27;</span>: <span class="hljs-number">0.33867</span>}
{<span class="hljs-string">&#x27;answer&#x27;</span>: <span class="hljs-string">&#x27;Jax, PyTorch and TensorFlow&#x27;</span>, <span class="hljs-string">&#x27;start&#x27;</span>: <span class="hljs-number">1892</span>, <span class="hljs-string">&#x27;end&#x27;</span>: <span class="hljs-number">1919</span>, <span class="hljs-string">&#x27;score&#x27;</span>: <span class="hljs-number">0.97149</span>}`,wrap:!1}}),at=new _e({props:{$$slots:{default:[Oa]},$$scope:{ctx:y}}}),jn=new ka({props:{source:"https://github.com/huggingface/course/blob/main/chapters/vi/chapter6/3b.mdx"}}),{c(){l=b("meta"),i=c(),n=b("p"),p=c(),h(d.$$.fragment),f=c(),h(j.$$.fragment),tl=c(),C.c(),Nn=c(),rt=b("p"),rt.innerHTML=De,nl=c(),Z.c(),Rn=c(),h(mt.$$.fragment),ll=c(),ot=b("p"),ot.innerHTML=Pe,el=c(),h(pt.$$.fragment),sl=c(),h(ht.$$.fragment),al=c(),Mt=b("p"),Mt.textContent=Ke,il=c(),h(Jt.$$.fragment),cl=c(),h(ut.$$.fragment),rl=c(),yt=b("p"),yt.textContent=Oe,ml=c(),h(dt.$$.fragment),ol=c(),bt=b("p"),bt.innerHTML=ts,pl=c(),G.c(),Wn=c(),Tt=b("p"),Tt.textContent=ns,hl=c(),nt=b("div"),nt.innerHTML=ls,Ml=c(),wt=b("p"),wt.textContent=es,Jl=c(),h(Ut.$$.fragment),ul=c(),N.c(),Xn=c(),ft=b("p"),ft.innerHTML=ss,yl=c(),jt=b("p"),jt.innerHTML=as,dl=c(),W.c(),zn=c(),gt=b("p"),gt.textContent=is,bl=c(),z.c(),Qn=c(),kt=b("p"),kt.innerHTML=cs,Tl=c(),g=b("p"),$e=it("Giả sử các sự kiện “Câu trả lời bắt đầu ở "),En=b("code"),En.textContent=rs,Ze=it("” và “Câu trả lời kết thúc ở "),Hn=b("code"),Hn.textContent=ms,xe=it("” là độc lập, xác suất để câu trả lời bắt đầu tại "),Fn=b("code"),Fn.textContent=os,Ge=it(" và kết thúc tại "),Yn=b("code"),Yn.textContent=ps,Ve=it(` là:
`),wl=new Ma(!1),Ul=c(),O=b("p"),Ne=it("Vì vậy, để tính tất cả các điểm, chúng ta chỉ cần tính tích"),fl=new Ma(!1),jl=it(" với "),Sn=b("code"),Sn.textContent=hs,Re=it("."),gl=c(),It=b("p"),It.textContent=Ms,kl=c(),h(vt.$$.fragment),Il=c(),E.c(),An=c(),_t=b("p"),_t.innerHTML=Js,vl=c(),h(Bt.$$.fragment),_l=c(),Ct=b("p"),Ct.textContent=us,Bl=c(),h($t.$$.fragment),Cl=c(),h(lt.$$.fragment),$l=c(),Zt=b("p"),Zt.innerHTML=ys,Zl=c(),h(xt.$$.fragment),xl=c(),Gt=b("p"),Gt.textContent=ds,Gl=c(),h(Vt.$$.fragment),Vl=c(),h(Nt.$$.fragment),Nl=c(),Rt=b("p"),Rt.textContent=bs,Rl=c(),h(et.$$.fragment),Wl=c(),h(Wt.$$.fragment),Xl=c(),Xt=b("p"),Xt.innerHTML=Ts,zl=c(),h(zt.$$.fragment),Ql=c(),h(Qt.$$.fragment),El=c(),Et=b("p"),Et.innerHTML=ws,Hl=c(),h(Ht.$$.fragment),Fl=c(),h(Ft.$$.fragment),Yl=c(),Yt=b("p"),Yt.textContent=Us,Sl=c(),St=b("p"),St.innerHTML=fs,Al=c(),h(At.$$.fragment),ql=c(),h(qt.$$.fragment),Ll=c(),Lt=b("p"),Lt.innerHTML=js,Dl=c(),Dt=b("p"),Dt.textContent=gs,Pl=c(),h(Pt.$$.fragment),Kl=c(),h(Kt.$$.fragment),Ol=c(),Ot=b("p"),Ot.innerHTML=ks,te=c(),h(tn.$$.fragment),ne=c(),h(nn.$$.fragment),le=c(),ln=b("p"),ln.textContent=Is,ee=c(),h(en.$$.fragment),se=c(),sn=b("p"),sn.textContent=vs,ae=c(),h(an.$$.fragment),ie=c(),cn=b("p"),cn.textContent=_s,ce=c(),rn=b("p"),rn.innerHTML=Bs,re=c(),h(mn.$$.fragment),me=c(),on=b("p"),on.innerHTML=Cs,oe=c(),F.c(),qn=c(),pn=b("p"),pn.textContent=$s,pe=c(),h(hn.$$.fragment),he=c(),S.c(),Ln=c(),Mn=b("p"),Mn.textContent=Zs,Me=c(),q.c(),Dn=c(),Jn=b("p"),Jn.textContent=xs,Je=c(),D.c(),Pn=c(),un=b("p"),un.textContent=Gs,ue=c(),K.c(),Kn=c(),h(yn.$$.fragment),ye=c(),dn=b("p"),dn.textContent=Vs,de=c(),h(st.$$.fragment),be=c(),bn=b("p"),bn.innerHTML=Ns,Te=c(),h(Tn.$$.fragment),we=c(),h(wn.$$.fragment),Ue=c(),Un=b("p"),Un.textContent=Rs,fe=c(),h(at.$$.fragment),je=c(),fn=b("p"),fn.textContent=Ws,ge=c(),h(jn.$$.fragment),ke=c(),On=b("p"),this.h()},l(t){const e=ja("svelte-u9bgzb",document.head);l=T(e,"META",{name:!0,content:!0}),e.forEach(s),i=r(t),n=T(t,"P",{}),ve(n).forEach(s),p=r(t),M(d.$$.fragment,t),f=r(t),M(j.$$.fragment,t),tl=r(t),C.l(t),Nn=r(t),rt=T(t,"P",{"data-svelte-h":!0}),U(rt)!=="svelte-yxy9gx"&&(rt.innerHTML=De),nl=r(t),Z.l(t),Rn=r(t),M(mt.$$.fragment,t),ll=r(t),ot=T(t,"P",{"data-svelte-h":!0}),U(ot)!=="svelte-vnjte0"&&(ot.innerHTML=Pe),el=r(t),M(pt.$$.fragment,t),sl=r(t),M(ht.$$.fragment,t),al=r(t),Mt=T(t,"P",{"data-svelte-h":!0}),U(Mt)!=="svelte-s9ftvh"&&(Mt.textContent=Ke),il=r(t),M(Jt.$$.fragment,t),cl=r(t),M(ut.$$.fragment,t),rl=r(t),yt=T(t,"P",{"data-svelte-h":!0}),U(yt)!=="svelte-1lyz06"&&(yt.textContent=Oe),ml=r(t),M(dt.$$.fragment,t),ol=r(t),bt=T(t,"P",{"data-svelte-h":!0}),U(bt)!=="svelte-14f47ia"&&(bt.innerHTML=ts),pl=r(t),G.l(t),Wn=r(t),Tt=T(t,"P",{"data-svelte-h":!0}),U(Tt)!=="svelte-1b7s8e9"&&(Tt.textContent=ns),hl=r(t),nt=T(t,"DIV",{class:!0,"data-svelte-h":!0}),U(nt)!=="svelte-47wedv"&&(nt.innerHTML=ls),Ml=r(t),wt=T(t,"P",{"data-svelte-h":!0}),U(wt)!=="svelte-1f3nki3"&&(wt.textContent=es),Jl=r(t),M(Ut.$$.fragment,t),ul=r(t),N.l(t),Xn=r(t),ft=T(t,"P",{"data-svelte-h":!0}),U(ft)!=="svelte-23keky"&&(ft.innerHTML=ss),yl=r(t),jt=T(t,"P",{"data-svelte-h":!0}),U(jt)!=="svelte-xi76ei"&&(jt.innerHTML=as),dl=r(t),W.l(t),zn=r(t),gt=T(t,"P",{"data-svelte-h":!0}),U(gt)!=="svelte-26cll"&&(gt.textContent=is),bl=r(t),z.l(t),Qn=r(t),kt=T(t,"P",{"data-svelte-h":!0}),U(kt)!=="svelte-11o0luf"&&(kt.innerHTML=cs),Tl=r(t),g=T(t,"P",{});var k=ve(g);$e=ct(k,"Giả sử các sự kiện “Câu trả lời bắt đầu ở "),En=T(k,"CODE",{"data-svelte-h":!0}),U(En)!=="svelte-8eqb3b"&&(En.textContent=rs),Ze=ct(k,"” và “Câu trả lời kết thúc ở "),Hn=T(k,"CODE",{"data-svelte-h":!0}),U(Hn)!=="svelte-9cistc"&&(Hn.textContent=ms),xe=ct(k,"” là độc lập, xác suất để câu trả lời bắt đầu tại "),Fn=T(k,"CODE",{"data-svelte-h":!0}),U(Fn)!=="svelte-8eqb3b"&&(Fn.textContent=os),Ge=ct(k," và kết thúc tại "),Yn=T(k,"CODE",{"data-svelte-h":!0}),U(Yn)!=="svelte-9cistc"&&(Yn.textContent=ps),Ve=ct(k,` là:
`),wl=Ja(k,!1),k.forEach(s),Ul=r(t),O=T(t,"P",{});var tt=ve(O);Ne=ct(tt,"Vì vậy, để tính tất cả các điểm, chúng ta chỉ cần tính tích"),fl=Ja(tt,!1),jl=ct(tt," với "),Sn=T(tt,"CODE",{"data-svelte-h":!0}),U(Sn)!=="svelte-1kp3szf"&&(Sn.textContent=hs),Re=ct(tt,"."),tt.forEach(s),gl=r(t),It=T(t,"P",{"data-svelte-h":!0}),U(It)!=="svelte-1xmjzd"&&(It.textContent=Ms),kl=r(t),M(vt.$$.fragment,t),Il=r(t),E.l(t),An=r(t),_t=T(t,"P",{"data-svelte-h":!0}),U(_t)!=="svelte-2b9cpo"&&(_t.innerHTML=Js),vl=r(t),M(Bt.$$.fragment,t),_l=r(t),Ct=T(t,"P",{"data-svelte-h":!0}),U(Ct)!=="svelte-flep9b"&&(Ct.textContent=us),Bl=r(t),M($t.$$.fragment,t),Cl=r(t),M(lt.$$.fragment,t),$l=r(t),Zt=T(t,"P",{"data-svelte-h":!0}),U(Zt)!=="svelte-bd0wb9"&&(Zt.innerHTML=ys),Zl=r(t),M(xt.$$.fragment,t),xl=r(t),Gt=T(t,"P",{"data-svelte-h":!0}),U(Gt)!=="svelte-13pxc0p"&&(Gt.textContent=ds),Gl=r(t),M(Vt.$$.fragment,t),Vl=r(t),M(Nt.$$.fragment,t),Nl=r(t),Rt=T(t,"P",{"data-svelte-h":!0}),U(Rt)!=="svelte-1plqxrv"&&(Rt.textContent=bs),Rl=r(t),M(et.$$.fragment,t),Wl=r(t),M(Wt.$$.fragment,t),Xl=r(t),Xt=T(t,"P",{"data-svelte-h":!0}),U(Xt)!=="svelte-9nxsrn"&&(Xt.innerHTML=Ts),zl=r(t),M(zt.$$.fragment,t),Ql=r(t),M(Qt.$$.fragment,t),El=r(t),Et=T(t,"P",{"data-svelte-h":!0}),U(Et)!=="svelte-6gx3ai"&&(Et.innerHTML=ws),Hl=r(t),M(Ht.$$.fragment,t),Fl=r(t),M(Ft.$$.fragment,t),Yl=r(t),Yt=T(t,"P",{"data-svelte-h":!0}),U(Yt)!=="svelte-5fxjef"&&(Yt.textContent=Us),Sl=r(t),St=T(t,"P",{"data-svelte-h":!0}),U(St)!=="svelte-1uf262q"&&(St.innerHTML=fs),Al=r(t),M(At.$$.fragment,t),ql=r(t),M(qt.$$.fragment,t),Ll=r(t),Lt=T(t,"P",{"data-svelte-h":!0}),U(Lt)!=="svelte-18x7z5d"&&(Lt.innerHTML=js),Dl=r(t),Dt=T(t,"P",{"data-svelte-h":!0}),U(Dt)!=="svelte-1opqzxx"&&(Dt.textContent=gs),Pl=r(t),M(Pt.$$.fragment,t),Kl=r(t),M(Kt.$$.fragment,t),Ol=r(t),Ot=T(t,"P",{"data-svelte-h":!0}),U(Ot)!=="svelte-uya1e8"&&(Ot.innerHTML=ks),te=r(t),M(tn.$$.fragment,t),ne=r(t),M(nn.$$.fragment,t),le=r(t),ln=T(t,"P",{"data-svelte-h":!0}),U(ln)!=="svelte-m3vijj"&&(ln.textContent=Is),ee=r(t),M(en.$$.fragment,t),se=r(t),sn=T(t,"P",{"data-svelte-h":!0}),U(sn)!=="svelte-1lpkcws"&&(sn.textContent=vs),ae=r(t),M(an.$$.fragment,t),ie=r(t),cn=T(t,"P",{"data-svelte-h":!0}),U(cn)!=="svelte-1gz6xtn"&&(cn.textContent=_s),ce=r(t),rn=T(t,"P",{"data-svelte-h":!0}),U(rn)!=="svelte-55erzg"&&(rn.innerHTML=Bs),re=r(t),M(mn.$$.fragment,t),me=r(t),on=T(t,"P",{"data-svelte-h":!0}),U(on)!=="svelte-1ep0q9j"&&(on.innerHTML=Cs),oe=r(t),F.l(t),qn=r(t),pn=T(t,"P",{"data-svelte-h":!0}),U(pn)!=="svelte-hfdr9q"&&(pn.textContent=$s),pe=r(t),M(hn.$$.fragment,t),he=r(t),S.l(t),Ln=r(t),Mn=T(t,"P",{"data-svelte-h":!0}),U(Mn)!=="svelte-1tvxzle"&&(Mn.textContent=Zs),Me=r(t),q.l(t),Dn=r(t),Jn=T(t,"P",{"data-svelte-h":!0}),U(Jn)!=="svelte-glqw3l"&&(Jn.textContent=xs),Je=r(t),D.l(t),Pn=r(t),un=T(t,"P",{"data-svelte-h":!0}),U(un)!=="svelte-10lv4ty"&&(un.textContent=Gs),ue=r(t),K.l(t),Kn=r(t),M(yn.$$.fragment,t),ye=r(t),dn=T(t,"P",{"data-svelte-h":!0}),U(dn)!=="svelte-t47wam"&&(dn.textContent=Vs),de=r(t),M(st.$$.fragment,t),be=r(t),bn=T(t,"P",{"data-svelte-h":!0}),U(bn)!=="svelte-57me3a"&&(bn.innerHTML=Ns),Te=r(t),M(Tn.$$.fragment,t),we=r(t),M(wn.$$.fragment,t),Ue=r(t),Un=T(t,"P",{"data-svelte-h":!0}),U(Un)!=="svelte-1xx830h"&&(Un.textContent=Rs),fe=r(t),M(at.$$.fragment,t),je=r(t),fn=T(t,"P",{"data-svelte-h":!0}),U(fn)!=="svelte-5dm25f"&&(fn.textContent=Ws),ge=r(t),M(jn.$$.fragment,t),ke=r(t),On=T(t,"P",{}),ve(On).forEach(s),this.h()},h(){Le(l,"name","hf:doc:metadata"),Le(l,"content",ni),Le(nt,"class","flex justify-center"),wl.a=null,fl.a=jl},m(t,e){I(document.head,l),a(t,i,e),a(t,n,e),a(t,p,e),J(d,t,e),a(t,f,e),J(j,t,e),a(t,tl,e),gn[B].m(t,e),a(t,Nn,e),a(t,rt,e),a(t,nl,e),kn[$].m(t,e),a(t,Rn,e),J(mt,t,e),a(t,ll,e),a(t,ot,e),a(t,el,e),J(pt,t,e),a(t,sl,e),J(ht,t,e),a(t,al,e),a(t,Mt,e),a(t,il,e),J(Jt,t,e),a(t,cl,e),J(ut,t,e),a(t,rl,e),a(t,yt,e),a(t,ml,e),J(dt,t,e),a(t,ol,e),a(t,bt,e),a(t,pl,e),In[x].m(t,e),a(t,Wn,e),a(t,Tt,e),a(t,hl,e),a(t,nt,e),a(t,Ml,e),a(t,wt,e),a(t,Jl,e),J(Ut,t,e),a(t,ul,e),vn[V].m(t,e),a(t,Xn,e),a(t,ft,e),a(t,yl,e),a(t,jt,e),a(t,dl,e),_n[R].m(t,e),a(t,zn,e),a(t,gt,e),a(t,bl,e),Bn[X].m(t,e),a(t,Qn,e),a(t,kt,e),a(t,Tl,e),a(t,g,e),I(g,$e),I(g,En),I(g,Ze),I(g,Hn),I(g,xe),I(g,Fn),I(g,Ge),I(g,Yn),I(g,Ve),wl.m(da,g),a(t,Ul,e),a(t,O,e),I(O,Ne),fl.m(ba,O),I(O,jl),I(O,Sn),I(O,Re),a(t,gl,e),a(t,It,e),a(t,kl,e),J(vt,t,e),a(t,Il,e),Cn[Q].m(t,e),a(t,An,e),a(t,_t,e),a(t,vl,e),J(Bt,t,e),a(t,_l,e),a(t,Ct,e),a(t,Bl,e),J($t,t,e),a(t,Cl,e),J(lt,t,e),a(t,$l,e),a(t,Zt,e),a(t,Zl,e),J(xt,t,e),a(t,xl,e),a(t,Gt,e),a(t,Gl,e),J(Vt,t,e),a(t,Vl,e),J(Nt,t,e),a(t,Nl,e),a(t,Rt,e),a(t,Rl,e),J(et,t,e),a(t,Wl,e),J(Wt,t,e),a(t,Xl,e),a(t,Xt,e),a(t,zl,e),J(zt,t,e),a(t,Ql,e),J(Qt,t,e),a(t,El,e),a(t,Et,e),a(t,Hl,e),J(Ht,t,e),a(t,Fl,e),J(Ft,t,e),a(t,Yl,e),a(t,Yt,e),a(t,Sl,e),a(t,St,e),a(t,Al,e),J(At,t,e),a(t,ql,e),J(qt,t,e),a(t,Ll,e),a(t,Lt,e),a(t,Dl,e),a(t,Dt,e),a(t,Pl,e),J(Pt,t,e),a(t,Kl,e),J(Kt,t,e),a(t,Ol,e),a(t,Ot,e),a(t,te,e),J(tn,t,e),a(t,ne,e),J(nn,t,e),a(t,le,e),a(t,ln,e),a(t,ee,e),J(en,t,e),a(t,se,e),a(t,sn,e),a(t,ae,e),J(an,t,e),a(t,ie,e),a(t,cn,e),a(t,ce,e),a(t,rn,e),a(t,re,e),J(mn,t,e),a(t,me,e),a(t,on,e),a(t,oe,e),$n[H].m(t,e),a(t,qn,e),a(t,pn,e),a(t,pe,e),J(hn,t,e),a(t,he,e),Zn[Y].m(t,e),a(t,Ln,e),a(t,Mn,e),a(t,Me,e),xn[A].m(t,e),a(t,Dn,e),a(t,Jn,e),a(t,Je,e),Gn[L].m(t,e),a(t,Pn,e),a(t,un,e),a(t,ue,e),Vn[P].m(t,e),a(t,Kn,e),J(yn,t,e),a(t,ye,e),a(t,dn,e),a(t,de,e),J(st,t,e),a(t,be,e),a(t,bn,e),a(t,Te,e),J(Tn,t,e),a(t,we,e),J(wn,t,e),a(t,Ue,e),a(t,Un,e),a(t,fe,e),J(at,t,e),a(t,je,e),a(t,fn,e),a(t,ge,e),J(jn,t,e),a(t,ke,e),a(t,On,e),Ie=!0},p(t,[e]){const k={};e&1&&(k.fw=t[0]),d.$set(k);let tt=B;B=zs(t),B!==tt&&(_(),m(gn[tt],1,1,()=>{gn[tt]=null}),v(),C=gn[B],C||(C=gn[B]=Xs[B](t),C.c()),o(C,1),C.m(Nn.parentNode,Nn));let We=$;$=Es(t),$!==We&&(_(),m(kn[We],1,1,()=>{kn[We]=null}),v(),Z=kn[$],Z||(Z=kn[$]=Qs[$](t),Z.c()),o(Z,1),Z.m(Rn.parentNode,Rn));let Xe=x;x=Fs(t),x!==Xe&&(_(),m(In[Xe],1,1,()=>{In[Xe]=null}),v(),G=In[x],G||(G=In[x]=Hs[x](t),G.c()),o(G,1),G.m(Wn.parentNode,Wn));let ze=V;V=Ss(t),V!==ze&&(_(),m(vn[ze],1,1,()=>{vn[ze]=null}),v(),N=vn[V],N||(N=vn[V]=Ys[V](t),N.c()),o(N,1),N.m(Xn.parentNode,Xn));let Qe=R;R=qs(t),R!==Qe&&(_(),m(_n[Qe],1,1,()=>{_n[Qe]=null}),v(),W=_n[R],W||(W=_n[R]=As[R](t),W.c()),o(W,1),W.m(zn.parentNode,zn));let Ee=X;X=Ds(t),X!==Ee&&(_(),m(Bn[Ee],1,1,()=>{Bn[Ee]=null}),v(),z=Bn[X],z||(z=Bn[X]=Ls[X](t),z.c()),o(z,1),z.m(Qn.parentNode,Qn));let He=Q;Q=Ks(t),Q!==He&&(_(),m(Cn[He],1,1,()=>{Cn[He]=null}),v(),E=Cn[Q],E||(E=Cn[Q]=Ps[Q](t),E.c()),o(E,1),E.m(An.parentNode,An));const ma={};e&2&&(ma.$$scope={dirty:e,ctx:t}),lt.$set(ma);const oa={};e&2&&(oa.$$scope={dirty:e,ctx:t}),et.$set(oa);let Fe=H;H=ta(t),H!==Fe&&(_(),m($n[Fe],1,1,()=>{$n[Fe]=null}),v(),F=$n[H],F||(F=$n[H]=Os[H](t),F.c()),o(F,1),F.m(qn.parentNode,qn));let Ye=Y;Y=la(t),Y!==Ye&&(_(),m(Zn[Ye],1,1,()=>{Zn[Ye]=null}),v(),S=Zn[Y],S||(S=Zn[Y]=na[Y](t),S.c()),o(S,1),S.m(Ln.parentNode,Ln));let Se=A;A=sa(t),A!==Se&&(_(),m(xn[Se],1,1,()=>{xn[Se]=null}),v(),q=xn[A],q||(q=xn[A]=ea[A](t),q.c()),o(q,1),q.m(Dn.parentNode,Dn));let Ae=L;L=ia(t),L!==Ae&&(_(),m(Gn[Ae],1,1,()=>{Gn[Ae]=null}),v(),D=Gn[L],D||(D=Gn[L]=aa[L](t),D.c()),o(D,1),D.m(Pn.parentNode,Pn));let qe=P;P=ra(t),P!==qe&&(_(),m(Vn[qe],1,1,()=>{Vn[qe]=null}),v(),K=Vn[P],K||(K=Vn[P]=ca[P](t),K.c()),o(K,1),K.m(Kn.parentNode,Kn));const pa={};e&2&&(pa.$$scope={dirty:e,ctx:t}),st.$set(pa);const ha={};e&2&&(ha.$$scope={dirty:e,ctx:t}),at.$set(ha)},i(t){Ie||(o(d.$$.fragment,t),o(j.$$.fragment,t),o(C),o(Z),o(mt.$$.fragment,t),o(pt.$$.fragment,t),o(ht.$$.fragment,t),o(Jt.$$.fragment,t),o(ut.$$.fragment,t),o(dt.$$.fragment,t),o(G),o(Ut.$$.fragment,t),o(N),o(W),o(z),o(vt.$$.fragment,t),o(E),o(Bt.$$.fragment,t),o($t.$$.fragment,t),o(lt.$$.fragment,t),o(xt.$$.fragment,t),o(Vt.$$.fragment,t),o(Nt.$$.fragment,t),o(et.$$.fragment,t),o(Wt.$$.fragment,t),o(zt.$$.fragment,t),o(Qt.$$.fragment,t),o(Ht.$$.fragment,t),o(Ft.$$.fragment,t),o(At.$$.fragment,t),o(qt.$$.fragment,t),o(Pt.$$.fragment,t),o(Kt.$$.fragment,t),o(tn.$$.fragment,t),o(nn.$$.fragment,t),o(en.$$.fragment,t),o(an.$$.fragment,t),o(mn.$$.fragment,t),o(F),o(hn.$$.fragment,t),o(S),o(q),o(D),o(K),o(yn.$$.fragment,t),o(st.$$.fragment,t),o(Tn.$$.fragment,t),o(wn.$$.fragment,t),o(at.$$.fragment,t),o(jn.$$.fragment,t),Ie=!0)},o(t){m(d.$$.fragment,t),m(j.$$.fragment,t),m(C),m(Z),m(mt.$$.fragment,t),m(pt.$$.fragment,t),m(ht.$$.fragment,t),m(Jt.$$.fragment,t),m(ut.$$.fragment,t),m(dt.$$.fragment,t),m(G),m(Ut.$$.fragment,t),m(N),m(W),m(z),m(vt.$$.fragment,t),m(E),m(Bt.$$.fragment,t),m($t.$$.fragment,t),m(lt.$$.fragment,t),m(xt.$$.fragment,t),m(Vt.$$.fragment,t),m(Nt.$$.fragment,t),m(et.$$.fragment,t),m(Wt.$$.fragment,t),m(zt.$$.fragment,t),m(Qt.$$.fragment,t),m(Ht.$$.fragment,t),m(Ft.$$.fragment,t),m(At.$$.fragment,t),m(qt.$$.fragment,t),m(Pt.$$.fragment,t),m(Kt.$$.fragment,t),m(tn.$$.fragment,t),m(nn.$$.fragment,t),m(en.$$.fragment,t),m(an.$$.fragment,t),m(mn.$$.fragment,t),m(F),m(hn.$$.fragment,t),m(S),m(q),m(D),m(K),m(yn.$$.fragment,t),m(st.$$.fragment,t),m(Tn.$$.fragment,t),m(wn.$$.fragment,t),m(at.$$.fragment,t),m(jn.$$.fragment,t),Ie=!1},d(t){t&&(s(i),s(n),s(p),s(f),s(tl),s(Nn),s(rt),s(nl),s(Rn),s(ll),s(ot),s(el),s(sl),s(al),s(Mt),s(il),s(cl),s(rl),s(yt),s(ml),s(ol),s(bt),s(pl),s(Wn),s(Tt),s(hl),s(nt),s(Ml),s(wt),s(Jl),s(ul),s(Xn),s(ft),s(yl),s(jt),s(dl),s(zn),s(gt),s(bl),s(Qn),s(kt),s(Tl),s(g),s(Ul),s(O),s(gl),s(It),s(kl),s(Il),s(An),s(_t),s(vl),s(_l),s(Ct),s(Bl),s(Cl),s($l),s(Zt),s(Zl),s(xl),s(Gt),s(Gl),s(Vl),s(Nl),s(Rt),s(Rl),s(Wl),s(Xl),s(Xt),s(zl),s(Ql),s(El),s(Et),s(Hl),s(Fl),s(Yl),s(Yt),s(Sl),s(St),s(Al),s(ql),s(Ll),s(Lt),s(Dl),s(Dt),s(Pl),s(Kl),s(Ol),s(Ot),s(te),s(ne),s(le),s(ln),s(ee),s(se),s(sn),s(ae),s(ie),s(cn),s(ce),s(rn),s(re),s(me),s(on),s(oe),s(qn),s(pn),s(pe),s(he),s(Ln),s(Mn),s(Me),s(Dn),s(Jn),s(Je),s(Pn),s(un),s(ue),s(Kn),s(ye),s(dn),s(de),s(be),s(bn),s(Te),s(we),s(Ue),s(Un),s(fe),s(je),s(fn),s(ge),s(ke),s(On)),s(l),u(d,t),u(j,t),gn[B].d(t),kn[$].d(t),u(mt,t),u(pt,t),u(ht,t),u(Jt,t),u(ut,t),u(dt,t),In[x].d(t),u(Ut,t),vn[V].d(t),_n[R].d(t),Bn[X].d(t),u(vt,t),Cn[Q].d(t),u(Bt,t),u($t,t),u(lt,t),u(xt,t),u(Vt,t),u(Nt,t),u(et,t),u(Wt,t),u(zt,t),u(Qt,t),u(Ht,t),u(Ft,t),u(At,t),u(qt,t),u(Pt,t),u(Kt,t),u(tn,t),u(nn,t),u(en,t),u(an,t),u(mn,t),$n[H].d(t),u(hn,t),Zn[Y].d(t),xn[A].d(t),Gn[L].d(t),Vn[P].d(t),u(yn,t),u(st,t),u(Tn,t),u(wn,t),u(at,t),u(jn,t)}}}const ni='{"title":"Fast tokenizers in the QA pipeline","local":"fast-tokenizers-in-the-qa-pipeline","sections":[{"title":"Sử dụng pipeline question-answering","local":"sử-dụng-pipeline-question-answering","sections":[],"depth":2},{"title":"Sử dụng mô hình cho tác vụ hỏi đáp","local":"sử-dụng-mô-hình-cho-tác-vụ-hỏi-đáp","sections":[],"depth":2},{"title":"Xử lý các ngữ cảnh dài","local":"xử-lý-các-ngữ-cảnh-dài","sections":[],"depth":2}],"depth":1}';function li(y,l,i){let n="pt";return wa(()=>{const p=new URLSearchParams(window.location.search);i(0,n=p.get("fw")||"pt")}),[n]}class pi extends Ua{constructor(l){super(),fa(this,l,li,ti,Ta,{})}}export{pi as component};

Xet Storage Details

Size:
90.3 kB
·
Xet hash:
32b4cee8e10dc48d897af3123d08ffdcc0ba4204f7f918d00517a711bf4d9e3f

Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.