Buckets:
// Page module for the "tokenizers-check" page (chapter 6 wrap-up, Spanish text).
// NOTE(review): the c/l/h/m/p/i/o/d fragment object and the `data-svelte-h`
// markers look like Svelte compiler output. The single-letter helpers are
// defined in ../chunks/* and are not visible here, so their exact semantics
// should be confirmed against those chunks before changing call order.
import { s as G, n as F, o as N } from "../chunks/scheduler.37c15a92.js";
import {
  S as O,
  i as R,
  g as f,
  s,
  r as w,
  A as W,
  h as d,
  f as a,
  c as r,
  j as A,
  u as E,
  x as T,
  k as B,
  y as D,
  a as n,
  v as y,
  d as S,
  t as L,
  w as H,
} from "../chunks/index.2bf4358c.js";
import { C as I } from "../chunks/CourseFloatingBanner.6add7356.js";
import { H as J } from "../chunks/Heading.8ada512a.js";
import { E as K } from "../chunks/getInferenceSnippets.b37612c0.js";

// Serialized page metadata written into the <meta name="hf:doc:metadata"> tag.
const V = '{"title":"Tokenizadores, listo!","local":"tokenizers-check","sections":[],"depth":1}';

/**
 * Builds the fragment object for this page.
 *
 * The returned object exposes the methods c, l, h, m, p, i, o and d. The
 * statements inside each method run in the same order as in the minified
 * original.
 *
 * @param {*} M - Unused by this fragment.
 * @returns {object} The fragment object.
 */
function Q(M) {
  // Static copy rendered by the page (kept verbatim).
  const congratsText = "Gran trabajo terminando este capítulo!";
  const introText = "Luego de esta profundizacion en los tokenizadores, deberías:";
  const bulletsHtml =
    "<li>Ser capaz de entrenar un nuevo tokenizador usando un existente como plantilla</li> <li>Entender como usar los offsets para mapear las posiciones de los tokens a sus trozos de texto original</li> <li>Conocer las diferencias entre BPE, WordPiece y Unigram</li> <li>Ser capaz de mezclar y combinar los bloques provistos por la librería 🤗 Tokenizers para construir tu propio tokenizador</li> <li>Ser capaz de usar el tokenizador dentro de la librería 🤗 Transformers.</li>";

  // Node handles, assigned in c() or l() and consumed by m() and d().
  let metaTag;
  let gapAfterMeta;
  let leadingPara;
  let gapAfterLeadingPara;
  let gapAfterHeading;
  let gapAfterBanner;
  let congratsPara;
  let gapAfterCongrats;
  let introPara;
  let gapAfterIntro;
  let bulletList;
  let gapAfterList;
  let gapAfterSourceLink;
  let trailingPara;
  // Guard flag: set in m() and i(), cleared in o().
  let isActive;

  // Child components, constructed in the same order as the original.
  const heading = new J({
    props: {
      title: "Tokenizadores, listo!",
      local: "tokenizers-check",
      headingTag: "h1",
    },
  });
  const banner = new I({
    props: {
      chapter: 6,
      classNames: "absolute z-10 right-0 top-0",
    },
  });
  const sourceLink = new K({
    props: {
      source: "https://github.com/huggingface/course/blob/main/chapters/es/chapter6/9.mdx",
    },
  });

  return {
    // Creates every node from scratch, then applies attributes via h().
    c() {
      metaTag = f("meta");
      gapAfterMeta = s();
      leadingPara = f("p");
      gapAfterLeadingPara = s();
      w(heading.$$.fragment);
      gapAfterHeading = s();
      w(banner.$$.fragment);
      gapAfterBanner = s();
      congratsPara = f("p");
      congratsPara.textContent = congratsText;
      gapAfterCongrats = s();
      introPara = f("p");
      introPara.textContent = introText;
      gapAfterIntro = s();
      bulletList = f("ul");
      bulletList.innerHTML = bulletsHtml;
      gapAfterList = s();
      w(sourceLink.$$.fragment);
      gapAfterSourceLink = s();
      trailingPara = f("p");
      this.h();
    },

    // Obtains the same nodes through the d/r/E helpers from `nodes` and from
    // document.head instead of creating them (presumably hydration — confirm).
    // Static content is only rewritten when the value returned by T() differs
    // from the expected marker string.
    l(nodes) {
      const headNodes = W("svelte-u9bgzb", document.head);
      metaTag = d(headNodes, "META", { name: true, content: true });
      headNodes.forEach(a);
      gapAfterMeta = r(nodes);
      leadingPara = d(nodes, "P", {});
      A(leadingPara).forEach(a);
      gapAfterLeadingPara = r(nodes);
      E(heading.$$.fragment, nodes);
      gapAfterHeading = r(nodes);
      E(banner.$$.fragment, nodes);
      gapAfterBanner = r(nodes);
      congratsPara = d(nodes, "P", { "data-svelte-h": true });
      if (T(congratsPara) !== "svelte-3z1det") {
        congratsPara.textContent = congratsText;
      }
      gapAfterCongrats = r(nodes);
      introPara = d(nodes, "P", { "data-svelte-h": true });
      if (T(introPara) !== "svelte-6klo4x") {
        introPara.textContent = introText;
      }
      gapAfterIntro = r(nodes);
      bulletList = d(nodes, "UL", { "data-svelte-h": true });
      if (T(bulletList) !== "svelte-qla4gz") {
        bulletList.innerHTML = bulletsHtml;
      }
      gapAfterList = r(nodes);
      E(sourceLink.$$.fragment, nodes);
      gapAfterSourceLink = r(nodes);
      trailingPara = d(nodes, "P", {});
      A(trailingPara).forEach(a);
      this.h();
    },

    // Sets the name/content attributes of the metadata <meta> element.
    h() {
      B(metaTag, "name", "hf:doc:metadata");
      B(metaTag, "content", V);
    },

    // Places the meta tag under document.head and everything else under
    // `target` (relative to `anchor`), in document order.
    m(target, anchor) {
      D(document.head, metaTag);
      n(target, gapAfterMeta, anchor);
      n(target, leadingPara, anchor);
      n(target, gapAfterLeadingPara, anchor);
      y(heading, target, anchor);
      n(target, gapAfterHeading, anchor);
      y(banner, target, anchor);
      n(target, gapAfterBanner, anchor);
      n(target, congratsPara, anchor);
      n(target, gapAfterCongrats, anchor);
      n(target, introPara, anchor);
      n(target, gapAfterIntro, anchor);
      n(target, bulletList, anchor);
      n(target, gapAfterList, anchor);
      y(sourceLink, target, anchor);
      n(target, gapAfterSourceLink, anchor);
      n(target, trailingPara, anchor);
      isActive = true;
    },

    // Update hook: the imported F is used as-is.
    p: F,

    // Runs S() on each child fragment once, until o() clears the guard flag.
    i(local) {
      if (isActive) {
        return;
      }
      S(heading.$$.fragment, local);
      S(banner.$$.fragment, local);
      S(sourceLink.$$.fragment, local);
      isActive = true;
    },

    // Runs L() on each child fragment and clears the guard flag.
    o(local) {
      L(heading.$$.fragment, local);
      L(banner.$$.fragment, local);
      L(sourceLink.$$.fragment, local);
      isActive = false;
    },

    // Teardown: body nodes are passed to a() only when `detaching` is truthy;
    // the head meta tag and the child components are always handled.
    d(detaching) {
      if (detaching) {
        a(gapAfterMeta);
        a(leadingPara);
        a(gapAfterLeadingPara);
        a(gapAfterHeading);
        a(gapAfterBanner);
        a(congratsPara);
        a(gapAfterCongrats);
        a(introPara);
        a(gapAfterIntro);
        a(bulletList);
        a(gapAfterList);
        a(gapAfterSourceLink);
        a(trailingPara);
      }
      a(metaTag);
      H(heading, detaching);
      H(banner, detaching);
      H(sourceLink, detaching);
    },
  };
}

/**
 * Instance function handed to R() by the component constructor.
 *
 * Registers a callback through N() that reads the `fw` query parameter from
 * the current URL and discards the value.
 *
 * @param {*} M - Unused.
 * @returns {Array} Always an empty array.
 */
function X(M) {
  N(() => {
    new URLSearchParams(window.location.search).get("fw");
  });
  return [];
}

/** Page component: wires X and Q into the imported base class through R(). */
class ne extends O {
  constructor(o) {
    super();
    R(this, o, X, Q, G, {});
  }
}

export { ne as component };
Xet Storage Details
- Size:
- 2.79 kB
- Xet hash:
- 713eedd3ecafcb612345ccd7bc34fdd3395defc8136773d3f628791c8214d4fd
·
Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.