Buckets:
| import{s as Jt,o as ht,n as me}from"../chunks/scheduler.37c15a92.js";import{S as yt,i as Tt,g as p,s as t,r as u,A as Ut,h as c,f as l,c as n,j as mt,u as d,x as r,k as j,y as gt,a,v as M,d as m,t as J,w as h}from"../chunks/index.2bf4358c.js";import{T as Me}from"../chunks/Tip.363c041f.js";import{Y as jt}from"../chunks/Youtube.1e50a667.js";import{C as y}from"../chunks/CodeBlock.4e987730.js";import{C as bt}from"../chunks/CourseFloatingBanner.9ff4c771.js";import{H as Je,E as ft}from"../chunks/getInferenceSnippets.24b50994.js";function wt(g){let i,T="✏️ <strong>Prova tu!</strong> Clicca su alcuni degli URL nel payload JSON per farti un’idea del tipo di informazione a cui è collegato ogni issue GitHub.";return{c(){i=p("p"),i.innerHTML=T},l(o){i=c(o,"P",{"data-svelte-h":!0}),r(i)!=="svelte-ql7iz5"&&(i.innerHTML=T)},m(o,U){a(o,i,U)},p:me,d(o){o&&l(i)}}}function xt(g){let i,T='⚠️ Fai attenzione a non condividere un notebook con il tuo <code>GITHUB_TOKEN</code> al suo interno. Ti consigliamo di cancellare l’ultima cella una volta che l’hai eseguita per evitare di far trapelare quest’informazione accidentalmente. Meglio ancora, salva il tuo token in un file <em>.env</em> e usa la <a href="https://github.com/theskumar/python-dotenv" rel="nofollow">libreria <code>python-dotenv</code></a> per caricarlo automaticamente come una variabile d’ambiente.';return{c(){i=p("p"),i.innerHTML=T},l(o){i=c(o,"P",{"data-svelte-h":!0}),r(i)!=="svelte-bmnegk"&&(i.innerHTML=T)},m(o,U){a(o,i,U)},p:me,d(o){o&&l(i)}}}function Zt(g){let i,T="✏️ <strong>Prova tu!</strong> Calcola il tempo medio che ci vuole a chiudere un issue su 🤗 Datasets. Potrebbe essere utile usare la funzione <code>Dataset.filter()</code> per eliminare le richieste di pull e gli issue aperti, e puoi usare la funzione <code>Dataset.set_format()</code> per convertire il dataset in un <code>DataFrame</code> così che puoi facilmente manipolare i timestamp <code>created_at</code> e <code>closed_at</code>. 
Per dei punti bonus, calcola il tempo medio che ci vuole a chiudere le richieste di pull.";return{c(){i=p("p"),i.innerHTML=T},l(o){i=c(o,"P",{"data-svelte-h":!0}),r(i)!=="svelte-bcwlrn"&&(i.innerHTML=T)},m(o,U){a(o,i,U)},p:me,d(o){o&&l(i)}}}function Gt(g){let i,T="✏️ <strong>Prova tu!</strong> Usa le tue credenziali dell’Hub Hugging Face per ottenere un token e creare una repository vuota chiamata <code>github-issues</code>. Ricordati di <strong>non salvere mai le tue credenziali</strong> su Colab o qualunque altra repository, perché potrebbero essere recuperate da malintenzionati.";return{c(){i=p("p"),i.innerHTML=T},l(o){i=c(o,"P",{"data-svelte-h":!0}),r(i)!=="svelte-17hauie"&&(i.innerHTML=T)},m(o,U){a(o,i,U)},p:me,d(o){o&&l(i)}}}function Rt(g){let i,T='💡 Puoi caricare un dataset nell’Hub di Hugging Face anche direttamente dal terminale usando <code>huggingface-cli</code> e un po’ di magia Git. La <a href="https://huggingface.co/docs/datasets/share#share-a-dataset-using-the-cli" rel="nofollow">guida a 🤗 Datasets</a> spiega come farlo.';return{c(){i=p("p"),i.innerHTML=T},l(o){i=c(o,"P",{"data-svelte-h":!0}),r(i)!=="svelte-ttry9d"&&(i.innerHTML=T)},m(o,U){a(o,i,U)},p:me,d(o){o&&l(i)}}}function It(g){let i,T='✏️ <strong>Prova tu!</strong> Usa l’applicazione <code>dataset-tagging</code> e la <a href="https://github.com/huggingface/datasets/blob/master/templates/README_guide.md" rel="nofollow">guida 🤗 Datasets</a> per completare il file <em>README.md</em> per il tuo dataset di issue di GitHub.';return{c(){i=p("p"),i.innerHTML=T},l(o){i=c(o,"P",{"data-svelte-h":!0}),r(i)!=="svelte-1iu8kwm"&&(i.innerHTML=T)},m(o,U){a(o,i,U)},p:me,d(o){o&&l(i)}}}function zt(g){let i,T="✏️ <strong>Prova tu!</strong> Segui i passi che abbiamo eseguito in questa sezione per creare un dataset di issue GitHub per la tua libreria open source preferita (ovviamente scegli qualcosa di diverso da 🤗 Datasets!). 
Per punti bonus, esegui il fine-tuning di un classificatore multiclasse per predirre i tag presenti nel campo <code>labels</code>.";return{c(){i=p("p"),i.innerHTML=T},l(o){i=c(o,"P",{"data-svelte-h":!0}),r(i)!=="svelte-aozvfr"&&(i.innerHTML=T)},m(o,U){a(o,i,U)},p:me,d(o){o&&l(i)}}}function Ct(g){let i,T,o,U,k,ye,V,Te,$,ra='A volte il dataset che ti serve per la tua applicazione NLP non esiste, per cui dovrai crearlo da te. In questa sezione ti mostreremo come creare un corpus di <a href="https://github.com/features/issues" rel="nofollow">issue da GitHub</a>, usate solitamente per tenere traccia dei bug e delle feature nelle repository su GitHub. Questo corpus può essere usato in diversi modi, ad esempio:',Ue,B,oa="<li>Esplorare il tempo impiegato per chiudere un issue, o per effettuare dei pull</li> <li>Addestrare un <em>classificatore multiclasse</em> che assegna a ogni issue dei metadati sulla base della descrizione dell’issue (ad esempio, “bug”, “enhancement”, “question”)</li> <li>Creare un motore di ricerca semantico per trovare quale issue corrisponde a una richiesta dell’utente</li>",ge,H,ua="Ci focalizzeremo sulla creazione del corpus, e nella prossima sezione affronteremo la creazione di un motore di ricerca semantico. Useremo gli issue GitHub associate a un progetto open source molto popolare: 🤗 Datasets! Diamo un’occhiata a come recuperare i dati e come esplorare le informazioni contenute negli issue.",je,W,be,Y,da='Puoi trovare tutte gli issue in 🤗 Datasets navigando nella <a href="https://github.com/huggingface/datasets/issues" rel="nofollow">sezione Issues della repository</a>. Come si vede dallo screenshot, al momento della scrittura c’erano 331 issue aperti e 668 issue chiusi.',fe,b,Ma='<img src="https://huggingface.co/datasets/huggingface-course/documentation-images/resolve/main/en/chapter5/datasets-issues.png" alt="The GitHub issues associated with 🤗 Datasets." 
width="80%"/>',we,F,ma="Se clicchi su una di questi issue vedrai che contiene un titolo, una descrizione, e un set di etichette che caratterizzano l’issue. Un esempio è mostrato nello screenshot successivo.",xe,f,Ja='<img src="https://huggingface.co/datasets/huggingface-course/documentation-images/resolve/main/en/chapter5/datasets-issues-single.png" alt="A typical GitHub issue in the 🤗 Datasets repository." width="80%"/>',Ze,Q,ha='Per scaricare gli issue della repository, useremo la <a href="https://docs.github.com/en/rest" rel="nofollow">REST API di GitHub</a> per interrogare l’<a href="https://docs.github.com/en/rest/reference/issues#list-repository-issues" rel="nofollow">endpoint <code>Issues</code></a>. Questo endpoint restituisce una lista di oggetti JSON, e ogni oggetto contiene un gran numero di campi, tra cui il titolo e la descrizione, così come dei metadati circo lo status dell’issue e altro ancora.',Ge,E,ya="Una maniera conveniente di scaricare gli issue è attraverso la libreria <code>requests</code>, che rappresenta il metodo standard di fare richieste HTTP su Python. Puoi installa la libreria attraverso il codice:",Re,S,Ie,A,Ta="Una volta che la libreria è stata installata, puoi effettuare una richiesta GET all’endpoint <code>Issues</code> utilizzando la funzione <code>requests.get()</code>. Ad esempio, puoi eseguire il comando mostrato di seguito per recuperare il primo issue nella prima pagina:",ze,L,Ce,q,Ua="L’oggetto <code>response</code> contiene un sacco di informazioni utili sulla richiesta, compreso il codice di stato HTTP:",Xe,D,ve,P,Ne,O,ga='Lo status <code>200</code> indica che la richiesta ha avuto buon fine (puoi trovare una lista di codici di stato HTTTP <a href="https://it.wikipedia.org/wiki/Codici_di_stato_HTTP" rel="nofollow">qui</a>). Ma ciò che ci interessa davvero è il <em>payload</em>, a cui è possibile accedere utilizzando diversi formati come byte, stringh, o JSON. 
Visto che sappiamo che i nostri issue sono in formato JSON, diamo un’occhiata al payload come segue:',_e,K,ke,ss,Ve,es,ja="Wow, quante informazioni! Possiamo vedere alcuni campi utili come <code>title</code>, <code>body</code> e <code>number</code> che descrivono l’issue, così come informazioni sull’utente che l’ha aperto.",$e,w,Be,ls,ba='Come descritto nella <a href="https://docs.github.com/en/rest/overview/resources-in-the-rest-api#rate-limiting" rel="nofollow">documentazione di GitHub</a>, le richieste senza autenticazione sono limitate a 60 ogni ora. Benché possiamo aumentare il parametro della query <code>per_page</code> per ridurre il numero di richieste, raggiungerai comunque il limite su qualunque repository che ha qualche migliaio di issue. Quindi, dovresti seguire le <a href="https://docs.github.com/en/github/authenticating-to-github/creating-a-personal-access-token" rel="nofollow">istruzioni</a> su come creare un <em>token di accesso personale</em> così che puoi aumentare il limite a 5.000 richieste ogni ora. Una volta che hai ottenuto il tuo token, puoi includerlo come parte dell’header della richiesta:',He,as,We,x,Ye,ts,fa="Ora che abbiamo il nostro token di accesso, creiamo una funzione che scarichi tutti gli issue da una repository GitHub:",Fe,ns,Qe,is,wa="Ora quando eseguiremo <code>fetch_issues()</code>, scaricherà tutti gli issue in batch per evitare di superare il limite di GitHub del numero di richieste per ora; il risultato sarà conservato in un file <em>repository_name-issues.jsonl</em>, in cui ogni linea è un oggetto JSON che rappresenta un issue. Usiamo questa funzione per recuperare tutti gli issue da 🤗 Datasets:",Ee,ps,Se,cs,xa='Una volta che gli issue sono stati scaricati, possiamo caricarli in locale usando le nuove abilità imparate nella <a href="/course/chapter5/2">sezione 2</a>:',Ae,rs,Le,os,qe,us,Za='Benissimo, abbiamo creato il nostro primo dataset da zero! 
Ma perché ci sono migliaia di issue quando la <a href="https://github.com/huggingface/datasets/issues" rel="nofollow">sezione Issues</a> della repository 🤗 Datasets mostra circa 1,000 issue in totale 🤔? Come indicato nella <a href="https://docs.github.com/en/rest/reference/issues#list-issues-assigned-to-the-authenticated-user" rel="nofollow">documentazione di GitHub</a>, è perché abbiamo scaricato anche le richieste di pull:',De,ds,Ga="<p>GitHub’s REST API v3 considers every pull request an issue, but not every issue is a pull request. For this reason, “Issues” endpoints may return both issues and pull requests in the response. You can identify pull requests by the <code>pull_request</code> key. Be aware that the <code>id</code> of a pull request returned from “Issues” endpoints will be an issue id.</p>",Pe,Ms,Ra="(<em>La REST API v3 di GitHub considera ogni richiesta di pull un issue, ma non ogni issue è una richiesta di pull. Per questa ragione, gli endpoint “Issues” potrebbe tornare sia gli issue che le richieste di pull. È possibile identificare le richieste di pull utilizzando la chiave <code>pull_request</code>. Tieni presente che l’<code>id</code> di una richiesta di pull resituita dagli endpoint <code>Issues</code> sarà un id di un issue.</em>)",Oe,ms,Ia="Poichè i contenuti degli issue e delle richieste di pull sono molto diversi, facciamo un po’ di preprocessing per permetterci di distinguere tra i due.",Ke,Js,sl,hs,za='Il frammento precedente della documentazione di GitHub ci dice che la colonna <code>pull_request</code> può essere utilizzata per distinguere gli issue e le richieste di pull. Diamo uno sguardo a un esempio casuale per vedere qual è la differenza. 
Come abbiamo fatto nella <a href="/course/chapter5/3">sezione 3</a>, concateneremo <code>Dataset.shuffle()</code> e <code>Dataset.select()</code> per creare un campione random, e poi zipperemo le colonne <code>html_url</code> e <code>pull_request</code> così da poter paragonare i diversi URL:',el,ys,ll,Ts,al,Us,Ca="Possiamo vedere che ogni richiesta di pull è associata a diversi URL, mentre i comuni issue hanno un’entrata <code>None</code>. Possiamo usare questa distinzione per crare una nuova colonna <code>is_pull_request</code> che controlla se il campo <code>pull_request</code> sia <code>None</code> o meno:",tl,gs,nl,Z,il,js,Xa="Benché potremmo procedere e pulire ulteriormente il dataset eliminando o rinominando alcune colonne, è solitamente buona prassi lasciare il dataset quando più intatto è possibile in questo stadio, così che può essere utilizzato facilmente in più applicazioni.",pl,bs,va="Prima di caricare il nostro dataset sull’Hub Hugging Face, dobbiamo occuparci di una cosa che manca: i commenti associati a ogni issue e richiesta di pull. Hai indovinato, li aggiungeremo utilizzando la REST API di GitHub!",cl,fs,rl,ws,Na="Come mostrato negli screenshot di seguito, i commenti associati a un issue o una richiesta di pull offrono una fonte molto ricca di informazioni, soprattutto se siamo interessati a costruire un motore di ricerca per rispondere alle richieste degli utenti sulla libreria.",ol,G,_a='<img src="https://huggingface.co/datasets/huggingface-course/documentation-images/resolve/main/en/chapter5/datasets-issues-comment.png" alt="Comments associated with an issue about 🤗 Datasets." width="80%"/>',ul,xs,ka='La REST API di GitHub offre un <a href="https://docs.github.com/en/rest/reference/issues#list-issue-comments" rel="nofollow">endpoint <code>Comments</code></a> che restituisce tutti i commenti associati con un numero di issue. 
Testiamo quest’endpoint per vedere cosa restituisce:',dl,Zs,Ml,Gs,ml,Rs,Va="Possiamo vedere che il commento è archiviato nel campo <code>body</code>, quindi possiamo scvrivere una semplice funzione che restituisce tutti i commenti associati con un issue estraendo i contenuti di <code>body</code> per ogni elemento in <code>response.json()</code>:",Jl,Is,hl,zs,yl,Cs,$a="Sembra andar bene, quindi possiamo usare <code>Dataset.map()</code> per aggiungere una nuova colonna <code>comments</code> a ogni usse nel nostro dataset:",Tl,Xs,Ul,vs,Ba="Come passaggio finale, salviamo il dataset esteso assieme ai nostri dati non processati, così da poter caricare entrambi sull’Hub:",gl,Ns,jl,_s,bl,ks,fl,Vs,Ha='Ora che abbiamo il nostro dataset esteso, è arrivato il momento di caricarlo sull’Hub, così da poterlo condividere con la community! Per caricare il dataset useremo la <a href="https://github.com/huggingface/huggingface_hub" rel="nofollow">libreria 🤗 Hub</a>, che ci permette di interagire con l’Hub di Hugging Face attraverso un’API di Python. 🤗 Hub è preinstallato con 🤗 Transformers, così possiamo usarlo da subito. Ad esempio, possiamo usare la funzione <code>list_datastes()</code> per avere informazioni su tutti i dataset pubblici attualmente presenti sull’Hub:',wl,$s,xl,Bs,Zl,Hs,Wa="Possiamo vedere che al momento ci sono circa 1.500 dataset sull’Hub, e la funzione <code>list_datasets()</code> inoltre permette di avere alcuni metadati su ciascuna repository.",Gl,Ws,Ya="Per ciò che ci riguarda, la prima cosa che dobbiamo fare è crare una nuova repository nell’Hub. Per far ciò abbiamo bisogno di un token di autentificazione, che pouò essere ottenuto effettuando l’accesso nell’Hub Hugging Face con la funzione <code>notebook_login()</code>:",Rl,Ys,Il,Fs,Fa="Questo creerà un widget in cui puoi inserire il tuo username e la tua password, e un token API verrà salvato in <em>~/.huggingface/token</em>. 
Se stai eseguendo il codice in un terminale, puoi effettuare l’accesso attraverso il comando:",zl,Qs,Cl,Es,Qa="Una volta fatto questo, possiamo crare una nuova repository con la funzione <code>create_repo()</code>:",Xl,Ss,vl,As,Nl,Ls,Ea="In quest’esempio, abbiamo creato una repository vuota chiamata <code>github-issues</code> con l’username <code>lewtun</code> (l’username dovrebbe essere quello del tuo account Hub quando esegui questo codice!).",_l,R,kl,qs,Sa="Ora, cloniamo la repository dall’Hub alla nostra macchina e copiamo al suo interno i file del nostro dataset. 🤗 Hub contiene una classe <code>Repository</code> che ha al suo interno molti dei comandi più comuni di Git, per cui per clonare la repository in remoto dobbiamo semplicemente fornire l’URL e il percorso locale in cui desideriamo clonare:",Vl,Ds,$l,Ps,Aa="Di default, diverse estensioni file (ad esempio <em>.bin</em>, <em>.gz</em> e <em>.zip</em>) sono registrate da Git LFS, così che i file di grandi dimensioni possono essere gestiti all’interno dello stesso workflow. Puoi trovare una lista delle estensioni di file monitorati nel file <em>.gitattributes</em> della repository. Per includere il formato JSON Lines a questa lista, possiamo utilizzare il comando:",Bl,Os,Hl,Ks,La="Ora possiamo usare <code>Repository.push_to_hub()</code> per caricare il dataset sull’Hub:",Wl,se,Yl,ee,qa="Se navighiamo fino all’URL contenuto in <code>repo_url</code>, vedremo che il file del nostro dataset è stato caricato.",Fl,I,Da='<img src="https://huggingface.co/datasets/huggingface-course/documentation-images/resolve/main/en/chapter5/hub-repo.png" alt="Our dataset repository on the Hugging Face Hub." width="80%"/>',Ql,le,Pa="Da qui, chiunque può scaricare il dataset semplicemente inserendo l’ID della repository come argomento <code>path</code> di <code>load_dataset()</code>:",El,ae,Sl,te,Al,ne,Oa="Bene, abbiamo caricato il nostro dataset sull’Hub, e può essere utilizzato da tutti! 
C’è un’altra cosa importante che dobbiamo fare: aggiungere una <em>dataset card</em> che spiega come è stato creato il corpus, e offre altre informazioni utili per la community.",Ll,z,ql,ie,Dl,pe,Ka="I dataset ben-documentati sono più utili agli altri utenti (compreso il futuro te!), poiché spiegano il contesto per permettere agli utenti di decidere se un dataset può essere utile, e valutare gli eventuali bias o rischi associati nell’utilizzo del dataset.",Pl,ce,st="Sull’Hug di Hugging Face, queste informazioni si trovano nel file <em>README.md</em> della repository. Ci sono due passaggi principali che dovresti seguire prima di creare questo file:",Ol,re,et='<li>Usa l’<a href="https://huggingface.co/datasets/tagging/" rel="nofollow">applicatione <code>datasets-tagging</code></a> per creare tag di metadati in formato YAML. Questi tag sono usato per una serie di funzioni di ricerca sull’Hub di Hugging Face, e assicurano che il tuo dataset possa essere facilmente trovato dai membri della community. Poichè abbiamo creato un nostro dataset, dovrai clonare la repository <code>datasets-tagging</code>, ed eseguire l’applicazione in locale. Ecco com’è l’interfaccia:</li>',Kl,C,lt='<img src="https://huggingface.co/datasets/huggingface-course/documentation-images/resolve/main/en/chapter5/datasets-tagger.png" alt="The 'datasets-tagging' interface." width="80%"/>',sa,X,at='<li>Leggi la <a href="https://github.com/huggingface/datasets/blob/master/templates/README_guide.md" rel="nofollow">guida 🤗 Datasets</a> sulla creazione di dataset card informative, e usala come template.</li>',ea,oe,tt="Puoi creare il file <em>README.md</em> direttamente sull’Hub, e puoi trovare un modello per una dataset card nella repository <code>lewtun/github-issues</code>. Di seguito è mostrato uno screenshot di una dataset card già compilata.",la,v,nt='<img src="https://huggingface.co/datasets/huggingface-course/documentation-images/resolve/main/en/chapter5/dataset-card.png" alt="A dataset card." 
width="80%"/>',aa,N,ta,ue,it="È tutto! Abbiamo visto in questa sezione che creare un buon dataset può essere un’impresa, ma per fortuna caricarlo e condividerlo con la community è molto più semplice. Nella prossima sezione useremo il nostro nuovo dataset per creare un motore di ricerca semantico con 🤗 Datasets, che abbina alle domande gli issue e i commenti più rilevanti.",na,_,ia,de,pa,he,ca;return k=new Je({props:{title:"Creare il proprio dataset",local:"creare-il-proprio-dataset",headingTag:"h1"}}),V=new bt({props:{chapter:5,classNames:"absolute z-10 right-0 top-0",notebooks:[{label:"Google Colab",value:"https://colab.research.google.com/github/huggingface/notebooks/blob/master/course/it/chapter5/section5.ipynb"},{label:"Aws Studio",value:"https://studiolab.sagemaker.aws/import/github/huggingface/notebooks/blob/master/course/it/chapter5/section5.ipynb"}]}}),W=new Je({props:{title:"Recuperare i dati",local:"recuperare-i-dati",headingTag:"h2"}}),S=new y({props:{code:"IXBpcCUyMGluc3RhbGwlMjByZXF1ZXN0cw==",highlighted:"!pip install requests",wrap:!1}}),L=new y({props:{code:"aW1wb3J0JTIwcmVxdWVzdHMlMEElMEF1cmwlMjAlM0QlMjAlMjJodHRwcyUzQSUyRiUyRmFwaS5naXRodWIuY29tJTJGcmVwb3MlMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGaXNzdWVzJTNGcGFnZSUzRDElMjZwZXJfcGFnZSUzRDElMjIlMEFyZXNwb25zZSUyMCUzRCUyMHJlcXVlc3RzLmdldCh1cmwp",highlighted:`<span class="hljs-keyword">import</span> requests | |
| url = <span class="hljs-string">"https://api.github.com/repos/huggingface/datasets/issues?page=1&per_page=1"</span> | |
| response = requests.get(url)`,wrap:!1}}),D=new y({props:{code:"cmVzcG9uc2Uuc3RhdHVzX2NvZGU=",highlighted:"response.status_code",wrap:!1}}),P=new y({props:{code:"MjAw",highlighted:'<span class="hljs-number">200</span>',wrap:!1}}),K=new y({props:{code:"cmVzcG9uc2UuanNvbigp",highlighted:"response.json()",wrap:!1}}),ss=new y({props:{code:"JTVCJTdCJ3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnJlcG9zJTJGaHVnZ2luZ2ZhY2UlMkZkYXRhc2V0cyUyRmlzc3VlcyUyRjI3OTInJTJDJTBBJTIwJTIwJ3JlcG9zaXRvcnlfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmFwaS5naXRodWIuY29tJTJGcmVwb3MlMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJyUyQyUwQSUyMCUyMCdsYWJlbHNfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmFwaS5naXRodWIuY29tJTJGcmVwb3MlMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGaXNzdWVzJTJGMjc5MiUyRmxhYmVscyU3QiUyRm5hbWUlN0QnJTJDJTBBJTIwJTIwJ2NvbW1lbnRzX3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnJlcG9zJTJGaHVnZ2luZ2ZhY2UlMkZkYXRhc2V0cyUyRmlzc3VlcyUyRjI3OTIlMkZjb21tZW50cyclMkMlMEElMjAlMjAnZXZlbnRzX3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnJlcG9zJTJGaHVnZ2luZ2ZhY2UlMkZkYXRhc2V0cyUyRmlzc3VlcyUyRjI3OTIlMkZldmVudHMnJTJDJTBBJTIwJTIwJ2h0bWxfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmdpdGh1Yi5jb20lMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGcHVsbCUyRjI3OTInJTJDJTBBJTIwJTIwJ2lkJyUzQSUyMDk2ODY1MDI3NCUyQyUwQSUyMCUyMCdub2RlX2lkJyUzQSUyMCdNREV4T2xCMWJHeFNaWEYxWlhOME56RXdOelV5TWpjMCclMkMlMEElMjAlMjAnbnVtYmVyJyUzQSUyMDI3OTIlMkMlMEElMjAlMjAndGl0bGUnJTNBJTIwJ1VwZGF0ZSUyMEdvb0FRJyUyQyUwQSUyMCUyMCd1c2VyJyUzQSUyMCU3Qidsb2dpbiclM0ElMjAnYmhhdml0dnlhbWFsaWsnJTJDJTBBJTIwJTIwJTIwJ2lkJyUzQSUyMDE5NzE4ODE4JTJDJTBBJTIwJTIwJTIwJ25vZGVfaWQnJTNBJTIwJ01EUTZWWE5sY2pFNU56RTRPREU0JyUyQyUwQSUyMCUyMCUyMCdhdmF0YXJfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmF2YXRhcnMuZ2l0aHVidXNlcmNvbnRlbnQuY29tJTJGdSUyRjE5NzE4ODE4JTNGdiUzRDQnJTJDJTBBJTIwJTIwJTIwJ2dyYXZhdGFyX2lkJyUzQSUyMCcnJTJDJTBBJTIwJTIwJTIwJ3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnVzZXJzJTJGYmhhdml0dnlhbWFsaWsnJTJDJTBBJTIwJTIwJTIwJ2h0bWxfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmdpdGh1Yi5jb20lMkZiaGF2aXR2e
WFtYWxpayclMkMlMEElMjAlMjAlMjAnZm9sbG93ZXJzX3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnVzZXJzJTJGYmhhdml0dnlhbWFsaWslMkZmb2xsb3dlcnMnJTJDJTBBJTIwJTIwJTIwJ2ZvbGxvd2luZ191cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGYXBpLmdpdGh1Yi5jb20lMkZ1c2VycyUyRmJoYXZpdHZ5YW1hbGlrJTJGZm9sbG93aW5nJTdCJTJGb3RoZXJfdXNlciU3RCclMkMlMEElMjAlMjAlMjAnZ2lzdHNfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmFwaS5naXRodWIuY29tJTJGdXNlcnMlMkZiaGF2aXR2eWFtYWxpayUyRmdpc3RzJTdCJTJGZ2lzdF9pZCU3RCclMkMlMEElMjAlMjAlMjAnc3RhcnJlZF91cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGYXBpLmdpdGh1Yi5jb20lMkZ1c2VycyUyRmJoYXZpdHZ5YW1hbGlrJTJGc3RhcnJlZCU3QiUyRm93bmVyJTdEJTdCJTJGcmVwbyU3RCclMkMlMEElMjAlMjAlMjAnc3Vic2NyaXB0aW9uc191cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGYXBpLmdpdGh1Yi5jb20lMkZ1c2VycyUyRmJoYXZpdHZ5YW1hbGlrJTJGc3Vic2NyaXB0aW9ucyclMkMlMEElMjAlMjAlMjAnb3JnYW5pemF0aW9uc191cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGYXBpLmdpdGh1Yi5jb20lMkZ1c2VycyUyRmJoYXZpdHZ5YW1hbGlrJTJGb3JncyclMkMlMEElMjAlMjAlMjAncmVwb3NfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmFwaS5naXRodWIuY29tJTJGdXNlcnMlMkZiaGF2aXR2eWFtYWxpayUyRnJlcG9zJyUyQyUwQSUyMCUyMCUyMCdldmVudHNfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmFwaS5naXRodWIuY29tJTJGdXNlcnMlMkZiaGF2aXR2eWFtYWxpayUyRmV2ZW50cyU3QiUyRnByaXZhY3klN0QnJTJDJTBBJTIwJTIwJTIwJ3JlY2VpdmVkX2V2ZW50c191cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGYXBpLmdpdGh1Yi5jb20lMkZ1c2VycyUyRmJoYXZpdHZ5YW1hbGlrJTJGcmVjZWl2ZWRfZXZlbnRzJyUyQyUwQSUyMCUyMCUyMCd0eXBlJyUzQSUyMCdVc2VyJyUyQyUwQSUyMCUyMCUyMCdzaXRlX2FkbWluJyUzQSUyMEZhbHNlJTdEJTJDJTBBJTIwJTIwJ2xhYmVscyclM0ElMjAlNUIlNUQlMkMlMEElMjAlMjAnc3RhdGUnJTNBJTIwJ29wZW4nJTJDJTBBJTIwJTIwJ2xvY2tlZCclM0ElMjBGYWxzZSUyQyUwQSUyMCUyMCdhc3NpZ25lZSclM0ElMjBOb25lJTJDJTBBJTIwJTIwJ2Fzc2lnbmVlcyclM0ElMjAlNUIlNUQlMkMlMEElMjAlMjAnbWlsZXN0b25lJyUzQSUyME5vbmUlMkMlMEElMjAlMjAnY29tbWVudHMnJTNBJTIwMSUyQyUwQSUyMCUyMCdjcmVhdGVkX2F0JyUzQSUyMCcyMDIxLTA4LTEyVDExJTNBNDAlM0ExOFonJTJDJTBBJTIwJTIwJ3VwZGF0ZWRfYXQnJTNBJTIwJzIwMjEtMDgtMTJUMTIlM0EzMSUzQTE3WiclMkMlMEElMjAlMjAnY2xvc2VkX2F0JyUzQSUyME5vbmUlMkMlMEElMjAlMjAnYXV0aG9yX2Fzc29jaWF0aW9uJyUzQSUyMCdDT05UUklCVVRPUiclM
kMlMEElMjAlMjAnYWN0aXZlX2xvY2tfcmVhc29uJyUzQSUyME5vbmUlMkMlMEElMjAlMjAncHVsbF9yZXF1ZXN0JyUzQSUyMCU3Qid1cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGYXBpLmdpdGh1Yi5jb20lMkZyZXBvcyUyRmh1Z2dpbmdmYWNlJTJGZGF0YXNldHMlMkZwdWxscyUyRjI3OTInJTJDJTBBJTIwJTIwJTIwJ2h0bWxfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmdpdGh1Yi5jb20lMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGcHVsbCUyRjI3OTInJTJDJTBBJTIwJTIwJTIwJ2RpZmZfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmdpdGh1Yi5jb20lMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGcHVsbCUyRjI3OTIuZGlmZiclMkMlMEElMjAlMjAlMjAncGF0Y2hfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmdpdGh1Yi5jb20lMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGcHVsbCUyRjI3OTIucGF0Y2gnJTdEJTJDJTBBJTIwJTIwJ2JvZHknJTNBJTIwJyU1Qkdvb0FRJTVEKGh0dHBzJTNBJTJGJTJGZ2l0aHViLmNvbSUyRmFsbGVuYWklMkZnb29hcSklMjBkYXRhc2V0JTIwd2FzJTIwcmVjZW50bHklMjB1cGRhdGVkJTIwYWZ0ZXIlMjBzcGxpdHMlMjB3ZXJlJTIwYWRkZWQlMjBmb3IlMjB0aGUlMjBzYW1lLiUyMFRoaXMlMjBQUiUyMGNvbnRhaW5zJTIwbmV3JTIwdXBkYXRlZCUyMEdvb0FRJTIwd2l0aCUyMHRyYWluJTJGdmFsJTJGdGVzdCUyMHNwbGl0cyUyMGFuZCUyMHVwZGF0ZWQlMjBSRUFETUUlMjBhcyUyMHdlbGwuJyUyQyUwQSUyMCUyMCdwZXJmb3JtZWRfdmlhX2dpdGh1Yl9hcHAnJTNBJTIwTm9uZSU3RCU1RA==",highlighted:`[{<span class="hljs-string">'url'</span>: <span class="hljs-string">'https://api.github.com/repos/huggingface/datasets/issues/2792'</span>, | |
| <span class="hljs-string">'repository_url'</span>: <span class="hljs-string">'https://api.github.com/repos/huggingface/datasets'</span>, | |
| <span class="hljs-string">'labels_url'</span>: <span class="hljs-string">'https://api.github.com/repos/huggingface/datasets/issues/2792/labels{/name}'</span>, | |
| <span class="hljs-string">'comments_url'</span>: <span class="hljs-string">'https://api.github.com/repos/huggingface/datasets/issues/2792/comments'</span>, | |
| <span class="hljs-string">'events_url'</span>: <span class="hljs-string">'https://api.github.com/repos/huggingface/datasets/issues/2792/events'</span>, | |
| <span class="hljs-string">'html_url'</span>: <span class="hljs-string">'https://github.com/huggingface/datasets/pull/2792'</span>, | |
| <span class="hljs-string">'id'</span>: <span class="hljs-number">968650274</span>, | |
| <span class="hljs-string">'node_id'</span>: <span class="hljs-string">'MDExOlB1bGxSZXF1ZXN0NzEwNzUyMjc0'</span>, | |
| <span class="hljs-string">'number'</span>: <span class="hljs-number">2792</span>, | |
| <span class="hljs-string">'title'</span>: <span class="hljs-string">'Update GooAQ'</span>, | |
| <span class="hljs-string">'user'</span>: {<span class="hljs-string">'login'</span>: <span class="hljs-string">'bhavitvyamalik'</span>, | |
| <span class="hljs-string">'id'</span>: <span class="hljs-number">19718818</span>, | |
| <span class="hljs-string">'node_id'</span>: <span class="hljs-string">'MDQ6VXNlcjE5NzE4ODE4'</span>, | |
| <span class="hljs-string">'avatar_url'</span>: <span class="hljs-string">'https://avatars.githubusercontent.com/u/19718818?v=4'</span>, | |
| <span class="hljs-string">'gravatar_id'</span>: <span class="hljs-string">''</span>, | |
| <span class="hljs-string">'url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik'</span>, | |
| <span class="hljs-string">'html_url'</span>: <span class="hljs-string">'https://github.com/bhavitvyamalik'</span>, | |
| <span class="hljs-string">'followers_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/followers'</span>, | |
| <span class="hljs-string">'following_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/following{/other_user}'</span>, | |
| <span class="hljs-string">'gists_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/gists{/gist_id}'</span>, | |
| <span class="hljs-string">'starred_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/starred{/owner}{/repo}'</span>, | |
| <span class="hljs-string">'subscriptions_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/subscriptions'</span>, | |
| <span class="hljs-string">'organizations_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/orgs'</span>, | |
| <span class="hljs-string">'repos_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/repos'</span>, | |
| <span class="hljs-string">'events_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/events{/privacy}'</span>, | |
| <span class="hljs-string">'received_events_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/received_events'</span>, | |
| <span class="hljs-string">'type'</span>: <span class="hljs-string">'User'</span>, | |
| <span class="hljs-string">'site_admin'</span>: <span class="hljs-literal">False</span>}, | |
| <span class="hljs-string">'labels'</span>: [], | |
| <span class="hljs-string">'state'</span>: <span class="hljs-string">'open'</span>, | |
| <span class="hljs-string">'locked'</span>: <span class="hljs-literal">False</span>, | |
| <span class="hljs-string">'assignee'</span>: <span class="hljs-literal">None</span>, | |
| <span class="hljs-string">'assignees'</span>: [], | |
| <span class="hljs-string">'milestone'</span>: <span class="hljs-literal">None</span>, | |
| <span class="hljs-string">'comments'</span>: <span class="hljs-number">1</span>, | |
| <span class="hljs-string">'created_at'</span>: <span class="hljs-string">'2021-08-12T11:40:18Z'</span>, | |
| <span class="hljs-string">'updated_at'</span>: <span class="hljs-string">'2021-08-12T12:31:17Z'</span>, | |
| <span class="hljs-string">'closed_at'</span>: <span class="hljs-literal">None</span>, | |
| <span class="hljs-string">'author_association'</span>: <span class="hljs-string">'CONTRIBUTOR'</span>, | |
| <span class="hljs-string">'active_lock_reason'</span>: <span class="hljs-literal">None</span>, | |
| <span class="hljs-string">'pull_request'</span>: {<span class="hljs-string">'url'</span>: <span class="hljs-string">'https://api.github.com/repos/huggingface/datasets/pulls/2792'</span>, | |
| <span class="hljs-string">'html_url'</span>: <span class="hljs-string">'https://github.com/huggingface/datasets/pull/2792'</span>, | |
| <span class="hljs-string">'diff_url'</span>: <span class="hljs-string">'https://github.com/huggingface/datasets/pull/2792.diff'</span>, | |
| <span class="hljs-string">'patch_url'</span>: <span class="hljs-string">'https://github.com/huggingface/datasets/pull/2792.patch'</span>}, | |
| <span class="hljs-string">'body'</span>: <span class="hljs-string">'[GooAQ](https://github.com/allenai/gooaq) dataset was recently updated after splits were added for the same. This PR contains new updated GooAQ with train/val/test splits and updated README as well.'</span>, | |
| <span class="hljs-string">'performed_via_github_app'</span>: <span class="hljs-literal">None</span>}]`,wrap:!1}}),w=new Me({props:{$$slots:{default:[wt]},$$scope:{ctx:g}}}),as=new y({props:{code:"R0lUSFVCX1RPS0VOJTIwJTNEJTIweHh4JTIwJTIwJTIzJTIwaW5zZXJpc2NpJTIwcXVpJTIwaWwlMjB0dW8lMjB0b2tlbiUyMEdpdEh1YiUwQWhlYWRlcnMlMjAlM0QlMjAlN0IlMjJBdXRob3JpemF0aW9uJTIyJTNBJTIwZiUyMnRva2VuJTIwJTdCR0lUSFVCX1RPS0VOJTdEJTIyJTdE",highlighted:`GITHUB_TOKEN = xxx <span class="hljs-comment"># inserisci qui il tuo token GitHub</span> | |
| headers = {<span class="hljs-string">"Authorization"</span>: <span class="hljs-string">f"token <span class="hljs-subst">{GITHUB_TOKEN}</span>"</span>}`,wrap:!1}}),x=new Me({props:{warning:!0,$$slots:{default:[xt]},$$scope:{ctx:g}}}),ns=new y({props:{code:"aW1wb3J0JTIwdGltZSUwQWltcG9ydCUyMG1hdGglMEFmcm9tJTIwcGF0aGxpYiUyMGltcG9ydCUyMFBhdGglMEFpbXBvcnQlMjBwYW5kYXMlMjBhcyUyMHBkJTBBZnJvbSUyMHRxZG0ubm90ZWJvb2slMjBpbXBvcnQlMjB0cWRtJTBBJTBBJTBBZGVmJTIwZmV0Y2hfaXNzdWVzKCUwQSUyMCUyMCUyMCUyMG93bmVyJTNEJTIyaHVnZ2luZ2ZhY2UlMjIlMkMlMEElMjAlMjAlMjAlMjByZXBvJTNEJTIyZGF0YXNldHMlMjIlMkMlMEElMjAlMjAlMjAlMjBudW1faXNzdWVzJTNEMTBfMDAwJTJDJTBBJTIwJTIwJTIwJTIwcmF0ZV9saW1pdCUzRDVfMDAwJTJDJTBBJTIwJTIwJTIwJTIwaXNzdWVzX3BhdGglM0RQYXRoKCUyMi4lMjIpJTJDJTBBKSUzQSUwQSUyMCUyMCUyMCUyMGlmJTIwbm90JTIwaXNzdWVzX3BhdGguaXNfZGlyKCklM0ElMEElMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjBpc3N1ZXNfcGF0aC5ta2RpcihleGlzdF9vayUzRFRydWUpJTBBJTBBJTIwJTIwJTIwJTIwYmF0Y2glMjAlM0QlMjAlNUIlNUQlMEElMjAlMjAlMjAlMjBhbGxfaXNzdWVzJTIwJTNEJTIwJTVCJTVEJTBBJTIwJTIwJTIwJTIwcGVyX3BhZ2UlMjAlM0QlMjAxMDAlMjAlMjAlMjMlMjBOdW1lcm8lMjBkaSUyMGlzc3VlJTIwZGElMjByZXN0aXR1aXJlJTIwcGVyJTIwcGFnaW5hJTBBJTIwJTIwJTIwJTIwbnVtX3BhZ2VzJTIwJTNEJTIwbWF0aC5jZWlsKG51bV9pc3N1ZXMlMjAlMkYlMjBwZXJfcGFnZSklMEElMjAlMjAlMjAlMjBiYXNlX3VybCUyMCUzRCUyMCUyMmh0dHBzJTNBJTJGJTJGYXBpLmdpdGh1Yi5jb20lMkZyZXBvcyUyMiUwQSUwQSUyMCUyMCUyMCUyMGZvciUyMHBhZ2UlMjBpbiUyMHRxZG0ocmFuZ2UobnVtX3BhZ2VzKSklM0ElMEElMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjMlMjBMYSUyMHF1ZXJ5JTIwaGElMjBzdGF0ZSUzRGFsbCUyMHBlciUyMG90dGVuZXJlJTIwc2lhJTIwZ2xpJTIwaXNzdWUlMjBhcGVydGklMjBjaGUlMjBxdWVsbGklMjBjaGl1c2klMEElMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjBxdWVyeSUyMCUzRCUyMGYlMjJpc3N1ZXMlM0ZwYWdlJTNEJTdCcGFnZSU3RCUyNnBlcl9wYWdlJTNEJTdCcGVyX3BhZ2UlN0QlMjZzdGF0ZSUzRGFsbCUyMiUwQSUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMGlzc3VlcyUyMCUzRCUyMHJlcXVlc3RzLmdldChmJTIyJTdCYmFzZV91cmwlN0QlMkYlN0Jvd25lciU3RCUyRiU3QnJlcG8lN0QlMkYlN0JxdWVyeSU3RCUyMiUyQyUyMGhlYWRlcnMlM0RoZWFkZXJzKSUwQSUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMGJhdGNoLmV4dGVuZChpc3N1ZXMuanNvbigpKSUwQSUwQS
UyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMGlmJTIwbGVuKGJhdGNoKSUyMCUzRSUyMHJhdGVfbGltaXQlMjBhbmQlMjBsZW4oYWxsX2lzc3VlcyklMjAlM0MlMjBudW1faXNzdWVzJTNBJTBBJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwYWxsX2lzc3Vlcy5leHRlbmQoYmF0Y2gpJTBBJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwYmF0Y2glMjAlM0QlMjAlNUIlNUQlMjAlMjAlMjMlMjBwdWxpYW1vJTIwbGElMjBiYXRjaCUyMHBlciUyMGlsJTIwdGVybWluZSUyMHN1Y2Nlc3Npdm8lMEElMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjBwcmludChmJTIyUmVhY2hlZCUyMEdpdEh1YiUyMHJhdGUlMjBsaW1pdC4lMjBTbGVlcGluZyUyMGZvciUyMG9uZSUyMGhvdXIlMjAuLi4lMjIpJTBBJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwdGltZS5zbGVlcCg2MCUyMColMjA2MCUyMCUyQiUyMDEpJTBBJTBBJTIwJTIwJTIwJTIwYWxsX2lzc3Vlcy5leHRlbmQoYmF0Y2gpJTBBJTIwJTIwJTIwJTIwZGYlMjAlM0QlMjBwZC5EYXRhRnJhbWUuZnJvbV9yZWNvcmRzKGFsbF9pc3N1ZXMpJTBBJTIwJTIwJTIwJTIwZGYudG9fanNvbihmJTIyJTdCaXNzdWVzX3BhdGglN0QlMkYlN0JyZXBvJTdELWlzc3Vlcy5qc29ubCUyMiUyQyUyMG9yaWVudCUzRCUyMnJlY29yZHMlMjIlMkMlMjBsaW5lcyUzRFRydWUpJTBBJTIwJTIwJTIwJTIwcHJpbnQoJTBBJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwZiUyMkRvd25sb2FkZWQlMjBhbGwlMjB0aGUlMjBpc3N1ZXMlMjBmb3IlMjAlN0JyZXBvJTdEISUyMERhdGFzZXQlMjBzdG9yZWQlMjBhdCUyMCU3Qmlzc3Vlc19wYXRoJTdEJTJGJTdCcmVwbyU3RC1pc3N1ZXMuanNvbmwlMjIlMEElMjAlMjAlMjAlMjAp",highlighted:`<span class="hljs-keyword">import</span> time | |
| <span class="hljs-keyword">import</span> math | |
| <span class="hljs-keyword">from</span> pathlib <span class="hljs-keyword">import</span> Path | |
| <span class="hljs-keyword">import</span> pandas <span class="hljs-keyword">as</span> pd | |
| <span class="hljs-keyword">from</span> tqdm.notebook <span class="hljs-keyword">import</span> tqdm | |
| <span class="hljs-keyword">def</span> <span class="hljs-title function_">fetch_issues</span>(<span class="hljs-params"> | |
| owner=<span class="hljs-string">"huggingface"</span>, | |
| repo=<span class="hljs-string">"datasets"</span>, | |
| num_issues=<span class="hljs-number">10_000</span>, | |
| rate_limit=<span class="hljs-number">5_000</span>, | |
| issues_path=Path(<span class="hljs-params"><span class="hljs-string">"."</span></span>), | |
| </span>): | |
| <span class="hljs-keyword">if</span> <span class="hljs-keyword">not</span> issues_path.is_dir(): | |
| issues_path.mkdir(exist_ok=<span class="hljs-literal">True</span>) | |
| batch = [] | |
| all_issues = [] | |
| per_page = <span class="hljs-number">100</span> <span class="hljs-comment"># Numero di issue da restituire per pagina</span> | |
| num_pages = math.ceil(num_issues / per_page) | |
| base_url = <span class="hljs-string">"https://api.github.com/repos"</span> | |
| <span class="hljs-keyword">for</span> page <span class="hljs-keyword">in</span> tqdm(<span class="hljs-built_in">range</span>(num_pages)): | |
| <span class="hljs-comment"># La query ha state=all per ottenere sia gli issue aperti che quelli chiusi</span> | |
| query = <span class="hljs-string">f"issues?page=<span class="hljs-subst">{page}</span>&per_page=<span class="hljs-subst">{per_page}</span>&state=all"</span> | |
| issues = requests.get(<span class="hljs-string">f"<span class="hljs-subst">{base_url}</span>/<span class="hljs-subst">{owner}</span>/<span class="hljs-subst">{repo}</span>/<span class="hljs-subst">{query}</span>"</span>, headers=headers) | |
| batch.extend(issues.json()) | |
| <span class="hljs-keyword">if</span> <span class="hljs-built_in">len</span>(batch) > rate_limit <span class="hljs-keyword">and</span> <span class="hljs-built_in">len</span>(all_issues) < num_issues: | |
| all_issues.extend(batch) | |
| batch = [] <span class="hljs-comment"># puliamo la batch per il termine successivo</span> | |
| <span class="hljs-built_in">print</span>(<span class="hljs-string">f"Reached GitHub rate limit. Sleeping for one hour ..."</span>) | |
| time.sleep(<span class="hljs-number">60</span> * <span class="hljs-number">60</span> + <span class="hljs-number">1</span>) | |
| all_issues.extend(batch) | |
| df = pd.DataFrame.from_records(all_issues) | |
| df.to_json(<span class="hljs-string">f"<span class="hljs-subst">{issues_path}</span>/<span class="hljs-subst">{repo}</span>-issues.jsonl"</span>, orient=<span class="hljs-string">"records"</span>, lines=<span class="hljs-literal">True</span>) | |
| <span class="hljs-built_in">print</span>( | |
| <span class="hljs-string">f"Downloaded all the issues for <span class="hljs-subst">{repo}</span>! Dataset stored at <span class="hljs-subst">{issues_path}</span>/<span class="hljs-subst">{repo}</span>-issues.jsonl"</span> | |
| )`,wrap:!1}}),ps=new y({props:{code:"JTIzJTIwQSUyMHNlY29uZGElMjBkZWxsYSUyMHR1YSUyMGNvbm5lc3Npb25lJTIwaW50ZXJuZXQlMkMlMjBjaSUyMHBvdHJlYmJlJTIwdm9sZXJlJTIwcXVhbGNoZSUyMHNlY29uZG8uLi4lMEFmZXRjaF9pc3N1ZXMoKQ==",highlighted:`<span class="hljs-comment"># A seconda della tua connessione internet, ci potrebbe volere qualche secondo...</span> | |
| fetch_issues()`,wrap:!1}}),rs=new y({props:{code:"aXNzdWVzX2RhdGFzZXQlMjAlM0QlMjBsb2FkX2RhdGFzZXQoJTIyanNvbiUyMiUyQyUyMGRhdGFfZmlsZXMlM0QlMjJkYXRhc2V0cy1pc3N1ZXMuanNvbmwlMjIlMkMlMjBzcGxpdCUzRCUyMnRyYWluJTIyKSUwQWlzc3Vlc19kYXRhc2V0",highlighted:`issues_dataset = load_dataset(<span class="hljs-string">"json"</span>, data_files=<span class="hljs-string">"datasets-issues.jsonl"</span>, split=<span class="hljs-string">"train"</span>) | |
| issues_dataset`,wrap:!1}}),os=new y({props:{code:"RGF0YXNldCglN0IlMEElMjAlMjAlMjAlMjBmZWF0dXJlcyUzQSUyMCU1Qid1cmwnJTJDJTIwJ3JlcG9zaXRvcnlfdXJsJyUyQyUyMCdsYWJlbHNfdXJsJyUyQyUyMCdjb21tZW50c191cmwnJTJDJTIwJ2V2ZW50c191cmwnJTJDJTIwJ2h0bWxfdXJsJyUyQyUyMCdpZCclMkMlMjAnbm9kZV9pZCclMkMlMjAnbnVtYmVyJyUyQyUyMCd0aXRsZSclMkMlMjAndXNlciclMkMlMjAnbGFiZWxzJyUyQyUyMCdzdGF0ZSclMkMlMjAnbG9ja2VkJyUyQyUyMCdhc3NpZ25lZSclMkMlMjAnYXNzaWduZWVzJyUyQyUyMCdtaWxlc3RvbmUnJTJDJTIwJ2NvbW1lbnRzJyUyQyUyMCdjcmVhdGVkX2F0JyUyQyUyMCd1cGRhdGVkX2F0JyUyQyUyMCdjbG9zZWRfYXQnJTJDJTIwJ2F1dGhvcl9hc3NvY2lhdGlvbiclMkMlMjAnYWN0aXZlX2xvY2tfcmVhc29uJyUyQyUyMCdwdWxsX3JlcXVlc3QnJTJDJTIwJ2JvZHknJTJDJTIwJ3RpbWVsaW5lX3VybCclMkMlMjAncGVyZm9ybWVkX3ZpYV9naXRodWJfYXBwJyU1RCUyQyUwQSUyMCUyMCUyMCUyMG51bV9yb3dzJTNBJTIwMzAxOSUwQSU3RCk=",highlighted:`Dataset({ | |
| features: [<span class="hljs-string">'url'</span>, <span class="hljs-string">'repository_url'</span>, <span class="hljs-string">'labels_url'</span>, <span class="hljs-string">'comments_url'</span>, <span class="hljs-string">'events_url'</span>, <span class="hljs-string">'html_url'</span>, <span class="hljs-string">'id'</span>, <span class="hljs-string">'node_id'</span>, <span class="hljs-string">'number'</span>, <span class="hljs-string">'title'</span>, <span class="hljs-string">'user'</span>, <span class="hljs-string">'labels'</span>, <span class="hljs-string">'state'</span>, <span class="hljs-string">'locked'</span>, <span class="hljs-string">'assignee'</span>, <span class="hljs-string">'assignees'</span>, <span class="hljs-string">'milestone'</span>, <span class="hljs-string">'comments'</span>, <span class="hljs-string">'created_at'</span>, <span class="hljs-string">'updated_at'</span>, <span class="hljs-string">'closed_at'</span>, <span class="hljs-string">'author_association'</span>, <span class="hljs-string">'active_lock_reason'</span>, <span class="hljs-string">'pull_request'</span>, <span class="hljs-string">'body'</span>, <span class="hljs-string">'timeline_url'</span>, <span class="hljs-string">'performed_via_github_app'</span>], | |
| num_rows: <span class="hljs-number">3019</span> | |
| })`,wrap:!1}}),Js=new Je({props:{title:"Pulire i dati",local:"pulire-i-dati",headingTag:"h2"}}),ys=new y({props:{code:"c2FtcGxlJTIwJTNEJTIwaXNzdWVzX2RhdGFzZXQuc2h1ZmZsZShzZWVkJTNENjY2KS5zZWxlY3QocmFuZ2UoMykpJTBBJTBBJTIzJTIwU3RhbXBpYW1vJTIwbGUlMjBlbnRyYXRlJTIwJTYwVVJMJTYwJTIwZSUyMCU2MHB1bGxfcmVxdWVzdCU2MCUwQWZvciUyMHVybCUyQyUyMHByJTIwaW4lMjB6aXAoc2FtcGxlJTVCJTIyaHRtbF91cmwlMjIlNUQlMkMlMjBzYW1wbGUlNUIlMjJwdWxsX3JlcXVlc3QlMjIlNUQpJTNBJTBBJTIwJTIwJTIwJTIwcHJpbnQoZiUyMiUzRSUzRSUyMFVSTCUzQSUyMCU3QnVybCU3RCUyMiklMEElMjAlMjAlMjAlMjBwcmludChmJTIyJTNFJTNFJTIwUHVsbCUyMHJlcXVlc3QlM0ElMjAlN0JwciU3RCU1Q24lMjIp",highlighted:`sample = issues_dataset.shuffle(seed=<span class="hljs-number">666</span>).select(<span class="hljs-built_in">range</span>(<span class="hljs-number">3</span>)) | |
| <span class="hljs-comment"># Stampiamo le entrate \`URL\` e \`pull_request\`</span> | |
| <span class="hljs-keyword">for</span> url, pr <span class="hljs-keyword">in</span> <span class="hljs-built_in">zip</span>(sample[<span class="hljs-string">"html_url"</span>], sample[<span class="hljs-string">"pull_request"</span>]): | |
| <span class="hljs-built_in">print</span>(<span class="hljs-string">f">> URL: <span class="hljs-subst">{url}</span>"</span>) | |
| <span class="hljs-built_in">print</span>(<span class="hljs-string">f">> Pull request: <span class="hljs-subst">{pr}</span>\\n"</span>)`,wrap:!1}}),Ts=new y({props:{code:"JTNFJTNFJTIwVVJMJTNBJTIwaHR0cHMlM0ElMkYlMkZnaXRodWIuY29tJTJGaHVnZ2luZ2ZhY2UlMkZkYXRhc2V0cyUyRnB1bGwlMkY4NTAlMEElM0UlM0UlMjBQdWxsJTIwcmVxdWVzdCUzQSUyMCU3Qid1cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGYXBpLmdpdGh1Yi5jb20lMkZyZXBvcyUyRmh1Z2dpbmdmYWNlJTJGZGF0YXNldHMlMkZwdWxscyUyRjg1MCclMkMlMjAnaHRtbF91cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGZ2l0aHViLmNvbSUyRmh1Z2dpbmdmYWNlJTJGZGF0YXNldHMlMkZwdWxsJTJGODUwJyUyQyUyMCdkaWZmX3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZnaXRodWIuY29tJTJGaHVnZ2luZ2ZhY2UlMkZkYXRhc2V0cyUyRnB1bGwlMkY4NTAuZGlmZiclMkMlMjAncGF0Y2hfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmdpdGh1Yi5jb20lMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGcHVsbCUyRjg1MC5wYXRjaCclN0QlMEElMEElM0UlM0UlMjBVUkwlM0ElMjBodHRwcyUzQSUyRiUyRmdpdGh1Yi5jb20lMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGaXNzdWVzJTJGMjc3MyUwQSUzRSUzRSUyMFB1bGwlMjByZXF1ZXN0JTNBJTIwTm9uZSUwQSUwQSUzRSUzRSUyMFVSTCUzQSUyMGh0dHBzJTNBJTJGJTJGZ2l0aHViLmNvbSUyRmh1Z2dpbmdmYWNlJTJGZGF0YXNldHMlMkZwdWxsJTJGNzgzJTBBJTNFJTNFJTIwUHVsbCUyMHJlcXVlc3QlM0ElMjAlN0IndXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmFwaS5naXRodWIuY29tJTJGcmVwb3MlMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGcHVsbHMlMkY3ODMnJTJDJTIwJ2h0bWxfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmdpdGh1Yi5jb20lMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGcHVsbCUyRjc4MyclMkMlMjAnZGlmZl91cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGZ2l0aHViLmNvbSUyRmh1Z2dpbmdmYWNlJTJGZGF0YXNldHMlMkZwdWxsJTJGNzgzLmRpZmYnJTJDJTIwJ3BhdGNoX3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZnaXRodWIuY29tJTJGaHVnZ2luZ2ZhY2UlMkZkYXRhc2V0cyUyRnB1bGwlMkY3ODMucGF0Y2gnJTdE",highlighted:`>> URL: https://github.com/huggingface/datasets/pull/<span class="hljs-number">850</span> | |
| >> Pull request: {<span class="hljs-string">'url'</span>: <span class="hljs-string">'https://api.github.com/repos/huggingface/datasets/pulls/850'</span>, <span class="hljs-string">'html_url'</span>: <span class="hljs-string">'https://github.com/huggingface/datasets/pull/850'</span>, <span class="hljs-string">'diff_url'</span>: <span class="hljs-string">'https://github.com/huggingface/datasets/pull/850.diff'</span>, <span class="hljs-string">'patch_url'</span>: <span class="hljs-string">'https://github.com/huggingface/datasets/pull/850.patch'</span>} | |
| >> URL: https://github.com/huggingface/datasets/issues/<span class="hljs-number">2773</span> | |
| >> Pull request: <span class="hljs-literal">None</span> | |
| >> URL: https://github.com/huggingface/datasets/pull/<span class="hljs-number">783</span> | |
| >> Pull request: {<span class="hljs-string">'url'</span>: <span class="hljs-string">'https://api.github.com/repos/huggingface/datasets/pulls/783'</span>, <span class="hljs-string">'html_url'</span>: <span class="hljs-string">'https://github.com/huggingface/datasets/pull/783'</span>, <span class="hljs-string">'diff_url'</span>: <span class="hljs-string">'https://github.com/huggingface/datasets/pull/783.diff'</span>, <span class="hljs-string">'patch_url'</span>: <span class="hljs-string">'https://github.com/huggingface/datasets/pull/783.patch'</span>}`,wrap:!1}}),gs=new y({props:{code:"aXNzdWVzX2RhdGFzZXQlMjAlM0QlMjBpc3N1ZXNfZGF0YXNldC5tYXAoJTBBJTIwJTIwJTIwJTIwbGFtYmRhJTIweCUzQSUyMCU3QiUyMmlzX3B1bGxfcmVxdWVzdCUyMiUzQSUyMEZhbHNlJTIwaWYlMjB4JTVCJTIycHVsbF9yZXF1ZXN0JTIyJTVEJTIwaXMlMjBOb25lJTIwZWxzZSUyMFRydWUlN0QlMEEp",highlighted:`issues_dataset = issues_dataset.<span class="hljs-built_in">map</span>( | |
| <span class="hljs-keyword">lambda</span> x: {<span class="hljs-string">"is_pull_request"</span>: <span class="hljs-literal">False</span> <span class="hljs-keyword">if</span> x[<span class="hljs-string">"pull_request"</span>] <span class="hljs-keyword">is</span> <span class="hljs-literal">None</span> <span class="hljs-keyword">else</span> <span class="hljs-literal">True</span>} | |
| )`,wrap:!1}}),Z=new Me({props:{$$slots:{default:[Zt]},$$scope:{ctx:g}}}),fs=new Je({props:{title:"Estendere il dataset",local:"estendere-il-dataset",headingTag:"h2"}}),Zs=new y({props:{code:"aXNzdWVfbnVtYmVyJTIwJTNEJTIwMjc5MiUwQXVybCUyMCUzRCUyMGYlMjJodHRwcyUzQSUyRiUyRmFwaS5naXRodWIuY29tJTJGcmVwb3MlMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGaXNzdWVzJTJGJTdCaXNzdWVfbnVtYmVyJTdEJTJGY29tbWVudHMlMjIlMEFyZXNwb25zZSUyMCUzRCUyMHJlcXVlc3RzLmdldCh1cmwlMkMlMjBoZWFkZXJzJTNEaGVhZGVycyklMEFyZXNwb25zZS5qc29uKCk=",highlighted:`issue_number = <span class="hljs-number">2792</span> | |
| url = <span class="hljs-string">f"https://api.github.com/repos/huggingface/datasets/issues/<span class="hljs-subst">{issue_number}</span>/comments"</span> | |
| response = requests.get(url, headers=headers) | |
| response.json()`,wrap:!1}}),Gs=new y({props:{code:"JTVCJTdCJ3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnJlcG9zJTJGaHVnZ2luZ2ZhY2UlMkZkYXRhc2V0cyUyRmlzc3VlcyUyRmNvbW1lbnRzJTJGODk3NTk0MTI4JyUyQyUwQSUyMCUyMCdodG1sX3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZnaXRodWIuY29tJTJGaHVnZ2luZ2ZhY2UlMkZkYXRhc2V0cyUyRnB1bGwlMkYyNzkyJTIzaXNzdWVjb21tZW50LTg5NzU5NDEyOCclMkMlMEElMjAlMjAnaXNzdWVfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmFwaS5naXRodWIuY29tJTJGcmVwb3MlMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGaXNzdWVzJTJGMjc5MiclMkMlMEElMjAlMjAnaWQnJTNBJTIwODk3NTk0MTI4JTJDJTBBJTIwJTIwJ25vZGVfaWQnJTNBJTIwJ0lDX2t3RE9EdW56cHM0MWdETVEnJTJDJTBBJTIwJTIwJ3VzZXInJTNBJTIwJTdCJ2xvZ2luJyUzQSUyMCdiaGF2aXR2eWFtYWxpayclMkMlMEElMjAlMjAlMjAnaWQnJTNBJTIwMTk3MTg4MTglMkMlMEElMjAlMjAlMjAnbm9kZV9pZCclM0ElMjAnTURRNlZYTmxjakU1TnpFNE9ERTQnJTJDJTBBJTIwJTIwJTIwJ2F2YXRhcl91cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGYXZhdGFycy5naXRodWJ1c2VyY29udGVudC5jb20lMkZ1JTJGMTk3MTg4MTglM0Z2JTNENCclMkMlMEElMjAlMjAlMjAnZ3JhdmF0YXJfaWQnJTNBJTIwJyclMkMlMEElMjAlMjAlMjAndXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmFwaS5naXRodWIuY29tJTJGdXNlcnMlMkZiaGF2aXR2eWFtYWxpayclMkMlMEElMjAlMjAlMjAnaHRtbF91cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGZ2l0aHViLmNvbSUyRmJoYXZpdHZ5YW1hbGlrJyUyQyUwQSUyMCUyMCUyMCdmb2xsb3dlcnNfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmFwaS5naXRodWIuY29tJTJGdXNlcnMlMkZiaGF2aXR2eWFtYWxpayUyRmZvbGxvd2VycyclMkMlMEElMjAlMjAlMjAnZm9sbG93aW5nX3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnVzZXJzJTJGYmhhdml0dnlhbWFsaWslMkZmb2xsb3dpbmclN0IlMkZvdGhlcl91c2VyJTdEJyUyQyUwQSUyMCUyMCUyMCdnaXN0c191cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGYXBpLmdpdGh1Yi5jb20lMkZ1c2VycyUyRmJoYXZpdHZ5YW1hbGlrJTJGZ2lzdHMlN0IlMkZnaXN0X2lkJTdEJyUyQyUwQSUyMCUyMCUyMCdzdGFycmVkX3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnVzZXJzJTJGYmhhdml0dnlhbWFsaWslMkZzdGFycmVkJTdCJTJGb3duZXIlN0QlN0IlMkZyZXBvJTdEJyUyQyUwQSUyMCUyMCUyMCdzdWJzY3JpcHRpb25zX3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnVzZXJzJTJGYmhhdml0dnlhbWFsaWslMkZzdWJzY3JpcHRpb25zJyUyQyUwQSUyMCUyMCUyMCdvcmdhbml6YXRpb25zX3VybCclM0E
lMjAnaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnVzZXJzJTJGYmhhdml0dnlhbWFsaWslMkZvcmdzJyUyQyUwQSUyMCUyMCUyMCdyZXBvc191cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGYXBpLmdpdGh1Yi5jb20lMkZ1c2VycyUyRmJoYXZpdHZ5YW1hbGlrJTJGcmVwb3MnJTJDJTBBJTIwJTIwJTIwJ2V2ZW50c191cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGYXBpLmdpdGh1Yi5jb20lMkZ1c2VycyUyRmJoYXZpdHZ5YW1hbGlrJTJGZXZlbnRzJTdCJTJGcHJpdmFjeSU3RCclMkMlMEElMjAlMjAlMjAncmVjZWl2ZWRfZXZlbnRzX3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnVzZXJzJTJGYmhhdml0dnlhbWFsaWslMkZyZWNlaXZlZF9ldmVudHMnJTJDJTBBJTIwJTIwJTIwJ3R5cGUnJTNBJTIwJ1VzZXInJTJDJTBBJTIwJTIwJTIwJ3NpdGVfYWRtaW4nJTNBJTIwRmFsc2UlN0QlMkMlMEElMjAlMjAnY3JlYXRlZF9hdCclM0ElMjAnMjAyMS0wOC0xMlQxMiUzQTIxJTNBNTJaJyUyQyUwQSUyMCUyMCd1cGRhdGVkX2F0JyUzQSUyMCcyMDIxLTA4LTEyVDEyJTNBMzElM0ExN1onJTJDJTBBJTIwJTIwJ2F1dGhvcl9hc3NvY2lhdGlvbiclM0ElMjAnQ09OVFJJQlVUT1InJTJDJTBBJTIwJTIwJ2JvZHknJTNBJTIwJTIyJTQwYWxiZXJ0dmlsbGFub3ZhJTIwbXklMjB0ZXN0cyUyMGFyZSUyMGZhaWxpbmclMjBoZXJlJTNBJTVDciU1Q24lNjAlNjAlNjAlNUNyJTVDbmRhdGFzZXRfbmFtZSUyMCUzRCUyMCdnb29hcSclNUNyJTVDbiU1Q3IlNUNuJTIwJTIwJTIwJTIwZGVmJTIwdGVzdF9sb2FkX2RhdGFzZXQoc2VsZiUyQyUyMGRhdGFzZXRfbmFtZSklM0ElNUNyJTVDbiUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMGNvbmZpZ3MlMjAlM0QlMjBzZWxmLmRhdGFzZXRfdGVzdGVyLmxvYWRfYWxsX2NvbmZpZ3MoZGF0YXNldF9uYW1lJTJDJTIwaXNfbG9jYWwlM0RUcnVlKSU1QiUzQTElNUQlNUNyJTVDbiUzRSUyMCUyMCUyMCUyMCUyMCUyMCUyMHNlbGYuZGF0YXNldF90ZXN0ZXIuY2hlY2tfbG9hZF9kYXRhc2V0KGRhdGFzZXRfbmFtZSUyQyUyMGNvbmZpZ3MlMkMlMjBpc19sb2NhbCUzRFRydWUlMkMlMjB1c2VfbG9jYWxfZHVtbXlfZGF0YSUzRFRydWUpJTVDciU1Q24lNUNyJTVDbnRlc3RzJTJGdGVzdF9kYXRhc2V0X2NvbW1vbi5weSUzQTIzNCUzQSUyMCU1Q3IlNUNuXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMCU1Q3IlNUNudGVzdHMlMkZ0ZXN0X2RhdGFzZXRfY29tbW9uLnB5JTNBMTg3JTNBJTIwaW4lMjBjaGVja19sb2FkX2RhdGFzZXQlNUNyJTVDbiUyMCUyMCUyMCUyMHNlbGYucGFyZW50LmFzc2VydFRydWUobGVuKGRhdGFzZXQlNUJzcGxpdCU1RCklMjAlM0UlMjAwKSU1Q3I
lNUNuRSUyMCUyMCUyMEFzc2VydGlvbkVycm9yJTNBJTIwRmFsc2UlMjBpcyUyMG5vdCUyMHRydWUlNUNyJTVDbiU2MCU2MCU2MCU1Q3IlNUNuV2hlbiUyMEklMjB0cnklMjBsb2FkaW5nJTIwZGF0YXNldCUyMG9uJTIwbG9jYWwlMjBtYWNoaW5lJTIwaXQlMjB3b3JrcyUyMGZpbmUuJTIwQW55JTIwc3VnZ2VzdGlvbnMlMjBvbiUyMGhvdyUyMGNhbiUyMEklMjBhdm9pZCUyMHRoaXMlMjBlcnJvciUzRiUyMiUyQyUwQSUyMCUyMCdwZXJmb3JtZWRfdmlhX2dpdGh1Yl9hcHAnJTNBJTIwTm9uZSU3RCU1RA==",highlighted:`[{<span class="hljs-string">'url'</span>: <span class="hljs-string">'https://api.github.com/repos/huggingface/datasets/issues/comments/897594128'</span>, | |
| <span class="hljs-string">'html_url'</span>: <span class="hljs-string">'https://github.com/huggingface/datasets/pull/2792#issuecomment-897594128'</span>, | |
| <span class="hljs-string">'issue_url'</span>: <span class="hljs-string">'https://api.github.com/repos/huggingface/datasets/issues/2792'</span>, | |
| <span class="hljs-string">'id'</span>: <span class="hljs-number">897594128</span>, | |
| <span class="hljs-string">'node_id'</span>: <span class="hljs-string">'IC_kwDODunzps41gDMQ'</span>, | |
| <span class="hljs-string">'user'</span>: {<span class="hljs-string">'login'</span>: <span class="hljs-string">'bhavitvyamalik'</span>, | |
| <span class="hljs-string">'id'</span>: <span class="hljs-number">19718818</span>, | |
| <span class="hljs-string">'node_id'</span>: <span class="hljs-string">'MDQ6VXNlcjE5NzE4ODE4'</span>, | |
| <span class="hljs-string">'avatar_url'</span>: <span class="hljs-string">'https://avatars.githubusercontent.com/u/19718818?v=4'</span>, | |
| <span class="hljs-string">'gravatar_id'</span>: <span class="hljs-string">''</span>, | |
| <span class="hljs-string">'url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik'</span>, | |
| <span class="hljs-string">'html_url'</span>: <span class="hljs-string">'https://github.com/bhavitvyamalik'</span>, | |
| <span class="hljs-string">'followers_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/followers'</span>, | |
| <span class="hljs-string">'following_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/following{/other_user}'</span>, | |
| <span class="hljs-string">'gists_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/gists{/gist_id}'</span>, | |
| <span class="hljs-string">'starred_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/starred{/owner}{/repo}'</span>, | |
| <span class="hljs-string">'subscriptions_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/subscriptions'</span>, | |
| <span class="hljs-string">'organizations_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/orgs'</span>, | |
| <span class="hljs-string">'repos_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/repos'</span>, | |
| <span class="hljs-string">'events_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/events{/privacy}'</span>, | |
| <span class="hljs-string">'received_events_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/received_events'</span>, | |
| <span class="hljs-string">'type'</span>: <span class="hljs-string">'User'</span>, | |
| <span class="hljs-string">'site_admin'</span>: <span class="hljs-literal">False</span>}, | |
| <span class="hljs-string">'created_at'</span>: <span class="hljs-string">'2021-08-12T12:21:52Z'</span>, | |
| <span class="hljs-string">'updated_at'</span>: <span class="hljs-string">'2021-08-12T12:31:17Z'</span>, | |
| <span class="hljs-string">'author_association'</span>: <span class="hljs-string">'CONTRIBUTOR'</span>, | |
| <span class="hljs-string">'body'</span>: <span class="hljs-string">"@albertvillanova my tests are failing here:\\r\\n\`\`\`\\r\\ndataset_name = 'gooaq'\\r\\n\\r\\n def test_load_dataset(self, dataset_name):\\r\\n configs = self.dataset_tester.load_all_configs(dataset_name, is_local=True)[:1]\\r\\n> self.dataset_tester.check_load_dataset(dataset_name, configs, is_local=True, use_local_dummy_data=True)\\r\\n\\r\\ntests/test_dataset_common.py:234: \\r\\n_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ \\r\\ntests/test_dataset_common.py:187: in check_load_dataset\\r\\n self.parent.assertTrue(len(dataset[split]) > 0)\\r\\nE AssertionError: False is not true\\r\\n\`\`\`\\r\\nWhen I try loading dataset on local machine it works fine. Any suggestions on how can I avoid this error?"</span>, | |
| <span class="hljs-string">'performed_via_github_app'</span>: <span class="hljs-literal">None</span>}]`,wrap:!1}}),Is=new y({props:{code:"ZGVmJTIwZ2V0X2NvbW1lbnRzKGlzc3VlX251bWJlciklM0ElMEElMjAlMjAlMjAlMjB1cmwlMjAlM0QlMjBmJTIyaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnJlcG9zJTJGaHVnZ2luZ2ZhY2UlMkZkYXRhc2V0cyUyRmlzc3VlcyUyRiU3Qmlzc3VlX251bWJlciU3RCUyRmNvbW1lbnRzJTIyJTBBJTIwJTIwJTIwJTIwcmVzcG9uc2UlMjAlM0QlMjByZXF1ZXN0cy5nZXQodXJsJTJDJTIwaGVhZGVycyUzRGhlYWRlcnMpJTBBJTIwJTIwJTIwJTIwcmV0dXJuJTIwJTVCciU1QiUyMmJvZHklMjIlNUQlMjBmb3IlMjByJTIwaW4lMjByZXNwb25zZS5qc29uKCklNUQlMEElMEElMEElMjMlMjBUZXN0aWFtbyUyMGxhJTIwbm9zdHJhJTIwZnVuemlvbmUlMEFnZXRfY29tbWVudHMoMjc5Mik=",highlighted:`<span class="hljs-keyword">def</span> <span class="hljs-title function_">get_comments</span>(<span class="hljs-params">issue_number</span>): | |
| url = <span class="hljs-string">f"https://api.github.com/repos/huggingface/datasets/issues/<span class="hljs-subst">{issue_number}</span>/comments"</span> | |
| response = requests.get(url, headers=headers) | |
| <span class="hljs-keyword">return</span> [r[<span class="hljs-string">"body"</span>] <span class="hljs-keyword">for</span> r <span class="hljs-keyword">in</span> response.json()] | |
| <span class="hljs-comment"># Testiamo la nostra funzione</span> | |
| get_comments(<span class="hljs-number">2792</span>)`,wrap:!1}}),zs=new y({props:{code:"JTVCJTIyJTQwYWxiZXJ0dmlsbGFub3ZhJTIwbXklMjB0ZXN0cyUyMGFyZSUyMGZhaWxpbmclMjBoZXJlJTNBJTVDciU1Q24lNjAlNjAlNjAlNUNyJTVDbmRhdGFzZXRfbmFtZSUyMCUzRCUyMCdnb29hcSclNUNyJTVDbiU1Q3IlNUNuJTIwJTIwJTIwJTIwZGVmJTIwdGVzdF9sb2FkX2RhdGFzZXQoc2VsZiUyQyUyMGRhdGFzZXRfbmFtZSklM0ElNUNyJTVDbiUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMGNvbmZpZ3MlMjAlM0QlMjBzZWxmLmRhdGFzZXRfdGVzdGVyLmxvYWRfYWxsX2NvbmZpZ3MoZGF0YXNldF9uYW1lJTJDJTIwaXNfbG9jYWwlM0RUcnVlKSU1QiUzQTElNUQlNUNyJTVDbiUzRSUyMCUyMCUyMCUyMCUyMCUyMCUyMHNlbGYuZGF0YXNldF90ZXN0ZXIuY2hlY2tfbG9hZF9kYXRhc2V0KGRhdGFzZXRfbmFtZSUyQyUyMGNvbmZpZ3MlMkMlMjBpc19sb2NhbCUzRFRydWUlMkMlMjB1c2VfbG9jYWxfZHVtbXlfZGF0YSUzRFRydWUpJTVDciU1Q24lNUNyJTVDbnRlc3RzJTJGdGVzdF9kYXRhc2V0X2NvbW1vbi5weSUzQTIzNCUzQSUyMCU1Q3IlNUNuXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMCU1Q3IlNUNudGVzdHMlMkZ0ZXN0X2RhdGFzZXRfY29tbW9uLnB5JTNBMTg3JTNBJTIwaW4lMjBjaGVja19sb2FkX2RhdGFzZXQlNUNyJTVDbiUyMCUyMCUyMCUyMHNlbGYucGFyZW50LmFzc2VydFRydWUobGVuKGRhdGFzZXQlNUJzcGxpdCU1RCklMjAlM0UlMjAwKSU1Q3IlNUNuRSUyMCUyMCUyMEFzc2VydGlvbkVycm9yJTNBJTIwRmFsc2UlMjBpcyUyMG5vdCUyMHRydWUlNUNyJTVDbiU2MCU2MCU2MCU1Q3IlNUNuV2hlbiUyMEklMjB0cnklMjBsb2FkaW5nJTIwZGF0YXNldCUyMG9uJTIwbG9jYWwlMjBtYWNoaW5lJTIwaXQlMjB3b3JrcyUyMGZpbmUuJTIwQW55JTIwc3VnZ2VzdGlvbnMlMjBvbiUyMGhvdyUyMGNhbiUyMEklMjBhdm9pZCUyMHRoaXMlMjBlcnJvciUzRiUyMiU1RA==",highlighted:'[<span class="hljs-string">"@albertvillanova my tests are failing here:\\r\\n```\\r\\ndataset_name = 'gooaq'\\r\\n\\r\\n def test_load_dataset(self, dataset_name):\\r\\n configs = self.dataset_tester.load_all_configs(dataset_name, is_local=True)[:1]\\r\\n> self.dataset_tester.check_load_dataset(dataset_name, configs, is_local=True, use_local_dummy_data=True)\\r\\n\\r\\ntests/test_dataset_common.py:234: \\r\\n_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ \\r\\ntests/test_dataset_common.py:187: in check_load_dataset\\r\\n self.parent.assertTrue(len(dataset[split]) > 0)\\r\\nE AssertionError: False is not true\\r\\n```\\r\\nWhen I try loading dataset on local machine it works fine. Any suggestions on how can I avoid this error?"</span>]',wrap:!1}}),Xs=new y({props:{code:"JTIzJTIwQSUyMHNlY29uZGElMjBkZWxsYSUyMHR1YSUyMGNvbm5lc3Npb25lJTJDJTIwcG90cmViYmUlMjB2b2xlcmNpJTIwcXVhbGNoZSUyMHNlY29uZG8uLi4lMEFpc3N1ZXNfd2l0aF9jb21tZW50c19kYXRhc2V0JTIwJTNEJTIwaXNzdWVzX2RhdGFzZXQubWFwKCUwQSUyMCUyMCUyMCUyMGxhbWJkYSUyMHglM0ElMjAlN0IlMjJjb21tZW50cyUyMiUzQSUyMGdldF9jb21tZW50cyh4JTVCJTIybnVtYmVyJTIyJTVEKSU3RCUwQSk=",highlighted:`<span class="hljs-comment"># A seconda della tua connessione, potrebbe volerci qualche secondo...</span> | |
| issues_with_comments_dataset = issues_dataset.<span class="hljs-built_in">map</span>( | |
| <span class="hljs-keyword">lambda</span> x: {<span class="hljs-string">"comments"</span>: get_comments(x[<span class="hljs-string">"number"</span>])} | |
| )`,wrap:!1}}),Ns=new y({props:{code:"aXNzdWVzX3dpdGhfY29tbWVudHNfZGF0YXNldC50b19qc29uKCUyMmlzc3Vlcy1kYXRhc2V0cy13aXRoLWNvbW1lbnRzLmpzb25sJTIyKQ==",highlighted:'issues_with_comments_dataset.to_json(<span class="hljs-string">"issues-datasets-with-comments.jsonl"</span>)',wrap:!1}}),_s=new Je({props:{title:"Caricare il dataset sull’Hub Hugging Face",local:"caricare-il-dataset-sullhub-hugging-face",headingTag:"h2"}}),ks=new jt({props:{id:"HaN6qCr_Afc"}}),$s=new y({props:{code:"ZnJvbSUyMGh1Z2dpbmdmYWNlX2h1YiUyMGltcG9ydCUyMGxpc3RfZGF0YXNldHMlMEElMEFhbGxfZGF0YXNldHMlMjAlM0QlMjBsaXN0X2RhdGFzZXRzKCklMEFwcmludChmJTIyTnVtYmVyJTIwb2YlMjBkYXRhc2V0cyUyMG9uJTIwSHViJTNBJTIwJTdCbGVuKGFsbF9kYXRhc2V0cyklN0QlMjIpJTBBcHJpbnQoYWxsX2RhdGFzZXRzJTVCMCU1RCk=",highlighted:`<span class="hljs-keyword">from</span> huggingface_hub <span class="hljs-keyword">import</span> list_datasets | |
| all_datasets = list_datasets() | |
| <span class="hljs-built_in">print</span>(<span class="hljs-string">f"Number of datasets on Hub: <span class="hljs-subst">{<span class="hljs-built_in">len</span>(all_datasets)}</span>"</span>) | |
| <span class="hljs-built_in">print</span>(all_datasets[<span class="hljs-number">0</span>])`,wrap:!1}}),Bs=new y({props:{code:"TnVtYmVyJTIwb2YlMjBkYXRhc2V0cyUyMG9uJTIwSHViJTNBJTIwMTQ4NyUwQURhdGFzZXQlMjBOYW1lJTNBJTIwYWNyb255bV9pZGVudGlmaWNhdGlvbiUyQyUyMFRhZ3MlM0ElMjAlNUInYW5ub3RhdGlvbnNfY3JlYXRvcnMlM0FleHBlcnQtZ2VuZXJhdGVkJyUyQyUyMCdsYW5ndWFnZV9jcmVhdG9ycyUzQWZvdW5kJyUyQyUyMCdsYW5ndWFnZXMlM0FlbiclMkMlMjAnbGljZW5zZXMlM0FtaXQnJTJDJTIwJ211bHRpbGluZ3VhbGl0eSUzQW1vbm9saW5ndWFsJyUyQyUyMCdzaXplX2NhdGVnb3JpZXMlM0ExMEslM0NuJTNDMTAwSyclMkMlMjAnc291cmNlX2RhdGFzZXRzJTNBb3JpZ2luYWwnJTJDJTIwJ3Rhc2tfY2F0ZWdvcmllcyUzQXN0cnVjdHVyZS1wcmVkaWN0aW9uJyUyQyUyMCd0YXNrX2lkcyUzQXN0cnVjdHVyZS1wcmVkaWN0aW9uLW90aGVyLWFjcm9ueW0taWRlbnRpZmljYXRpb24nJTVE",highlighted:`Number of datasets on Hub: <span class="hljs-number">1487</span> | |
| Dataset Name: acronym_identification, Tags: [<span class="hljs-string">'annotations_creators:expert-generated'</span>, <span class="hljs-string">'language_creators:found'</span>, <span class="hljs-string">'languages:en'</span>, <span class="hljs-string">'licenses:mit'</span>, <span class="hljs-string">'multilinguality:monolingual'</span>, <span class="hljs-string">'size_categories:10K<n<100K'</span>, <span class="hljs-string">'source_datasets:original'</span>, <span class="hljs-string">'task_categories:structure-prediction'</span>, <span class="hljs-string">'task_ids:structure-prediction-other-acronym-identification'</span>]`,wrap:!1}}),Ys=new y({props:{code:"ZnJvbSUyMGh1Z2dpbmdmYWNlX2h1YiUyMGltcG9ydCUyMG5vdGVib29rX2xvZ2luJTBBJTBBbm90ZWJvb2tfbG9naW4oKQ==",highlighted:`<span class="hljs-keyword">from</span> huggingface_hub <span class="hljs-keyword">import</span> notebook_login | |
| notebook_login()`,wrap:!1}}),Qs=new y({props:{code:"aHVnZ2luZ2ZhY2UtY2xpJTIwbG9naW4=",highlighted:"huggingface-cli login",wrap:!1}}),Ss=new y({props:{code:"ZnJvbSUyMGh1Z2dpbmdmYWNlX2h1YiUyMGltcG9ydCUyMGNyZWF0ZV9yZXBvJTBBJTBBcmVwb191cmwlMjAlM0QlMjBjcmVhdGVfcmVwbyhuYW1lJTNEJTIyZ2l0aHViLWlzc3VlcyUyMiUyQyUyMHJlcG9fdHlwZSUzRCUyMmRhdGFzZXQlMjIpJTBBcmVwb191cmw=",highlighted:`<span class="hljs-keyword">from</span> huggingface_hub <span class="hljs-keyword">import</span> create_repo | |
| repo_url = create_repo(name=<span class="hljs-string">"github-issues"</span>, repo_type=<span class="hljs-string">"dataset"</span>) | |
| repo_url`,wrap:!1}}),As=new y({props:{code:"J2h0dHBzJTNBJTJGJTJGaHVnZ2luZ2ZhY2UuY28lMkZkYXRhc2V0cyUyRmxld3R1biUyRmdpdGh1Yi1pc3N1ZXMn",highlighted:'<span class="hljs-string">'https://huggingface.co/datasets/lewtun/github-issues'</span>',wrap:!1}}),R=new Me({props:{$$slots:{default:[Gt]},$$scope:{ctx:g}}}),Ds=new y({props:{code:"ZnJvbSUyMGh1Z2dpbmdmYWNlX2h1YiUyMGltcG9ydCUyMFJlcG9zaXRvcnklMEElMEFyZXBvJTIwJTNEJTIwUmVwb3NpdG9yeShsb2NhbF9kaXIlM0QlMjJnaXRodWItaXNzdWVzJTIyJTJDJTIwY2xvbmVfZnJvbSUzRHJlcG9fdXJsKSUwQSFjcCUyMGlzc3Vlcy1kYXRhc2V0cy13aXRoLWNvbW1lbnRzLmpzb25sJTIwZ2l0aHViLWlzc3VlcyUyRg==",highlighted:`<span class="hljs-keyword">from</span> huggingface_hub <span class="hljs-keyword">import</span> Repository | |
| repo = Repository(local_dir=<span class="hljs-string">"github-issues"</span>, clone_from=repo_url) | |
| !cp issues-datasets-<span class="hljs-keyword">with</span>-comments.jsonl github-issues/`,wrap:!1}}),Os=new y({props:{code:"cmVwby5sZnNfdHJhY2soJTIyKi5qc29ubCUyMik=",highlighted:'repo.lfs_track(<span class="hljs-string">"*.jsonl"</span>)',wrap:!1}}),se=new y({props:{code:"cmVwby5wdXNoX3RvX2h1Yigp",highlighted:"repo.push_to_hub()",wrap:!1}}),ae=new y({props:{code:"cmVtb3RlX2RhdGFzZXQlMjAlM0QlMjBsb2FkX2RhdGFzZXQoJTIybGV3dHVuJTJGZ2l0aHViLWlzc3VlcyUyMiUyQyUyMHNwbGl0JTNEJTIydHJhaW4lMjIpJTBBcmVtb3RlX2RhdGFzZXQ=",highlighted:`remote_dataset = load_dataset(<span class="hljs-string">"lewtun/github-issues"</span>, split=<span class="hljs-string">"train"</span>) | |
| remote_dataset`,wrap:!1}}),te=new y({props:{code:"RGF0YXNldCglN0IlMEElMjAlMjAlMjAlMjBmZWF0dXJlcyUzQSUyMCU1Qid1cmwnJTJDJTIwJ3JlcG9zaXRvcnlfdXJsJyUyQyUyMCdsYWJlbHNfdXJsJyUyQyUyMCdjb21tZW50c191cmwnJTJDJTIwJ2V2ZW50c191cmwnJTJDJTIwJ2h0bWxfdXJsJyUyQyUyMCdpZCclMkMlMjAnbm9kZV9pZCclMkMlMjAnbnVtYmVyJyUyQyUyMCd0aXRsZSclMkMlMjAndXNlciclMkMlMjAnbGFiZWxzJyUyQyUyMCdzdGF0ZSclMkMlMjAnbG9ja2VkJyUyQyUyMCdhc3NpZ25lZSclMkMlMjAnYXNzaWduZWVzJyUyQyUyMCdtaWxlc3RvbmUnJTJDJTIwJ2NvbW1lbnRzJyUyQyUyMCdjcmVhdGVkX2F0JyUyQyUyMCd1cGRhdGVkX2F0JyUyQyUyMCdjbG9zZWRfYXQnJTJDJTIwJ2F1dGhvcl9hc3NvY2lhdGlvbiclMkMlMjAnYWN0aXZlX2xvY2tfcmVhc29uJyUyQyUyMCdwdWxsX3JlcXVlc3QnJTJDJTIwJ2JvZHknJTJDJTIwJ3BlcmZvcm1lZF92aWFfZ2l0aHViX2FwcCclMkMlMjAnaXNfcHVsbF9yZXF1ZXN0JyU1RCUyQyUwQSUyMCUyMCUyMCUyMG51bV9yb3dzJTNBJTIwMjg1NSUwQSU3RCk=",highlighted:`Dataset({ | |
| features: [<span class="hljs-string">'url'</span>, <span class="hljs-string">'repository_url'</span>, <span class="hljs-string">'labels_url'</span>, <span class="hljs-string">'comments_url'</span>, <span class="hljs-string">'events_url'</span>, <span class="hljs-string">'html_url'</span>, <span class="hljs-string">'id'</span>, <span class="hljs-string">'node_id'</span>, <span class="hljs-string">'number'</span>, <span class="hljs-string">'title'</span>, <span class="hljs-string">'user'</span>, <span class="hljs-string">'labels'</span>, <span class="hljs-string">'state'</span>, <span class="hljs-string">'locked'</span>, <span class="hljs-string">'assignee'</span>, <span class="hljs-string">'assignees'</span>, <span class="hljs-string">'milestone'</span>, <span class="hljs-string">'comments'</span>, <span class="hljs-string">'created_at'</span>, <span class="hljs-string">'updated_at'</span>, <span class="hljs-string">'closed_at'</span>, <span class="hljs-string">'author_association'</span>, <span class="hljs-string">'active_lock_reason'</span>, <span class="hljs-string">'pull_request'</span>, <span class="hljs-string">'body'</span>, <span class="hljs-string">'performed_via_github_app'</span>, <span class="hljs-string">'is_pull_request'</span>], | |
| num_rows: <span class="hljs-number">2855</span> | |
| })`,wrap:!1}}),z=new Me({props:{$$slots:{default:[Rt]},$$scope:{ctx:g}}}),ie=new Je({props:{title:"Creare una dataset card",local:"creare-una-dataset-card",headingTag:"h2"}}),N=new Me({props:{$$slots:{default:[It]},$$scope:{ctx:g}}}),_=new Me({props:{$$slots:{default:[zt]},$$scope:{ctx:g}}}),de=new ft({props:{source:"https://github.com/huggingface/course/blob/main/chapters/it/chapter5/5.mdx"}}),{c(){i=p("meta"),T=t(),o=p("p"),U=t(),u(k.$$.fragment),ye=t(),u(V.$$.fragment),Te=t(),$=p("p"),$.innerHTML=ra,Ue=t(),B=p("ul"),B.innerHTML=oa,ge=t(),H=p("p"),H.textContent=ua,je=t(),u(W.$$.fragment),be=t(),Y=p("p"),Y.innerHTML=da,fe=t(),b=p("div"),b.innerHTML=Ma,we=t(),F=p("p"),F.textContent=ma,xe=t(),f=p("div"),f.innerHTML=Ja,Ze=t(),Q=p("p"),Q.innerHTML=ha,Ge=t(),E=p("p"),E.innerHTML=ya,Re=t(),u(S.$$.fragment),Ie=t(),A=p("p"),A.innerHTML=Ta,ze=t(),u(L.$$.fragment),Ce=t(),q=p("p"),q.innerHTML=Ua,Xe=t(),u(D.$$.fragment),ve=t(),u(P.$$.fragment),Ne=t(),O=p("p"),O.innerHTML=ga,_e=t(),u(K.$$.fragment),ke=t(),u(ss.$$.fragment),Ve=t(),es=p("p"),es.innerHTML=ja,$e=t(),u(w.$$.fragment),Be=t(),ls=p("p"),ls.innerHTML=ba,He=t(),u(as.$$.fragment),We=t(),u(x.$$.fragment),Ye=t(),ts=p("p"),ts.textContent=fa,Fe=t(),u(ns.$$.fragment),Qe=t(),is=p("p"),is.innerHTML=wa,Ee=t(),u(ps.$$.fragment),Se=t(),cs=p("p"),cs.innerHTML=xa,Ae=t(),u(rs.$$.fragment),Le=t(),u(os.$$.fragment),qe=t(),us=p("p"),us.innerHTML=Za,De=t(),ds=p("blockquote"),ds.innerHTML=Ga,Pe=t(),Ms=p("p"),Ms.innerHTML=Ra,Oe=t(),ms=p("p"),ms.textContent=Ia,Ke=t(),u(Js.$$.fragment),sl=t(),hs=p("p"),hs.innerHTML=za,el=t(),u(ys.$$.fragment),ll=t(),u(Ts.$$.fragment),al=t(),Us=p("p"),Us.innerHTML=Ca,tl=t(),u(gs.$$.fragment),nl=t(),u(Z.$$.fragment),il=t(),js=p("p"),js.textContent=Xa,pl=t(),bs=p("p"),bs.textContent=va,cl=t(),u(fs.$$.fragment),rl=t(),ws=p("p"),ws.textContent=Na,ol=t(),G=p("div"),G.innerHTML=_a,ul=t(),xs=p("p"),xs.innerHTML=ka,dl=t(),u(Zs.$$.fragment),Ml=t(),u(Gs.$$.fragment),ml=t(),Rs=p("p"),Rs.innerHTML=Va,Jl=t(),u(Is.$$.frag
ment),hl=t(),u(zs.$$.fragment),yl=t(),Cs=p("p"),Cs.innerHTML=$a,Tl=t(),u(Xs.$$.fragment),Ul=t(),vs=p("p"),vs.textContent=Ba,gl=t(),u(Ns.$$.fragment),jl=t(),u(_s.$$.fragment),bl=t(),u(ks.$$.fragment),fl=t(),Vs=p("p"),Vs.innerHTML=Ha,wl=t(),u($s.$$.fragment),xl=t(),u(Bs.$$.fragment),Zl=t(),Hs=p("p"),Hs.innerHTML=Wa,Gl=t(),Ws=p("p"),Ws.innerHTML=Ya,Rl=t(),u(Ys.$$.fragment),Il=t(),Fs=p("p"),Fs.innerHTML=Fa,zl=t(),u(Qs.$$.fragment),Cl=t(),Es=p("p"),Es.innerHTML=Qa,Xl=t(),u(Ss.$$.fragment),vl=t(),u(As.$$.fragment),Nl=t(),Ls=p("p"),Ls.innerHTML=Ea,_l=t(),u(R.$$.fragment),kl=t(),qs=p("p"),qs.innerHTML=Sa,Vl=t(),u(Ds.$$.fragment),$l=t(),Ps=p("p"),Ps.innerHTML=Aa,Bl=t(),u(Os.$$.fragment),Hl=t(),Ks=p("p"),Ks.innerHTML=La,Wl=t(),u(se.$$.fragment),Yl=t(),ee=p("p"),ee.innerHTML=qa,Fl=t(),I=p("div"),I.innerHTML=Da,Ql=t(),le=p("p"),le.innerHTML=Pa,El=t(),u(ae.$$.fragment),Sl=t(),u(te.$$.fragment),Al=t(),ne=p("p"),ne.innerHTML=Oa,Ll=t(),u(z.$$.fragment),ql=t(),u(ie.$$.fragment),Dl=t(),pe=p("p"),pe.textContent=Ka,Pl=t(),ce=p("p"),ce.innerHTML=st,Ol=t(),re=p("ol"),re.innerHTML=et,Kl=t(),C=p("div"),C.innerHTML=lt,sa=t(),X=p("ol"),X.innerHTML=at,ea=t(),oe=p("p"),oe.innerHTML=tt,la=t(),v=p("div"),v.innerHTML=nt,aa=t(),u(N.$$.fragment),ta=t(),ue=p("p"),ue.textContent=it,na=t(),u(_.$$.fragment),ia=t(),u(de.$$.fragment),pa=t(),he=p("p"),this.h()},l(s){const 
e=Ut("svelte-u9bgzb",document.head);i=c(e,"META",{name:!0,content:!0}),e.forEach(l),T=n(s),o=c(s,"P",{}),mt(o).forEach(l),U=n(s),d(k.$$.fragment,s),ye=n(s),d(V.$$.fragment,s),Te=n(s),$=c(s,"P",{"data-svelte-h":!0}),r($)!=="svelte-1h3t35x"&&($.innerHTML=ra),Ue=n(s),B=c(s,"UL",{"data-svelte-h":!0}),r(B)!=="svelte-qe2w3o"&&(B.innerHTML=oa),ge=n(s),H=c(s,"P",{"data-svelte-h":!0}),r(H)!=="svelte-dydfa0"&&(H.textContent=ua),je=n(s),d(W.$$.fragment,s),be=n(s),Y=c(s,"P",{"data-svelte-h":!0}),r(Y)!=="svelte-190qwz0"&&(Y.innerHTML=da),fe=n(s),b=c(s,"DIV",{class:!0,"data-svelte-h":!0}),r(b)!=="svelte-1htetkm"&&(b.innerHTML=Ma),we=n(s),F=c(s,"P",{"data-svelte-h":!0}),r(F)!=="svelte-1yipl9d"&&(F.textContent=ma),xe=n(s),f=c(s,"DIV",{class:!0,"data-svelte-h":!0}),r(f)!=="svelte-1jsgvzc"&&(f.innerHTML=Ja),Ze=n(s),Q=c(s,"P",{"data-svelte-h":!0}),r(Q)!=="svelte-17sk5bj"&&(Q.innerHTML=ha),Ge=n(s),E=c(s,"P",{"data-svelte-h":!0}),r(E)!=="svelte-58mesu"&&(E.innerHTML=ya),Re=n(s),d(S.$$.fragment,s),Ie=n(s),A=c(s,"P",{"data-svelte-h":!0}),r(A)!=="svelte-linx15"&&(A.innerHTML=Ta),ze=n(s),d(L.$$.fragment,s),Ce=n(s),q=c(s,"P",{"data-svelte-h":!0}),r(q)!=="svelte-hwpfvr"&&(q.innerHTML=Ua),Xe=n(s),d(D.$$.fragment,s),ve=n(s),d(P.$$.fragment,s),Ne=n(s),O=c(s,"P",{"data-svelte-h":!0}),r(O)!=="svelte-n5f90"&&(O.innerHTML=ga),_e=n(s),d(K.$$.fragment,s),ke=n(s),d(ss.$$.fragment,s),Ve=n(s),es=c(s,"P",{"data-svelte-h":!0}),r(es)!=="svelte-bmsgi4"&&(es.innerHTML=ja),$e=n(s),d(w.$$.fragment,s),Be=n(s),ls=c(s,"P",{"data-svelte-h":!0}),r(ls)!=="svelte-jjlpsx"&&(ls.innerHTML=ba),He=n(s),d(as.$$.fragment,s),We=n(s),d(x.$$.fragment,s),Ye=n(s),ts=c(s,"P",{"data-svelte-h":!0}),r(ts)!=="svelte-ge0v0t"&&(ts.textContent=fa),Fe=n(s),d(ns.$$.fragment,s),Qe=n(s),is=c(s,"P",{"data-svelte-h":!0}),r(is)!=="svelte-12lrurn"&&(is.innerHTML=wa),Ee=n(s),d(ps.$$.fragment,s),Se=n(s),cs=c(s,"P",{"data-svelte-h":!0}),r(cs)!=="svelte-1fepqzy"&&(cs.innerHTML=xa),Ae=n(s),d(rs.$$.fragment,s),Le=n(s),d(os.$$.fragment,s),qe=n(s),us=c(
s,"P",{"data-svelte-h":!0}),r(us)!=="svelte-1wbhe20"&&(us.innerHTML=Za),De=n(s),ds=c(s,"BLOCKQUOTE",{"data-svelte-h":!0}),r(ds)!=="svelte-165ve2g"&&(ds.innerHTML=Ga),Pe=n(s),Ms=c(s,"P",{"data-svelte-h":!0}),r(Ms)!=="svelte-17d1r3t"&&(Ms.innerHTML=Ra),Oe=n(s),ms=c(s,"P",{"data-svelte-h":!0}),r(ms)!=="svelte-1uhjti4"&&(ms.textContent=Ia),Ke=n(s),d(Js.$$.fragment,s),sl=n(s),hs=c(s,"P",{"data-svelte-h":!0}),r(hs)!=="svelte-5irsew"&&(hs.innerHTML=za),el=n(s),d(ys.$$.fragment,s),ll=n(s),d(Ts.$$.fragment,s),al=n(s),Us=c(s,"P",{"data-svelte-h":!0}),r(Us)!=="svelte-196qdbm"&&(Us.innerHTML=Ca),tl=n(s),d(gs.$$.fragment,s),nl=n(s),d(Z.$$.fragment,s),il=n(s),js=c(s,"P",{"data-svelte-h":!0}),r(js)!=="svelte-1e9tu80"&&(js.textContent=Xa),pl=n(s),bs=c(s,"P",{"data-svelte-h":!0}),r(bs)!=="svelte-z2nyet"&&(bs.textContent=va),cl=n(s),d(fs.$$.fragment,s),rl=n(s),ws=c(s,"P",{"data-svelte-h":!0}),r(ws)!=="svelte-ywuirq"&&(ws.textContent=Na),ol=n(s),G=c(s,"DIV",{class:!0,"data-svelte-h":!0}),r(G)!=="svelte-1fxxwaz"&&(G.innerHTML=_a),ul=n(s),xs=c(s,"P",{"data-svelte-h":!0}),r(xs)!=="svelte-q4eegl"&&(xs.innerHTML=ka),dl=n(s),d(Zs.$$.fragment,s),Ml=n(s),d(Gs.$$.fragment,s),ml=n(s),Rs=c(s,"P",{"data-svelte-h":!0}),r(Rs)!=="svelte-69hg6q"&&(Rs.innerHTML=Va),Jl=n(s),d(Is.$$.fragment,s),hl=n(s),d(zs.$$.fragment,s),yl=n(s),Cs=c(s,"P",{"data-svelte-h":!0}),r(Cs)!=="svelte-1bt9zz6"&&(Cs.innerHTML=$a),Tl=n(s),d(Xs.$$.fragment,s),Ul=n(s),vs=c(s,"P",{"data-svelte-h":!0}),r(vs)!=="svelte-1bdvuzp"&&(vs.textContent=Ba),gl=n(s),d(Ns.$$.fragment,s),jl=n(s),d(_s.$$.fragment,s),bl=n(s),d(ks.$$.fragment,s),fl=n(s),Vs=c(s,"P",{"data-svelte-h":!0}),r(Vs)!=="svelte-wrr7o5"&&(Vs.innerHTML=Ha),wl=n(s),d($s.$$.fragment,s),xl=n(s),d(Bs.$$.fragment,s),Zl=n(s),Hs=c(s,"P",{"data-svelte-h":!0}),r(Hs)!=="svelte-1sbkpb8"&&(Hs.innerHTML=Wa),Gl=n(s),Ws=c(s,"P",{"data-svelte-h":!0}),r(Ws)!=="svelte-1x1iq75"&&(Ws.innerHTML=Ya),Rl=n(s),d(Ys.$$.fragment,s),Il=n(s),Fs=c(s,"P",{"data-svelte-h":!0}),r(Fs)!=="svelte-fkm3k"&&(Fs.inn
erHTML=Fa),zl=n(s),d(Qs.$$.fragment,s),Cl=n(s),Es=c(s,"P",{"data-svelte-h":!0}),r(Es)!=="svelte-1q0q1uc"&&(Es.innerHTML=Qa),Xl=n(s),d(Ss.$$.fragment,s),vl=n(s),d(As.$$.fragment,s),Nl=n(s),Ls=c(s,"P",{"data-svelte-h":!0}),r(Ls)!=="svelte-1ro7sli"&&(Ls.innerHTML=Ea),_l=n(s),d(R.$$.fragment,s),kl=n(s),qs=c(s,"P",{"data-svelte-h":!0}),r(qs)!=="svelte-axrgi"&&(qs.innerHTML=Sa),Vl=n(s),d(Ds.$$.fragment,s),$l=n(s),Ps=c(s,"P",{"data-svelte-h":!0}),r(Ps)!=="svelte-1tfh3nd"&&(Ps.innerHTML=Aa),Bl=n(s),d(Os.$$.fragment,s),Hl=n(s),Ks=c(s,"P",{"data-svelte-h":!0}),r(Ks)!=="svelte-119nihd"&&(Ks.innerHTML=La),Wl=n(s),d(se.$$.fragment,s),Yl=n(s),ee=c(s,"P",{"data-svelte-h":!0}),r(ee)!=="svelte-f7bnod"&&(ee.innerHTML=qa),Fl=n(s),I=c(s,"DIV",{class:!0,"data-svelte-h":!0}),r(I)!=="svelte-18puw29"&&(I.innerHTML=Da),Ql=n(s),le=c(s,"P",{"data-svelte-h":!0}),r(le)!=="svelte-fxrj9t"&&(le.innerHTML=Pa),El=n(s),d(ae.$$.fragment,s),Sl=n(s),d(te.$$.fragment,s),Al=n(s),ne=c(s,"P",{"data-svelte-h":!0}),r(ne)!=="svelte-1woaiq9"&&(ne.innerHTML=Oa),Ll=n(s),d(z.$$.fragment,s),ql=n(s),d(ie.$$.fragment,s),Dl=n(s),pe=c(s,"P",{"data-svelte-h":!0}),r(pe)!=="svelte-vxtenw"&&(pe.textContent=Ka),Pl=n(s),ce=c(s,"P",{"data-svelte-h":!0}),r(ce)!=="svelte-krhhu0"&&(ce.innerHTML=st),Ol=n(s),re=c(s,"OL",{"data-svelte-h":!0}),r(re)!=="svelte-12j1wif"&&(re.innerHTML=et),Kl=n(s),C=c(s,"DIV",{class:!0,"data-svelte-h":!0}),r(C)!=="svelte-1gqifn5"&&(C.innerHTML=lt),sa=n(s),X=c(s,"OL",{start:!0,"data-svelte-h":!0}),r(X)!=="svelte-16lcu59"&&(X.innerHTML=at),ea=n(s),oe=c(s,"P",{"data-svelte-h":!0}),r(oe)!=="svelte-1qxc0rz"&&(oe.innerHTML=tt),la=n(s),v=c(s,"DIV",{class:!0,"data-svelte-h":!0}),r(v)!=="svelte-ct1wn8"&&(v.innerHTML=nt),aa=n(s),d(N.$$.fragment,s),ta=n(s),ue=c(s,"P",{"data-svelte-h":!0}),r(ue)!=="svelte-kroznp"&&(ue.textContent=it),na=n(s),d(_.$$.fragment,s),ia=n(s),d(de.$$.fragment,s),pa=n(s),he=c(s,"P",{}),mt(he).forEach(l),this.h()},h(){j(i,"name","hf:doc:metadata"),j(i,"content",Xt),j(b,"class","flex 
justify-center"),j(f,"class","flex justify-center"),j(G,"class","flex justify-center"),j(I,"class","flex justify-center"),j(C,"class","flex justify-center"),j(X,"start","2"),j(v,"class","flex justify-center")},m(s,e){gt(document.head,i),a(s,T,e),a(s,o,e),a(s,U,e),M(k,s,e),a(s,ye,e),M(V,s,e),a(s,Te,e),a(s,$,e),a(s,Ue,e),a(s,B,e),a(s,ge,e),a(s,H,e),a(s,je,e),M(W,s,e),a(s,be,e),a(s,Y,e),a(s,fe,e),a(s,b,e),a(s,we,e),a(s,F,e),a(s,xe,e),a(s,f,e),a(s,Ze,e),a(s,Q,e),a(s,Ge,e),a(s,E,e),a(s,Re,e),M(S,s,e),a(s,Ie,e),a(s,A,e),a(s,ze,e),M(L,s,e),a(s,Ce,e),a(s,q,e),a(s,Xe,e),M(D,s,e),a(s,ve,e),M(P,s,e),a(s,Ne,e),a(s,O,e),a(s,_e,e),M(K,s,e),a(s,ke,e),M(ss,s,e),a(s,Ve,e),a(s,es,e),a(s,$e,e),M(w,s,e),a(s,Be,e),a(s,ls,e),a(s,He,e),M(as,s,e),a(s,We,e),M(x,s,e),a(s,Ye,e),a(s,ts,e),a(s,Fe,e),M(ns,s,e),a(s,Qe,e),a(s,is,e),a(s,Ee,e),M(ps,s,e),a(s,Se,e),a(s,cs,e),a(s,Ae,e),M(rs,s,e),a(s,Le,e),M(os,s,e),a(s,qe,e),a(s,us,e),a(s,De,e),a(s,ds,e),a(s,Pe,e),a(s,Ms,e),a(s,Oe,e),a(s,ms,e),a(s,Ke,e),M(Js,s,e),a(s,sl,e),a(s,hs,e),a(s,el,e),M(ys,s,e),a(s,ll,e),M(Ts,s,e),a(s,al,e),a(s,Us,e),a(s,tl,e),M(gs,s,e),a(s,nl,e),M(Z,s,e),a(s,il,e),a(s,js,e),a(s,pl,e),a(s,bs,e),a(s,cl,e),M(fs,s,e),a(s,rl,e),a(s,ws,e),a(s,ol,e),a(s,G,e),a(s,ul,e),a(s,xs,e),a(s,dl,e),M(Zs,s,e),a(s,Ml,e),M(Gs,s,e),a(s,ml,e),a(s,Rs,e),a(s,Jl,e),M(Is,s,e),a(s,hl,e),M(zs,s,e),a(s,yl,e),a(s,Cs,e),a(s,Tl,e),M(Xs,s,e),a(s,Ul,e),a(s,vs,e),a(s,gl,e),M(Ns,s,e),a(s,jl,e),M(_s,s,e),a(s,bl,e),M(ks,s,e),a(s,fl,e),a(s,Vs,e),a(s,wl,e),M($s,s,e),a(s,xl,e),M(Bs,s,e),a(s,Zl,e),a(s,Hs,e),a(s,Gl,e),a(s,Ws,e),a(s,Rl,e),M(Ys,s,e),a(s,Il,e),a(s,Fs,e),a(s,zl,e),M(Qs,s,e),a(s,Cl,e),a(s,Es,e),a(s,Xl,e),M(Ss,s,e),a(s,vl,e),M(As,s,e),a(s,Nl,e),a(s,Ls,e),a(s,_l,e),M(R,s,e),a(s,kl,e),a(s,qs,e),a(s,Vl,e),M(Ds,s,e),a(s,$l,e),a(s,Ps,e),a(s,Bl,e),M(Os,s,e),a(s,Hl,e),a(s,Ks,e),a(s,Wl,e),M(se,s,e),a(s,Yl,e),a(s,ee,e),a(s,Fl,e),a(s,I,e),a(s,Ql,e),a(s,le,e),a(s,El,e),M(ae,s,e),a(s,Sl,e),M(te,s,e),a(s,Al,e),a(s,ne,e),a(s,Ll,e),M(z,s,e),a(s,ql,e),M(ie,s,e),a(s,Dl,e),a(s
,pe,e),a(s,Pl,e),a(s,ce,e),a(s,Ol,e),a(s,re,e),a(s,Kl,e),a(s,C,e),a(s,sa,e),a(s,X,e),a(s,ea,e),a(s,oe,e),a(s,la,e),a(s,v,e),a(s,aa,e),M(N,s,e),a(s,ta,e),a(s,ue,e),a(s,na,e),M(_,s,e),a(s,ia,e),M(de,s,e),a(s,pa,e),a(s,he,e),ca=!0},p(s,[e]){const pt={};e&2&&(pt.$$scope={dirty:e,ctx:s}),w.$set(pt);const ct={};e&2&&(ct.$$scope={dirty:e,ctx:s}),x.$set(ct);const rt={};e&2&&(rt.$$scope={dirty:e,ctx:s}),Z.$set(rt);const ot={};e&2&&(ot.$$scope={dirty:e,ctx:s}),R.$set(ot);const ut={};e&2&&(ut.$$scope={dirty:e,ctx:s}),z.$set(ut);const dt={};e&2&&(dt.$$scope={dirty:e,ctx:s}),N.$set(dt);const Mt={};e&2&&(Mt.$$scope={dirty:e,ctx:s}),_.$set(Mt)},i(s){ca||(m(k.$$.fragment,s),m(V.$$.fragment,s),m(W.$$.fragment,s),m(S.$$.fragment,s),m(L.$$.fragment,s),m(D.$$.fragment,s),m(P.$$.fragment,s),m(K.$$.fragment,s),m(ss.$$.fragment,s),m(w.$$.fragment,s),m(as.$$.fragment,s),m(x.$$.fragment,s),m(ns.$$.fragment,s),m(ps.$$.fragment,s),m(rs.$$.fragment,s),m(os.$$.fragment,s),m(Js.$$.fragment,s),m(ys.$$.fragment,s),m(Ts.$$.fragment,s),m(gs.$$.fragment,s),m(Z.$$.fragment,s),m(fs.$$.fragment,s),m(Zs.$$.fragment,s),m(Gs.$$.fragment,s),m(Is.$$.fragment,s),m(zs.$$.fragment,s),m(Xs.$$.fragment,s),m(Ns.$$.fragment,s),m(_s.$$.fragment,s),m(ks.$$.fragment,s),m($s.$$.fragment,s),m(Bs.$$.fragment,s),m(Ys.$$.fragment,s),m(Qs.$$.fragment,s),m(Ss.$$.fragment,s),m(As.$$.fragment,s),m(R.$$.fragment,s),m(Ds.$$.fragment,s),m(Os.$$.fragment,s),m(se.$$.fragment,s),m(ae.$$.fragment,s),m(te.$$.fragment,s),m(z.$$.fragment,s),m(ie.$$.fragment,s),m(N.$$.fragment,s),m(_.$$.fragment,s),m(de.$$.fragment,s),ca=!0)},o(s){J(k.$$.fragment,s),J(V.$$.fragment,s),J(W.$$.fragment,s),J(S.$$.fragment,s),J(L.$$.fragment,s),J(D.$$.fragment,s),J(P.$$.fragment,s),J(K.$$.fragment,s),J(ss.$$.fragment,s),J(w.$$.fragment,s),J(as.$$.fragment,s),J(x.$$.fragment,s),J(ns.$$.fragment,s),J(ps.$$.fragment,s),J(rs.$$.fragment,s),J(os.$$.fragment,s),J(Js.$$.fragment,s),J(ys.$$.fragment,s),J(Ts.$$.fragment,s),J(gs.$$.fragment,s),J(Z.$$.fragment,s),J(fs.
$$.fragment,s),J(Zs.$$.fragment,s),J(Gs.$$.fragment,s),J(Is.$$.fragment,s),J(zs.$$.fragment,s),J(Xs.$$.fragment,s),J(Ns.$$.fragment,s),J(_s.$$.fragment,s),J(ks.$$.fragment,s),J($s.$$.fragment,s),J(Bs.$$.fragment,s),J(Ys.$$.fragment,s),J(Qs.$$.fragment,s),J(Ss.$$.fragment,s),J(As.$$.fragment,s),J(R.$$.fragment,s),J(Ds.$$.fragment,s),J(Os.$$.fragment,s),J(se.$$.fragment,s),J(ae.$$.fragment,s),J(te.$$.fragment,s),J(z.$$.fragment,s),J(ie.$$.fragment,s),J(N.$$.fragment,s),J(_.$$.fragment,s),J(de.$$.fragment,s),ca=!1},d(s){s&&(l(T),l(o),l(U),l(ye),l(Te),l($),l(Ue),l(B),l(ge),l(H),l(je),l(be),l(Y),l(fe),l(b),l(we),l(F),l(xe),l(f),l(Ze),l(Q),l(Ge),l(E),l(Re),l(Ie),l(A),l(ze),l(Ce),l(q),l(Xe),l(ve),l(Ne),l(O),l(_e),l(ke),l(Ve),l(es),l($e),l(Be),l(ls),l(He),l(We),l(Ye),l(ts),l(Fe),l(Qe),l(is),l(Ee),l(Se),l(cs),l(Ae),l(Le),l(qe),l(us),l(De),l(ds),l(Pe),l(Ms),l(Oe),l(ms),l(Ke),l(sl),l(hs),l(el),l(ll),l(al),l(Us),l(tl),l(nl),l(il),l(js),l(pl),l(bs),l(cl),l(rl),l(ws),l(ol),l(G),l(ul),l(xs),l(dl),l(Ml),l(ml),l(Rs),l(Jl),l(hl),l(yl),l(Cs),l(Tl),l(Ul),l(vs),l(gl),l(jl),l(bl),l(fl),l(Vs),l(wl),l(xl),l(Zl),l(Hs),l(Gl),l(Ws),l(Rl),l(Il),l(Fs),l(zl),l(Cl),l(Es),l(Xl),l(vl),l(Nl),l(Ls),l(_l),l(kl),l(qs),l(Vl),l($l),l(Ps),l(Bl),l(Hl),l(Ks),l(Wl),l(Yl),l(ee),l(Fl),l(I),l(Ql),l(le),l(El),l(Sl),l(Al),l(ne),l(Ll),l(ql),l(Dl),l(pe),l(Pl),l(ce),l(Ol),l(re),l(Kl),l(C),l(sa),l(X),l(ea),l(oe),l(la),l(v),l(aa),l(ta),l(ue),l(na),l(ia),l(pa),l(he)),l(i),h(k,s),h(V,s),h(W,s),h(S,s),h(L,s),h(D,s),h(P,s),h(K,s),h(ss,s),h(w,s),h(as,s),h(x,s),h(ns,s),h(ps,s),h(rs,s),h(os,s),h(Js,s),h(ys,s),h(Ts,s),h(gs,s),h(Z,s),h(fs,s),h(Zs,s),h(Gs,s),h(Is,s),h(zs,s),h(Xs,s),h(Ns,s),h(_s,s),h(ks,s),h($s,s),h(Bs,s),h(Ys,s),h(Qs,s),h(Ss,s),h(As,s),h(R,s),h(Ds,s),h(Os,s),h(se,s),h(ae,s),h(te,s),h(z,s),h(ie,s),h(N,s),h(_,s),h(de,s)}}}const Xt='{"title":"Creare il proprio dataset","local":"creare-il-proprio-dataset","sections":[{"title":"Recuperare i dati","local":"recuperare-i-dati","sections":[],"depth":2},{"title":"Pulire 
i dati","local":"pulire-i-dati","sections":[],"depth":2},{"title":"Estendere il dataset","local":"estendere-il-dataset","sections":[],"depth":2},{"title":"Caricare il dataset sull’Hub Hugging Face","local":"caricare-il-dataset-sullhub-hugging-face","sections":[],"depth":2},{"title":"Creare una dataset card","local":"creare-una-dataset-card","sections":[],"depth":2}],"depth":1}';function vt(g){return ht(()=>{new URLSearchParams(window.location.search).get("fw")}),[]}class Wt extends yt{constructor(i){super(),Tt(this,i,vt,Ct,Jt,{})}}export{Wt as component}; | |
Xet Storage Details
- Size: 85.5 kB
- Xet hash: bd4701e2a1cb1bf01afcdf03bb908f424c9dfc545b3ff3e0f034c7dc4d22e866
·
Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.