Buckets:
| import{s as ut,o as mt,n as ma}from"../chunks/scheduler.37c15a92.js";import{S as Mt,i as Jt,g as i,s as t,r as d,A as yt,h as p,f as e,c as n,j as dt,u,x as c,k as b,y as ht,a as l,v as m,d as M,t as J,w as y}from"../chunks/index.2bf4358c.js";import{T as ua}from"../chunks/Tip.363c041f.js";import{Y as Tt}from"../chunks/Youtube.1e50a667.js";import{C as h}from"../chunks/CodeBlock.4e987730.js";import{C as Ut}from"../chunks/CourseFloatingBanner.6add7356.js";import{H as Ma,E as jt}from"../chunks/getInferenceSnippets.1837c472.js";/* Generated Svelte fragment factories (minified build output). bt, gt, ft, wt, xt, Zt and Gt all have the same shape: each returns an object with c, l, m, p and d members that manage one p element whose innerHTML is the static string T. Member c creates the element through the imported helper i. Member l obtains it from r through the imported helper p (tag P, data-svelte-h flag) and rewrites innerHTML only when the imported helper c returns something other than the hard-coded svelte- id. Member m forwards r, o and U to the imported helper l. Member p is the imported ma. Member d calls the imported helper e on o when r is truthy. NOTE(review): i, p, c, l, e and ma are minified aliases from the chunk imports at the start of this line; presumably the Svelte element, claim, hash-read, insert, detach and noop internals - confirm against those chunks. The parameter j is never read in these seven functions. *//* bt: tip text (Portuguese) inviting the reader to click URLs in the JSON payload shown above it; later in this file it is passed as the default slot of a ua instance (ua is imported from the Tip chunk). */function bt(j){let o,T="✏️ <strong>Experimente!</strong> Clique em alguns dos URLs na carga JSON acima para ter uma ideia de que tipo de informação cada issue do GitHub está vinculado.";return{c(){o=i("p"),o.innerHTML=T},l(r){o=p(r,"P",{"data-svelte-h":!0}),c(o)!=="svelte-1e5rp6z"&&(o.innerHTML=T)},m(r,U){l(r,o,U)},p:ma,d(r){r&&e(o)}}}/* gt: warning text about not sharing a notebook that contains GITHUB_TOKEN and suggesting a .env file loaded with python-dotenv; later in this file it is the default slot of a ua instance created with warning set to true. */function gt(j){let o,T='⚠️ Não compartilhe um notebook com seu <code>GITHUB_TOKEN</code> colado nele. Recomendamos que você exclua a última célula depois de executá-la para evitar o vazamento dessas informações acidentalmente. Melhor ainda, armazene o token em um arquivo <em>.env</em> e use a <a href="https://github.com/theskumar/python-dotenv" rel="nofollow"><code>python-dotenv</code> library</a> para carregá-lo automaticamente para você como uma variável de ambiente.';return{c(){o=i("p"),o.innerHTML=T},l(r){o=p(r,"P",{"data-svelte-h":!0}),c(o)!=="svelte-1vzn3qq"&&(o.innerHTML=T)},m(r,U){l(r,o,U)},p:ma,d(r){r&&e(o)}}}/* ft: exercise text about computing the average time to close issues with Dataset.filter() and Dataset.set_format(); its string T spans a line break, which must be kept exactly as is. */function ft(j){let o,T="✏️ <strong>Experimente!</strong> Calcule o tempo médio que leva para fechar as issues em 🤗 Datasets. Você pode achar a função <code>Dataset.filter()</code> útil para filtrar os pull requests e as issues abertas, e você pode usar a função <code>Dataset.set_format()</code> para converter o conjunto de dados em um <code>DataFrame</code> para que você possa manipular facilmente os timestamps <code>created_at</code> e <code>closed_at</code>. 
Para pontos de bônus, calcule o tempo médio que leva para fechar os pull requests.";return{c(){o=i("p"),o.innerHTML=T},l(r){o=p(r,"P",{"data-svelte-h":!0}),c(o)!=="svelte-19u3bxy"&&(o.innerHTML=T)},m(r,U){l(r,o,U)},p:ma,d(r){r&&e(o)}}}/* wt: exercise text about obtaining a Hub token and creating an empty github-issues repository, with a reminder never to save credentials. */function wt(j){let o,T="✏️ <strong>Experimente!</strong> Use seu nome de usuário e senha do Hugging Face Hub para obter um token e criar um repositório vazio chamado <code>github-issues</code>. Lembre-se de <strong>nunca salvar suas credenciais</strong> no Colab ou em qualquer outro repositório, pois essas informações podem ser exploradas por agentes mal-intencionados.";return{c(){o=i("p"),o.innerHTML=T},l(r){o=p(r,"P",{"data-svelte-h":!0}),c(o)!=="svelte-ld82he"&&(o.innerHTML=T)},m(r,U){l(r,o,U)},p:ma,d(r){r&&e(o)}}}/* xt: hint text about pushing a dataset from the terminal with huggingface-cli, linking to the Datasets sharing guide. */function xt(j){let o,T='💡 Você também pode enviar um conjunto de dados para o Hugging Face Hub diretamente do terminal usando <code>huggingface-cli</code> e um pouco de magia Git. Consulte o <a href="https://huggingface.co/docs/datasets/share#share-a-dataset-using-the-cli" rel="nofollow">guia do 🤗 Datasets</a> para obter detalhes sobre como fazer isso.';return{c(){o=i("p"),o.innerHTML=T},l(r){o=p(r,"P",{"data-svelte-h":!0}),c(o)!=="svelte-rrol3s"&&(o.innerHTML=T)},m(r,U){l(r,o,U)},p:ma,d(r){r&&e(o)}}}/* Zt: exercise text about completing the README.md using the dataset-tagging app and the datasets README guide. */function Zt(j){let o,T='✏️ <strong>Experimente!</strong> Use o aplicativo <code>dataset-tagging</code> e <a href="https://github.com/huggingface/datasets/blob/master/templates/README_guide.md" rel="nofollow">guia do 🤗 datasets</a> para concluir o <em>Arquivo README.md</em> para o conjunto de dados de issues do GitHub.';return{c(){o=i("p"),o.innerHTML=T},l(r){o=p(r,"P",{"data-svelte-h":!0}),c(o)!=="svelte-1vt20th"&&(o.innerHTML=T)},m(r,U){l(r,o,U)},p:ma,d(r){r&&e(o)}}}/* Gt: exercise text about building a GitHub issues dataset for another open-source library and, as a bonus, fitting a multilabel classifier on the labels field; its string T spans a line break, which must be kept exactly as is. */function Gt(j){let o,T="✏️ <strong>Experimente!</strong> Siga as etapas que seguimos nesta seção para criar um conjunto de dados de issues do GitHub para sua biblioteca de código aberto favorita (escolha algo diferente do 🤗 datasets, é claro!). 
Para pontos de bônus, ajuste um classificador multilabel para prever as tags presentes no campo <code>labels</code>.";return{c(){o=i("p"),o.innerHTML=T},l(r){o=p(r,"P",{"data-svelte-h":!0}),c(o)!=="svelte-eptrxz"&&(o.innerHTML=T)},m(r,U){l(r,o,U)},p:ma,d(r){r&&e(o)}}}/* Rt: only the start of this function is covered here (local declarations and static HTML strings); the definition continues past this block and is left untouched. */function Rt(j){let o,T,r,U,z,ya,V,ha,$,il='Às vezes, o conjunto de dados de que você precisa para criar um aplicativo de PLN não existe, portanto, você mesmo precisará criá-lo. Nesta seção, mostraremos como criar um corpus de <a href="https://github.com/features/issues/" rel="nofollow">issues do GitHub</a>, que são comumente usados para rastrear bugs ou recursos nos repositórios do GitHub. Este corpus pode ser usado para vários fins, incluindo:',Ta,B,pl="<li>Explorar quanto tempo leva para fechar as issues abertos ou pull requests</li> <li>Treinar um <em>classificador multilabel</em> que pode marcar issues com metadados com base na descrição da issue (por exemplo, “bug”, “melhoria” ou “pergunta”)</li> <li>Criando um mecanismo de pesquisa semântica para descobrir quais issues correspondem à consulta de um usuário</li>",Ua,H,cl="Aqui nos concentraremos na criação do corpus e, na próxima seção, abordaremos o aplicativo de pesquisa semântica. Para manter a meta, usaremos as issues do GitHub associados a um projeto de código aberto popular: 🤗 Datasets! Vamos dar uma olhada em como obter os dados e explorar as informações contidas nessas edições.",ja,W,ba,F,rl='Você pode encontrar todos as issues em 🤗 Datasets navegando até a <a href="https://github.com/huggingface/datasets/issues" rel="nofollow">guia de issues</a> do repositório. Conforme mostrado na captura de tela a seguir, no momento da redação, havia 331 issues abertos e 668 fechados.',ga,g,dl='<img src="https://huggingface.co/datasets/huggingface-course/documentation-images/resolve/main/en/chapter5/datasets-issues.png" alt="The GitHub issues associated with 🤗 Datasets." 
width="80%"/>',fa,Q,ul="Se você clicar em uma dessas issues, verá que ele contém um título, uma descrição e um conjunto de rótulos que caracterizam a issue. Um exemplo é mostrado na captura de tela abaixo.",wa,f,ml='<img src="https://huggingface.co/datasets/huggingface-course/documentation-images/resolve/main/en/chapter5/datasets-issues-single.png" alt="A typical GitHub issue in the 🤗 Datasets repository." width="80%"/>',xa,Y,Ml='Para baixar todos as issues do repositório, usaremos a <a href="https://docs.github.com/en/rest" rel="nofollow">GitHub REST API</a> para pesquisar o [<code>Issues</code> endpoint](<a href="https://docs.github." rel="nofollow">https://docs.github.</a> com/en/rest/reference/issues#list-repository-issues). Esse endpoint retorna uma lista de objetos JSON, com cada objeto contendo um grande número de campos que incluem o título e a descrição, bem como metadados sobre o status da issue e assim por diante.',Za,E,Jl="Uma maneira conveniente de baixar as issues é por meio da biblioteca <code>requests</code>, que é a maneira padrão de fazer solicitações HTTP em Python. Você pode instalar a biblioteca executando:",Ga,S,Ra,A,yl="Uma vez que a biblioteca esteja instalada, você pode fazer solicitações GET para o endpoint <code>Issues</code> invocando a função <code>requests.get()</code>. Por exemplo, você pode executar o seguinte comando para recuperar a primeira issue na primeira página:",va,q,Ia,L,hl="O objeto <code>response</code> contém muitas informações úteis sobre a solicitação, incluindo o código de status HTTP:",Xa,D,Ca,P,Na,O,Tl='onde um status <code>200</code> significa que a solicitação foi bem-sucedida (você pode encontrar uma lista de possíveis códigos de status HTTP <a href="https://en.wikipedia.org/wiki/List_of_HTTP_status_codes" rel="nofollow">aqui</a>). O que realmente nos interessa, porém, é o <em>payload</em>, que pode ser acessado em vários formatos como bytes, strings ou JSON. 
Como sabemos que nossas issues estão no formato JSON, vamos inspecionar o payload da seguinte forma:',_a,K,ka,ss,za,as,Ul="Uau, é muita informação! Podemos ver campos úteis como <code>title</code>, <code>body</code> e <code>number</code> que descrevem a issue, bem como informações sobre o usuário do GitHub que abriu a issue.",Va,w,$a,es,jl='Conforme descrito na [documentação] do GitHub (<a href="https://docs.github.com/en/rest/overview/resources-in-the-rest-api#rate-limiting" rel="nofollow">https://docs.github.com/en/rest/overview/resources-in-the-rest-api#rate-limiting</a>), as solicitações não autenticadas são limitadas a 60 solicitações por hora. Embora você possa aumentar o parâmetro de consulta <code>per_page</code> para reduzir o número de solicitações feitas, você ainda atingirá o limite de taxa em qualquer repositório que tenha mais do que alguns milhares de issues. Então, em vez disso, você deve seguir as [instruções] do GitHub (<a href="https://docs.github.com/en/github/authenticating-to-github/creating-a-personal-access-token" rel="nofollow">https://docs.github.com/en/github/authenticating-to-github/creating-a-personal-access-token</a>) sobre como criar um <em>token de acesso pessoal</em> para que você pode aumentar o limite de taxa para 5.000 solicitações por hora. Depois de ter seu token, você pode incluí-lo como parte do cabeçalho da solicitação:',Ba,ls,Ha,x,Wa,ts,bl="Agora que temos nosso token de acesso, vamos criar uma função que possa baixar todas as issues de um repositório do GitHub:",Fa,ns,Qa,os,gl="Agora, quando chamamos <code>fetch_issues()</code>, ele fará o download de todas as issues em lotes para evitar exceder o limite do GitHub no número de solicitações por hora; o resultado será armazenado em um arquivo <em>repository_name-issues.jsonl</em>, onde cada linha é um objeto JSON que representa uma issue. 
Vamos usar esta função para pegar todas as issues de 🤗 Datasets:",Ya,is,Ea,ps,fl='Depois que as issues forem baixadas, podemos carregá-las localmente usando nossas novas habilidades da <a href="/course/chapter5/2">seção 2</a>:',Sa,cs,Aa,rs,qa,ds,wl='Ótimo, criamos nosso primeiro conjunto de dados do zero! Mas por que existem vários milhares de issues quando a <a href="https://github.com/huggingface/datasets/issues" rel="nofollow">guia Issue</a> do repositório 🤗 Datasets mostra apenas cerca de 1.000 issues no total 🤔? Conforme descrito na [documentação] do GitHub (<a href="https://docs.github.com/en/rest/reference/issues#list-issues-assigned-to-the-authenticated-user" rel="nofollow">https://docs.github.com/en/rest/reference/issues#list-issues-assigned-to-the-authenticated-user</a>), isso ocorre porque baixamos todos os pull request também:',La,us,xl="<p>A API REST v3 do GitHub considera cada pull request como uma issue, mas nem toda issue é um pull request. Por esse motivo, os endpoints de “issues” podem retornar issues e solicitações de pull na resposta. Você pode identificar solicitações de pull pela chave <code>pull_request</code>. Esteja ciente de que o <code>id</code> de uma solicitação pull retornada de endpoints “issues” será um ID de issue.</p>",Da,ms,Zl="Como o conteúdo das issues e dos pull request são bem diferentes, vamos fazer um pequeno pré-processamento para nos permitir distinguir entre eles.",Pa,Ms,Oa,Js,Gl='O trecho acima da documentação do GitHub nos diz que a coluna <code>pull_request</code> pode ser usada para diferenciar entre issues e solicitações de pull request. Vamos olhar para uma amostra aleatória para ver qual é a diferença. 
Como fizemos na <a href="/course/chapter5/3">seção 3</a>, vamos encadear <code>Dataset.shuffle()</code> e <code>Dataset.select()</code> para criar uma amostra aleatória e então compactar o <code>html_url</code> e <code>pull_request</code> para que possamos comparar os vários URLs:',Ka,ys,se,hs,ae,Ts,Rl="Aqui podemos ver que cada pull request está associado a vários URLs, enquanto as issues comuns têm uma entrada <code>None</code>. Podemos usar essa distinção para criar uma nova coluna <code>is_pull_request</code> que verifica se o campo <code>pull_request</code> é <code>None</code> ou não:",ee,Us,le,Z,te,js,vl="Embora possamos continuar a limpar o conjunto de dados descartando ou renomeando algumas colunas, geralmente é uma boa prática manter o conjunto de dados o mais “bruto” possível neste estágio para que possa ser facilmente usado em vários aplicativos.",ne,bs,Il="Antes de enviarmos nosso conjunto de dados para o Hugging Face Hub, vamos lidar com uma coisa que está faltando: os comentários associados a cada issue e pull request. Vamos adicioná-los a seguir - você adivinhou - a API REST do GitHub!",oe,gs,ie,fs,Xl="Conforme mostrado na captura de tela a seguir, os comentários associados a uma issue ou a pull request fornecem uma rica fonte de informações, especialmente se estivermos interessados em criar um mecanismo de pesquisa para responder às consultas dos usuários sobre a biblioteca.",pe,G,Cl='<img src="https://huggingface.co/datasets/huggingface-course/documentation-images/resolve/main/en/chapter5/datasets-issues-comment.png" alt="Comments associated with an issue about 🤗 Datasets." width="80%"/>',ce,ws,Nl='A API REST do GitHub fornece um <a href="https://docs.github.com/en/rest/reference/issues#list-issue-comments" rel="nofollow">endpoint <code>Comments</code></a> que retorna todos os comentários associados a uma issue. 
Vamos testar o endpoint para ver o que ele retorna:',re,xs,de,Zs,ue,Gs,_l="Podemos ver que o comentário está armazenado no campo <code>body</code>, então vamos escrever uma função simples que retorna todos os comentários associados a uma issue selecionando o conteúdo do <code>body</code> para cada elemento em <code>response.json()</code>:",me,Rs,Me,vs,Je,Is,kl="Isso parece certo, então vamos usar <code>Dataset.map()</code> para adicionar uma nova coluna <code>comments</code> para cada issue em nosso conjunto de dados:",ye,Xs,he,Cs,zl="A etapa final é salvar o conjunto de dados aumentado junto com nossos dados brutos para que possamos enviá-los para o Hub:",Te,Ns,Ue,_s,je,ks,be,zs,Vl='Agora que temos nosso conjunto de dados aumentado, é hora de enviá-lo para o Hub para que possamos compartilhá-lo com a comunidade! Para fazer o upload do conjunto de dados, usaremos a <a href="https://github.com/huggingface/huggingface_hub" rel="nofollow">🤗 Hub library</a>, que nos permite interagir com o Hugging Face Hub por meio de uma API Python. 🤗 Hub vem pré-instalado com 🤗 Transformers, para que possamos usá-lo diretamente. Por exemplo, podemos usar a função <code>list_datasets()</code> para obter informações sobre todos os conjuntos de dados públicos atualmente hospedados no Hub:',ge,Vs,fe,$s,we,Bs,$l="Podemos ver que atualmente existem cerca de 1.500 conjuntos de dados no Hub, e a função <code>list_datasets()</code> também fornece alguns metadados básicos sobre cada repositório de conjuntos de dados.",xe,Hs,Bl="Para nossos propósitos, a primeira coisa que precisamos fazer é criar um novo repositório de conjunto de dados no Hub. Para fazer isso, precisamos de um token de autenticação, que pode ser obtido primeiro entrando no Hugging Face Hub com a função <code>notebook_login()</code>:",Ze,Ws,Ge,Fs,Hl="Isso criará um widget onde você poderá inserir seu nome de usuário e senha, e um token de API será salvo em <em>~/.huggingface/token</em>. 
Se você estiver executando o código em um terminal, poderá fazer login via CLI:",Re,Qs,ve,Ys,Wl="Feito isso, podemos criar um novo repositório de conjunto de dados com a função <code>create_repo()</code>:",Ie,Es,Xe,Ss,Ce,As,Fl="Neste exemplo, criamos um repositório de conjunto de dados vazio chamado <code>github-issues</code> sob o nome de usuário <code>lewtun</code> (o nome de usuário deve ser seu nome de usuário do Hub quando você estiver executando este código!).",Ne,R,_e,qs,Ql="Em seguida, vamos clonar o repositório do Hub para nossa máquina local e copiar nosso arquivo de conjunto de dados para ele. O 🤗 Hub fornece uma classe <code>Repository</code> útil que envolve muitos dos comandos comuns do Git, portanto, para clonar o repositório remoto, basta fornecer o URL e o caminho local para o qual desejamos clonar:",ke,Ls,ze,Ds,Yl="Por padrão, várias extensões de arquivo (como <em>.bin</em>, <em>.gz</em> e <em>.zip</em>) são rastreadas com o Git LFS para que arquivos grandes possam ser versionados no mesmo fluxo de trabalho do Git. Você pode encontrar uma lista de extensões de arquivos rastreados dentro do arquivo <em>.gitattributes</em> do repositório. Para incluir o formato JSON Lines na lista, podemos executar o seguinte comando:",Ve,Ps,$e,Os,El="Então podemos usar <code>Repository.push_to_hub()</code> para enviar o conjunto de dados para o Hub:",Be,Ks,He,sa,Sl="Se navegarmos para a URL contida em <code>repo_url</code>, veremos agora que nosso arquivo de conjunto de dados foi carregado.",We,v,Al='<img src="https://huggingface.co/datasets/huggingface-course/documentation-images/resolve/main/en/chapter5/hub-repo.png" alt="Our dataset repository on the Hugging Face Hub." 
width="80%"/>',Fe,aa,ql="A partir daqui, qualquer um pode baixar o conjunto de dados simplesmente fornecendo <code>load_dataset()</code> com o ID do repositório como o argumento <code>path</code>:",Qe,ea,Ye,la,Ee,ta,Ll="Legal, nós enviamos nosso conjunto de dados para o Hub e está disponível para outros usarem! Há apenas uma coisa importante a fazer: adicionar um <em>cartão de conjunto de dados</em> que explica como o corpus foi criado e fornece outras informações úteis para a comunidade.",Se,I,Ae,na,qe,oa,Dl="Conjuntos de dados bem documentados são mais propensos a serem úteis para outras pessoas (incluindo você mesmo no futuro!), pois fornecem o contexto para permitir que os usuários decidam se o conjunto de dados é relevante para sua tarefa e avaliem possíveis vieses ou riscos associados ao uso o conjunto de dados.",Le,ia,Pl="No Hugging Face Hub, essas informações são armazenadas no arquivo <em>README.md</em> de cada repositório de conjunto de dados. Há duas etapas principais que você deve seguir antes de criar este arquivo:",De,pa,Ol='<li>Use a aplicação <a href="https://huggingface.co/datasets/tagging/" rel="nofollow"><code>datasets-tagging</code></a> para criar tags de metadados no formato YAML. Essas tags são usadas para uma variedade de recursos de pesquisa no Hugging Face Hub e garantem que seu conjunto de dados possa ser facilmente encontrado pelos membros da comunidade. Como criamos um conjunto de dados personalizado aqui, você precisará clonar o repositório <code>datasets-tagging</code> e executar o aplicativo localmente. Veja como é a interface:</li>',Pe,X,Kl='<img src="https://huggingface.co/datasets/huggingface-course/documentation-images/resolve/main/en/chapter5/datasets-tagger.png" alt="The 'datasets-tagging' interface." 
width="80%"/>',Oe,C,st='<li>Leia o <a href="https://github.com/huggingface/datasets/blob/master/templates/README_guide.md" rel="nofollow">guia do 🤗 datasets</a> sobre como criar cartões informativos de conjuntos de dados e use-os como modelo.</li>',Ke,ca,at="Você pode criar o arquivo <em>README.md</em> diretamente no Hub e encontrar um cartão de conjunto de dados de modelo no repositório de conjunto de dados <code>lewtun/github-issues</code>. Uma captura de tela do cartão de conjunto de dados preenchido é mostrada abaixo.",sl,N,et='<img src="https://huggingface.co/datasets/huggingface-course/documentation-images/resolve/main/en/chapter5/dataset-card.png" alt="A dataset card." width="80%"/>',al,_,el,ra,lt="É isso! Vimos nesta seção que criar um bom conjunto de dados pode ser bastante complicado, mas felizmente carregá-lo e compartilhá-lo com a comunidade não é. Na próxima seção, usaremos nosso novo conjunto de dados para criar um mecanismo de pesquisa semântica com o 🤗 datasets que podem corresponder perguntas as issues e comentários mais relevantes.",ll,k,tl,da,nl,Ja,ol;return z=new Ma({props:{title:"Criando seu próprio dataset",local:"criando-seu-próprio-dataset",headingTag:"h1"}}),V=new Ut({props:{chapter:5,classNames:"absolute z-10 right-0 top-0",notebooks:[{label:"Google Colab",value:"https://colab.research.google.com/github/huggingface/notebooks/blob/master/course/pt/chapter5/section5.ipynb"},{label:"Aws Studio",value:"https://studiolab.sagemaker.aws/import/github/huggingface/notebooks/blob/master/course/pt/chapter5/section5.ipynb"}]}}),W=new Ma({props:{title:"Obtendo os dados",local:"obtendo-os-dados",headingTag:"h2"}}),S=new h({props:{code:"IXBpcCUyMGluc3RhbGwlMjByZXF1ZXN0cw==",highlighted:"!pip install requests",wrap:!1}}),q=new 
h({props:{code:"aW1wb3J0JTIwcmVxdWVzdHMlMEElMEF1cmwlMjAlM0QlMjAlMjJodHRwcyUzQSUyRiUyRmFwaS5naXRodWIuY29tJTJGcmVwb3MlMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGaXNzdWVzJTNGcGFnZSUzRDElMjZwZXJfcGFnZSUzRDElMjIlMEFyZXNwb25zZSUyMCUzRCUyMHJlcXVlc3RzLmdldCh1cmwp",highlighted:`<span class="hljs-keyword">import</span> requests | |
| url = <span class="hljs-string">"https://api.github.com/repos/huggingface/datasets/issues?page=1&per_page=1"</span> | |
| response = requests.get(url)`,wrap:!1}}),D=new h({props:{code:"cmVzcG9uc2Uuc3RhdHVzX2NvZGU=",highlighted:"response.status_code",wrap:!1}}),P=new h({props:{code:"MjAw",highlighted:'<span class="hljs-number">200</span>',wrap:!1}}),K=new h({props:{code:"cmVzcG9uc2UuanNvbigp",highlighted:"response.json()",wrap:!1}}),ss=new h({props:{code:"JTVCJTdCJ3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnJlcG9zJTJGaHVnZ2luZ2ZhY2UlMkZkYXRhc2V0cyUyRmlzc3VlcyUyRjI3OTInJTJDJTBBJTIwJTIwJ3JlcG9zaXRvcnlfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmFwaS5naXRodWIuY29tJTJGcmVwb3MlMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJyUyQyUwQSUyMCUyMCdsYWJlbHNfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmFwaS5naXRodWIuY29tJTJGcmVwb3MlMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGaXNzdWVzJTJGMjc5MiUyRmxhYmVscyU3QiUyRm5hbWUlN0QnJTJDJTBBJTIwJTIwJ2NvbW1lbnRzX3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnJlcG9zJTJGaHVnZ2luZ2ZhY2UlMkZkYXRhc2V0cyUyRmlzc3VlcyUyRjI3OTIlMkZjb21tZW50cyclMkMlMEElMjAlMjAnZXZlbnRzX3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnJlcG9zJTJGaHVnZ2luZ2ZhY2UlMkZkYXRhc2V0cyUyRmlzc3VlcyUyRjI3OTIlMkZldmVudHMnJTJDJTBBJTIwJTIwJ2h0bWxfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmdpdGh1Yi5jb20lMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGcHVsbCUyRjI3OTInJTJDJTBBJTIwJTIwJ2lkJyUzQSUyMDk2ODY1MDI3NCUyQyUwQSUyMCUyMCdub2RlX2lkJyUzQSUyMCdNREV4T2xCMWJHeFNaWEYxWlhOME56RXdOelV5TWpjMCclMkMlMEElMjAlMjAnbnVtYmVyJyUzQSUyMDI3OTIlMkMlMEElMjAlMjAndGl0bGUnJTNBJTIwJ1VwZGF0ZSUyMEdvb0FRJyUyQyUwQSUyMCUyMCd1c2VyJyUzQSUyMCU3Qidsb2dpbiclM0ElMjAnYmhhdml0dnlhbWFsaWsnJTJDJTBBJTIwJTIwJTIwJ2lkJyUzQSUyMDE5NzE4ODE4JTJDJTBBJTIwJTIwJTIwJ25vZGVfaWQnJTNBJTIwJ01EUTZWWE5sY2pFNU56RTRPREU0JyUyQyUwQSUyMCUyMCUyMCdhdmF0YXJfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmF2YXRhcnMuZ2l0aHVidXNlcmNvbnRlbnQuY29tJTJGdSUyRjE5NzE4ODE4JTNGdiUzRDQnJTJDJTBBJTIwJTIwJTIwJ2dyYXZhdGFyX2lkJyUzQSUyMCcnJTJDJTBBJTIwJTIwJTIwJ3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnVzZXJzJTJGYmhhdml0dnlhbWFsaWsnJTJDJTBBJTIwJTIwJTIwJ2h0bWxfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmdpdGh1Yi5jb20lMkZiaGF2aXR2e
WFtYWxpayclMkMlMEElMjAlMjAlMjAnZm9sbG93ZXJzX3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnVzZXJzJTJGYmhhdml0dnlhbWFsaWslMkZmb2xsb3dlcnMnJTJDJTBBJTIwJTIwJTIwJ2ZvbGxvd2luZ191cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGYXBpLmdpdGh1Yi5jb20lMkZ1c2VycyUyRmJoYXZpdHZ5YW1hbGlrJTJGZm9sbG93aW5nJTdCJTJGb3RoZXJfdXNlciU3RCclMkMlMEElMjAlMjAlMjAnZ2lzdHNfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmFwaS5naXRodWIuY29tJTJGdXNlcnMlMkZiaGF2aXR2eWFtYWxpayUyRmdpc3RzJTdCJTJGZ2lzdF9pZCU3RCclMkMlMEElMjAlMjAlMjAnc3RhcnJlZF91cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGYXBpLmdpdGh1Yi5jb20lMkZ1c2VycyUyRmJoYXZpdHZ5YW1hbGlrJTJGc3RhcnJlZCU3QiUyRm93bmVyJTdEJTdCJTJGcmVwbyU3RCclMkMlMEElMjAlMjAlMjAnc3Vic2NyaXB0aW9uc191cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGYXBpLmdpdGh1Yi5jb20lMkZ1c2VycyUyRmJoYXZpdHZ5YW1hbGlrJTJGc3Vic2NyaXB0aW9ucyclMkMlMEElMjAlMjAlMjAnb3JnYW5pemF0aW9uc191cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGYXBpLmdpdGh1Yi5jb20lMkZ1c2VycyUyRmJoYXZpdHZ5YW1hbGlrJTJGb3JncyclMkMlMEElMjAlMjAlMjAncmVwb3NfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmFwaS5naXRodWIuY29tJTJGdXNlcnMlMkZiaGF2aXR2eWFtYWxpayUyRnJlcG9zJyUyQyUwQSUyMCUyMCUyMCdldmVudHNfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmFwaS5naXRodWIuY29tJTJGdXNlcnMlMkZiaGF2aXR2eWFtYWxpayUyRmV2ZW50cyU3QiUyRnByaXZhY3klN0QnJTJDJTBBJTIwJTIwJTIwJ3JlY2VpdmVkX2V2ZW50c191cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGYXBpLmdpdGh1Yi5jb20lMkZ1c2VycyUyRmJoYXZpdHZ5YW1hbGlrJTJGcmVjZWl2ZWRfZXZlbnRzJyUyQyUwQSUyMCUyMCUyMCd0eXBlJyUzQSUyMCdVc2VyJyUyQyUwQSUyMCUyMCUyMCdzaXRlX2FkbWluJyUzQSUyMEZhbHNlJTdEJTJDJTBBJTIwJTIwJ2xhYmVscyclM0ElMjAlNUIlNUQlMkMlMEElMjAlMjAnc3RhdGUnJTNBJTIwJ29wZW4nJTJDJTBBJTIwJTIwJ2xvY2tlZCclM0ElMjBGYWxzZSUyQyUwQSUyMCUyMCdhc3NpZ25lZSclM0ElMjBOb25lJTJDJTBBJTIwJTIwJ2Fzc2lnbmVlcyclM0ElMjAlNUIlNUQlMkMlMEElMjAlMjAnbWlsZXN0b25lJyUzQSUyME5vbmUlMkMlMEElMjAlMjAnY29tbWVudHMnJTNBJTIwMSUyQyUwQSUyMCUyMCdjcmVhdGVkX2F0JyUzQSUyMCcyMDIxLTA4LTEyVDExJTNBNDAlM0ExOFonJTJDJTBBJTIwJTIwJ3VwZGF0ZWRfYXQnJTNBJTIwJzIwMjEtMDgtMTJUMTIlM0EzMSUzQTE3WiclMkMlMEElMjAlMjAnY2xvc2VkX2F0JyUzQSUyME5vbmUlMkMlMEElMjAlMjAnYXV0aG9yX2Fzc29jaWF0aW9uJyUzQSUyMCdDT05UUklCVVRPUiclM
kMlMEElMjAlMjAnYWN0aXZlX2xvY2tfcmVhc29uJyUzQSUyME5vbmUlMkMlMEElMjAlMjAncHVsbF9yZXF1ZXN0JyUzQSUyMCU3Qid1cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGYXBpLmdpdGh1Yi5jb20lMkZyZXBvcyUyRmh1Z2dpbmdmYWNlJTJGZGF0YXNldHMlMkZwdWxscyUyRjI3OTInJTJDJTBBJTIwJTIwJTIwJ2h0bWxfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmdpdGh1Yi5jb20lMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGcHVsbCUyRjI3OTInJTJDJTBBJTIwJTIwJTIwJ2RpZmZfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmdpdGh1Yi5jb20lMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGcHVsbCUyRjI3OTIuZGlmZiclMkMlMEElMjAlMjAlMjAncGF0Y2hfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmdpdGh1Yi5jb20lMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGcHVsbCUyRjI3OTIucGF0Y2gnJTdEJTJDJTBBJTIwJTIwJ2JvZHknJTNBJTIwJyU1Qkdvb0FRJTVEKGh0dHBzJTNBJTJGJTJGZ2l0aHViLmNvbSUyRmFsbGVuYWklMkZnb29hcSklMjBkYXRhc2V0JTIwd2FzJTIwcmVjZW50bHklMjB1cGRhdGVkJTIwYWZ0ZXIlMjBzcGxpdHMlMjB3ZXJlJTIwYWRkZWQlMjBmb3IlMjB0aGUlMjBzYW1lLiUyMFRoaXMlMjBQUiUyMGNvbnRhaW5zJTIwbmV3JTIwdXBkYXRlZCUyMEdvb0FRJTIwd2l0aCUyMHRyYWluJTJGdmFsJTJGdGVzdCUyMHNwbGl0cyUyMGFuZCUyMHVwZGF0ZWQlMjBSRUFETUUlMjBhcyUyMHdlbGwuJyUyQyUwQSUyMCUyMCdwZXJmb3JtZWRfdmlhX2dpdGh1Yl9hcHAnJTNBJTIwTm9uZSU3RCU1RA==",highlighted:`[{<span class="hljs-string">'url'</span>: <span class="hljs-string">'https://api.github.com/repos/huggingface/datasets/issues/2792'</span>, | |
| <span class="hljs-string">'repository_url'</span>: <span class="hljs-string">'https://api.github.com/repos/huggingface/datasets'</span>, | |
| <span class="hljs-string">'labels_url'</span>: <span class="hljs-string">'https://api.github.com/repos/huggingface/datasets/issues/2792/labels{/name}'</span>, | |
| <span class="hljs-string">'comments_url'</span>: <span class="hljs-string">'https://api.github.com/repos/huggingface/datasets/issues/2792/comments'</span>, | |
| <span class="hljs-string">'events_url'</span>: <span class="hljs-string">'https://api.github.com/repos/huggingface/datasets/issues/2792/events'</span>, | |
| <span class="hljs-string">'html_url'</span>: <span class="hljs-string">'https://github.com/huggingface/datasets/pull/2792'</span>, | |
| <span class="hljs-string">'id'</span>: <span class="hljs-number">968650274</span>, | |
| <span class="hljs-string">'node_id'</span>: <span class="hljs-string">'MDExOlB1bGxSZXF1ZXN0NzEwNzUyMjc0'</span>, | |
| <span class="hljs-string">'number'</span>: <span class="hljs-number">2792</span>, | |
| <span class="hljs-string">'title'</span>: <span class="hljs-string">'Update GooAQ'</span>, | |
| <span class="hljs-string">'user'</span>: {<span class="hljs-string">'login'</span>: <span class="hljs-string">'bhavitvyamalik'</span>, | |
| <span class="hljs-string">'id'</span>: <span class="hljs-number">19718818</span>, | |
| <span class="hljs-string">'node_id'</span>: <span class="hljs-string">'MDQ6VXNlcjE5NzE4ODE4'</span>, | |
| <span class="hljs-string">'avatar_url'</span>: <span class="hljs-string">'https://avatars.githubusercontent.com/u/19718818?v=4'</span>, | |
| <span class="hljs-string">'gravatar_id'</span>: <span class="hljs-string">''</span>, | |
| <span class="hljs-string">'url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik'</span>, | |
| <span class="hljs-string">'html_url'</span>: <span class="hljs-string">'https://github.com/bhavitvyamalik'</span>, | |
| <span class="hljs-string">'followers_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/followers'</span>, | |
| <span class="hljs-string">'following_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/following{/other_user}'</span>, | |
| <span class="hljs-string">'gists_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/gists{/gist_id}'</span>, | |
| <span class="hljs-string">'starred_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/starred{/owner}{/repo}'</span>, | |
| <span class="hljs-string">'subscriptions_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/subscriptions'</span>, | |
| <span class="hljs-string">'organizations_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/orgs'</span>, | |
| <span class="hljs-string">'repos_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/repos'</span>, | |
| <span class="hljs-string">'events_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/events{/privacy}'</span>, | |
| <span class="hljs-string">'received_events_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/received_events'</span>, | |
| <span class="hljs-string">'type'</span>: <span class="hljs-string">'User'</span>, | |
| <span class="hljs-string">'site_admin'</span>: <span class="hljs-literal">False</span>}, | |
| <span class="hljs-string">'labels'</span>: [], | |
| <span class="hljs-string">'state'</span>: <span class="hljs-string">'open'</span>, | |
| <span class="hljs-string">'locked'</span>: <span class="hljs-literal">False</span>, | |
| <span class="hljs-string">'assignee'</span>: <span class="hljs-literal">None</span>, | |
| <span class="hljs-string">'assignees'</span>: [], | |
| <span class="hljs-string">'milestone'</span>: <span class="hljs-literal">None</span>, | |
| <span class="hljs-string">'comments'</span>: <span class="hljs-number">1</span>, | |
| <span class="hljs-string">'created_at'</span>: <span class="hljs-string">'2021-08-12T11:40:18Z'</span>, | |
| <span class="hljs-string">'updated_at'</span>: <span class="hljs-string">'2021-08-12T12:31:17Z'</span>, | |
| <span class="hljs-string">'closed_at'</span>: <span class="hljs-literal">None</span>, | |
| <span class="hljs-string">'author_association'</span>: <span class="hljs-string">'CONTRIBUTOR'</span>, | |
| <span class="hljs-string">'active_lock_reason'</span>: <span class="hljs-literal">None</span>, | |
| <span class="hljs-string">'pull_request'</span>: {<span class="hljs-string">'url'</span>: <span class="hljs-string">'https://api.github.com/repos/huggingface/datasets/pulls/2792'</span>, | |
| <span class="hljs-string">'html_url'</span>: <span class="hljs-string">'https://github.com/huggingface/datasets/pull/2792'</span>, | |
| <span class="hljs-string">'diff_url'</span>: <span class="hljs-string">'https://github.com/huggingface/datasets/pull/2792.diff'</span>, | |
| <span class="hljs-string">'patch_url'</span>: <span class="hljs-string">'https://github.com/huggingface/datasets/pull/2792.patch'</span>}, | |
| <span class="hljs-string">'body'</span>: <span class="hljs-string">'[GooAQ](https://github.com/allenai/gooaq) dataset was recently updated after splits were added for the same. This PR contains new updated GooAQ with train/val/test splits and updated README as well.'</span>, | |
| <span class="hljs-string">'performed_via_github_app'</span>: <span class="hljs-literal">None</span>}]`,wrap:!1}}),w=new ua({props:{$$slots:{default:[bt]},$$scope:{ctx:j}}}),ls=new h({props:{code:"R0lUSFVCX1RPS0VOJTIwJTNEJTIweHh4JTIwJTIwJTIzJTIwQ29weSUyMHlvdXIlMjBHaXRIdWIlMjB0b2tlbiUyMGhlcmUlMEFoZWFkZXJzJTIwJTNEJTIwJTdCJTIyQXV0aG9yaXphdGlvbiUyMiUzQSUyMGYlMjJ0b2tlbiUyMCU3QkdJVEhVQl9UT0tFTiU3RCUyMiU3RA==",highlighted:`GITHUB_TOKEN = xxx <span class="hljs-comment"># Copy your GitHub token here</span> | |
| headers = {<span class="hljs-string">"Authorization"</span>: <span class="hljs-string">f"token <span class="hljs-subst">{GITHUB_TOKEN}</span>"</span>}`,wrap:!1}}),x=new ua({props:{warning:!0,$$slots:{default:[gt]},$$scope:{ctx:j}}}),ns=new h({props:{code:"aW1wb3J0JTIwdGltZSUwQWltcG9ydCUyMG1hdGglMEFmcm9tJTIwcGF0aGxpYiUyMGltcG9ydCUyMFBhdGglMEFpbXBvcnQlMjBwYW5kYXMlMjBhcyUyMHBkJTBBZnJvbSUyMHRxZG0ubm90ZWJvb2slMjBpbXBvcnQlMjB0cWRtJTBBJTBBJTBBZGVmJTIwZmV0Y2hfaXNzdWVzKCUwQSUyMCUyMCUyMCUyMG93bmVyJTNEJTIyaHVnZ2luZ2ZhY2UlMjIlMkMlMEElMjAlMjAlMjAlMjByZXBvJTNEJTIyZGF0YXNldHMlMjIlMkMlMEElMjAlMjAlMjAlMjBudW1faXNzdWVzJTNEMTBfMDAwJTJDJTBBJTIwJTIwJTIwJTIwcmF0ZV9saW1pdCUzRDVfMDAwJTJDJTBBJTIwJTIwJTIwJTIwaXNzdWVzX3BhdGglM0RQYXRoKCUyMi4lMjIpJTJDJTBBKSUzQSUwQSUyMCUyMCUyMCUyMGlmJTIwbm90JTIwaXNzdWVzX3BhdGguaXNfZGlyKCklM0ElMEElMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjBpc3N1ZXNfcGF0aC5ta2RpcihleGlzdF9vayUzRFRydWUpJTBBJTBBJTIwJTIwJTIwJTIwYmF0Y2glMjAlM0QlMjAlNUIlNUQlMEElMjAlMjAlMjAlMjBhbGxfaXNzdWVzJTIwJTNEJTIwJTVCJTVEJTBBJTIwJTIwJTIwJTIwcGVyX3BhZ2UlMjAlM0QlMjAxMDAlMjAlMjAlMjMlMjBOdW1iZXIlMjBvZiUyMGlzc3VlcyUyMHRvJTIwcmV0dXJuJTIwcGVyJTIwcGFnZSUwQSUyMCUyMCUyMCUyMG51bV9wYWdlcyUyMCUzRCUyMG1hdGguY2VpbChudW1faXNzdWVzJTIwJTJGJTIwcGVyX3BhZ2UpJTBBJTIwJTIwJTIwJTIwYmFzZV91cmwlMjAlM0QlMjAlMjJodHRwcyUzQSUyRiUyRmFwaS5naXRodWIuY29tJTJGcmVwb3MlMjIlMEElMEElMjAlMjAlMjAlMjBmb3IlMjBwYWdlJTIwaW4lMjB0cWRtKHJhbmdlKG51bV9wYWdlcykpJTNBJTBBJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIzJTIwUXVlcnklMjB3aXRoJTIwc3RhdGUlM0RhbGwlMjB0byUyMGdldCUyMGJvdGglMjBvcGVuJTIwYW5kJTIwY2xvc2VkJTIwaXNzdWVzJTBBJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwcXVlcnklMjAlM0QlMjBmJTIyaXNzdWVzJTNGcGFnZSUzRCU3QnBhZ2UlN0QlMjZwZXJfcGFnZSUzRCU3QnBlcl9wYWdlJTdEJTI2c3RhdGUlM0RhbGwlMjIlMEElMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjBpc3N1ZXMlMjAlM0QlMjByZXF1ZXN0cy5nZXQoZiUyMiU3QmJhc2VfdXJsJTdEJTJGJTdCb3duZXIlN0QlMkYlN0JyZXBvJTdEJTJGJTdCcXVlcnklN0QlMjIlMkMlMjBoZWFkZXJzJTNEaGVhZGVycyklMEElMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjBiYXRjaC5leHRlbmQoaXNzdWVzLmpzb24oKSklMEElMEElMjAlMjAlMjAlMjAlMjAlMjAlMjAlMjBpZiUyMG
xlbihiYXRjaCklMjAlM0UlMjByYXRlX2xpbWl0JTIwYW5kJTIwbGVuKGFsbF9pc3N1ZXMpJTIwJTNDJTIwbnVtX2lzc3VlcyUzQSUwQSUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMGFsbF9pc3N1ZXMuZXh0ZW5kKGJhdGNoKSUwQSUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMGJhdGNoJTIwJTNEJTIwJTVCJTVEJTIwJTIwJTIzJTIwRmx1c2glMjBiYXRjaCUyMGZvciUyMG5leHQlMjB0aW1lJTIwcGVyaW9kJTBBJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwcHJpbnQoZiUyMlJlYWNoZWQlMjBHaXRIdWIlMjByYXRlJTIwbGltaXQuJTIwU2xlZXBpbmclMjBmb3IlMjBvbmUlMjBob3VyJTIwLi4uJTIyKSUwQSUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMHRpbWUuc2xlZXAoNjAlMjAqJTIwNjAlMjAlMkIlMjAxKSUwQSUwQSUyMCUyMCUyMCUyMGFsbF9pc3N1ZXMuZXh0ZW5kKGJhdGNoKSUwQSUyMCUyMCUyMCUyMGRmJTIwJTNEJTIwcGQuRGF0YUZyYW1lLmZyb21fcmVjb3JkcyhhbGxfaXNzdWVzKSUwQSUyMCUyMCUyMCUyMGRmLnRvX2pzb24oZiUyMiU3Qmlzc3Vlc19wYXRoJTdEJTJGJTdCcmVwbyU3RC1pc3N1ZXMuanNvbmwlMjIlMkMlMjBvcmllbnQlM0QlMjJyZWNvcmRzJTIyJTJDJTIwbGluZXMlM0RUcnVlKSUwQSUyMCUyMCUyMCUyMHByaW50KCUwQSUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMGYlMjJEb3dubG9hZGVkJTIwYWxsJTIwdGhlJTIwaXNzdWVzJTIwZm9yJTIwJTdCcmVwbyU3RCElMjBEYXRhc2V0JTIwc3RvcmVkJTIwYXQlMjAlN0Jpc3N1ZXNfcGF0aCU3RCUyRiU3QnJlcG8lN0QtaXNzdWVzLmpzb25sJTIyJTBBJTIwJTIwJTIwJTIwKQ==",highlighted:`<span class="hljs-keyword">import</span> time | |
| <span class="hljs-keyword">import</span> math | |
| <span class="hljs-keyword">from</span> pathlib <span class="hljs-keyword">import</span> Path | |
| <span class="hljs-keyword">import</span> pandas <span class="hljs-keyword">as</span> pd | |
| <span class="hljs-keyword">from</span> tqdm.notebook <span class="hljs-keyword">import</span> tqdm | |
| <span class="hljs-keyword">def</span> <span class="hljs-title function_">fetch_issues</span>(<span class="hljs-params"> | |
| owner=<span class="hljs-string">"huggingface"</span>, | |
| repo=<span class="hljs-string">"datasets"</span>, | |
| num_issues=<span class="hljs-number">10_000</span>, | |
| rate_limit=<span class="hljs-number">5_000</span>, | |
| issues_path=Path(<span class="hljs-params"><span class="hljs-string">"."</span></span>), | |
| </span>): | |
| <span class="hljs-keyword">if</span> <span class="hljs-keyword">not</span> issues_path.is_dir(): | |
| issues_path.mkdir(exist_ok=<span class="hljs-literal">True</span>) | |
| batch = [] | |
| all_issues = [] | |
| per_page = <span class="hljs-number">100</span> <span class="hljs-comment"># Number of issues to return per page</span> | |
| num_pages = math.ceil(num_issues / per_page) | |
| base_url = <span class="hljs-string">"https://api.github.com/repos"</span> | |
| <span class="hljs-keyword">for</span> page <span class="hljs-keyword">in</span> tqdm(<span class="hljs-built_in">range</span>(num_pages)): | |
| <span class="hljs-comment"># Query with state=all to get both open and closed issues</span> | |
| query = <span class="hljs-string">f"issues?page=<span class="hljs-subst">{page}</span>&per_page=<span class="hljs-subst">{per_page}</span>&state=all"</span> | |
| issues = requests.get(<span class="hljs-string">f"<span class="hljs-subst">{base_url}</span>/<span class="hljs-subst">{owner}</span>/<span class="hljs-subst">{repo}</span>/<span class="hljs-subst">{query}</span>"</span>, headers=headers) | |
| batch.extend(issues.json()) | |
| <span class="hljs-keyword">if</span> <span class="hljs-built_in">len</span>(batch) > rate_limit <span class="hljs-keyword">and</span> <span class="hljs-built_in">len</span>(all_issues) < num_issues: | |
| all_issues.extend(batch) | |
| batch = [] <span class="hljs-comment"># Flush batch for next time period</span> | |
| <span class="hljs-built_in">print</span>(<span class="hljs-string">f"Reached GitHub rate limit. Sleeping for one hour ..."</span>) | |
| time.sleep(<span class="hljs-number">60</span> * <span class="hljs-number">60</span> + <span class="hljs-number">1</span>) | |
| all_issues.extend(batch) | |
| df = pd.DataFrame.from_records(all_issues) | |
| df.to_json(<span class="hljs-string">f"<span class="hljs-subst">{issues_path}</span>/<span class="hljs-subst">{repo}</span>-issues.jsonl"</span>, orient=<span class="hljs-string">"records"</span>, lines=<span class="hljs-literal">True</span>) | |
| <span class="hljs-built_in">print</span>( | |
| <span class="hljs-string">f"Downloaded all the issues for <span class="hljs-subst">{repo}</span>! Dataset stored at <span class="hljs-subst">{issues_path}</span>/<span class="hljs-subst">{repo}</span>-issues.jsonl"</span> | |
| )`,wrap:!1}}),is=new h({props:{code:"JTIzJTIwRGVwZW5kaW5nJTIwb24lMjB5b3VyJTIwaW50ZXJuZXQlMjBjb25uZWN0aW9uJTJDJTIwdGhpcyUyMGNhbiUyMHRha2UlMjBzZXZlcmFsJTIwbWludXRlcyUyMHRvJTIwcnVuLi4uJTBBZmV0Y2hfaXNzdWVzKCk=",highlighted:`<span class="hljs-comment"># Depending on your internet connection, this can take several minutes to run...</span> | |
| fetch_issues()`,wrap:!1}}),cs=new h({props:{code:"aXNzdWVzX2RhdGFzZXQlMjAlM0QlMjBsb2FkX2RhdGFzZXQoJTIyanNvbiUyMiUyQyUyMGRhdGFfZmlsZXMlM0QlMjJkYXRhc2V0cy1pc3N1ZXMuanNvbmwlMjIlMkMlMjBzcGxpdCUzRCUyMnRyYWluJTIyKSUwQWlzc3Vlc19kYXRhc2V0",highlighted:`issues_dataset = load_dataset(<span class="hljs-string">"json"</span>, data_files=<span class="hljs-string">"datasets-issues.jsonl"</span>, split=<span class="hljs-string">"train"</span>) | |
| issues_dataset`,wrap:!1}}),rs=new h({props:{code:"RGF0YXNldCglN0IlMEElMjAlMjAlMjAlMjBmZWF0dXJlcyUzQSUyMCU1Qid1cmwnJTJDJTIwJ3JlcG9zaXRvcnlfdXJsJyUyQyUyMCdsYWJlbHNfdXJsJyUyQyUyMCdjb21tZW50c191cmwnJTJDJTIwJ2V2ZW50c191cmwnJTJDJTIwJ2h0bWxfdXJsJyUyQyUyMCdpZCclMkMlMjAnbm9kZV9pZCclMkMlMjAnbnVtYmVyJyUyQyUyMCd0aXRsZSclMkMlMjAndXNlciclMkMlMjAnbGFiZWxzJyUyQyUyMCdzdGF0ZSclMkMlMjAnbG9ja2VkJyUyQyUyMCdhc3NpZ25lZSclMkMlMjAnYXNzaWduZWVzJyUyQyUyMCdtaWxlc3RvbmUnJTJDJTIwJ2NvbW1lbnRzJyUyQyUyMCdjcmVhdGVkX2F0JyUyQyUyMCd1cGRhdGVkX2F0JyUyQyUyMCdjbG9zZWRfYXQnJTJDJTIwJ2F1dGhvcl9hc3NvY2lhdGlvbiclMkMlMjAnYWN0aXZlX2xvY2tfcmVhc29uJyUyQyUyMCdwdWxsX3JlcXVlc3QnJTJDJTIwJ2JvZHknJTJDJTIwJ3RpbWVsaW5lX3VybCclMkMlMjAncGVyZm9ybWVkX3ZpYV9naXRodWJfYXBwJyU1RCUyQyUwQSUyMCUyMCUyMCUyMG51bV9yb3dzJTNBJTIwMzAxOSUwQSU3RCk=",highlighted:`Dataset({ | |
| features: [<span class="hljs-string">'url'</span>, <span class="hljs-string">'repository_url'</span>, <span class="hljs-string">'labels_url'</span>, <span class="hljs-string">'comments_url'</span>, <span class="hljs-string">'events_url'</span>, <span class="hljs-string">'html_url'</span>, <span class="hljs-string">'id'</span>, <span class="hljs-string">'node_id'</span>, <span class="hljs-string">'number'</span>, <span class="hljs-string">'title'</span>, <span class="hljs-string">'user'</span>, <span class="hljs-string">'labels'</span>, <span class="hljs-string">'state'</span>, <span class="hljs-string">'locked'</span>, <span class="hljs-string">'assignee'</span>, <span class="hljs-string">'assignees'</span>, <span class="hljs-string">'milestone'</span>, <span class="hljs-string">'comments'</span>, <span class="hljs-string">'created_at'</span>, <span class="hljs-string">'updated_at'</span>, <span class="hljs-string">'closed_at'</span>, <span class="hljs-string">'author_association'</span>, <span class="hljs-string">'active_lock_reason'</span>, <span class="hljs-string">'pull_request'</span>, <span class="hljs-string">'body'</span>, <span class="hljs-string">'timeline_url'</span>, <span class="hljs-string">'performed_via_github_app'</span>], | |
| num_rows: <span class="hljs-number">3019</span> | |
| })`,wrap:!1}}),Ms=new Ma({props:{title:"Limpando os dados",local:"limpando-os-dados",headingTag:"h2"}}),ys=new h({props:{code:"c2FtcGxlJTIwJTNEJTIwaXNzdWVzX2RhdGFzZXQuc2h1ZmZsZShzZWVkJTNENjY2KS5zZWxlY3QocmFuZ2UoMykpJTBBJTBBJTIzJTIwUHJpbnQlMjBvdXQlMjB0aGUlMjBVUkwlMjBhbmQlMjBwdWxsJTIwcmVxdWVzdCUyMGVudHJpZXMlMEFmb3IlMjB1cmwlMkMlMjBwciUyMGluJTIwemlwKHNhbXBsZSU1QiUyMmh0bWxfdXJsJTIyJTVEJTJDJTIwc2FtcGxlJTVCJTIycHVsbF9yZXF1ZXN0JTIyJTVEKSUzQSUwQSUyMCUyMCUyMCUyMHByaW50KGYlMjIlM0UlM0UlMjBVUkwlM0ElMjAlN0J1cmwlN0QlMjIpJTBBJTIwJTIwJTIwJTIwcHJpbnQoZiUyMiUzRSUzRSUyMFB1bGwlMjByZXF1ZXN0JTNBJTIwJTdCcHIlN0QlNUNuJTIyKQ==",highlighted:`sample = issues_dataset.shuffle(seed=<span class="hljs-number">666</span>).select(<span class="hljs-built_in">range</span>(<span class="hljs-number">3</span>)) | |
| <span class="hljs-comment"># Print out the URL and pull request entries</span> | |
| <span class="hljs-keyword">for</span> url, pr <span class="hljs-keyword">in</span> <span class="hljs-built_in">zip</span>(sample[<span class="hljs-string">"html_url"</span>], sample[<span class="hljs-string">"pull_request"</span>]): | |
| <span class="hljs-built_in">print</span>(<span class="hljs-string">f">> URL: <span class="hljs-subst">{url}</span>"</span>) | |
| <span class="hljs-built_in">print</span>(<span class="hljs-string">f">> Pull request: <span class="hljs-subst">{pr}</span>\\n"</span>)`,wrap:!1}}),hs=new h({props:{code:"JTNFJTNFJTIwVVJMJTNBJTIwaHR0cHMlM0ElMkYlMkZnaXRodWIuY29tJTJGaHVnZ2luZ2ZhY2UlMkZkYXRhc2V0cyUyRnB1bGwlMkY4NTAlMEElM0UlM0UlMjBQdWxsJTIwcmVxdWVzdCUzQSUyMCU3Qid1cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGYXBpLmdpdGh1Yi5jb20lMkZyZXBvcyUyRmh1Z2dpbmdmYWNlJTJGZGF0YXNldHMlMkZwdWxscyUyRjg1MCclMkMlMjAnaHRtbF91cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGZ2l0aHViLmNvbSUyRmh1Z2dpbmdmYWNlJTJGZGF0YXNldHMlMkZwdWxsJTJGODUwJyUyQyUyMCdkaWZmX3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZnaXRodWIuY29tJTJGaHVnZ2luZ2ZhY2UlMkZkYXRhc2V0cyUyRnB1bGwlMkY4NTAuZGlmZiclMkMlMjAncGF0Y2hfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmdpdGh1Yi5jb20lMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGcHVsbCUyRjg1MC5wYXRjaCclN0QlMEElMEElM0UlM0UlMjBVUkwlM0ElMjBodHRwcyUzQSUyRiUyRmdpdGh1Yi5jb20lMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGaXNzdWVzJTJGMjc3MyUwQSUzRSUzRSUyMFB1bGwlMjByZXF1ZXN0JTNBJTIwTm9uZSUwQSUwQSUzRSUzRSUyMFVSTCUzQSUyMGh0dHBzJTNBJTJGJTJGZ2l0aHViLmNvbSUyRmh1Z2dpbmdmYWNlJTJGZGF0YXNldHMlMkZwdWxsJTJGNzgzJTBBJTNFJTNFJTIwUHVsbCUyMHJlcXVlc3QlM0ElMjAlN0IndXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmFwaS5naXRodWIuY29tJTJGcmVwb3MlMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGcHVsbHMlMkY3ODMnJTJDJTIwJ2h0bWxfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmdpdGh1Yi5jb20lMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGcHVsbCUyRjc4MyclMkMlMjAnZGlmZl91cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGZ2l0aHViLmNvbSUyRmh1Z2dpbmdmYWNlJTJGZGF0YXNldHMlMkZwdWxsJTJGNzgzLmRpZmYnJTJDJTIwJ3BhdGNoX3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZnaXRodWIuY29tJTJGaHVnZ2luZ2ZhY2UlMkZkYXRhc2V0cyUyRnB1bGwlMkY3ODMucGF0Y2gnJTdE",highlighted:`>> URL: https://github.com/huggingface/datasets/pull/<span class="hljs-number">850</span> | |
| >> Pull request: {<span class="hljs-string">'url'</span>: <span class="hljs-string">'https://api.github.com/repos/huggingface/datasets/pulls/850'</span>, <span class="hljs-string">'html_url'</span>: <span class="hljs-string">'https://github.com/huggingface/datasets/pull/850'</span>, <span class="hljs-string">'diff_url'</span>: <span class="hljs-string">'https://github.com/huggingface/datasets/pull/850.diff'</span>, <span class="hljs-string">'patch_url'</span>: <span class="hljs-string">'https://github.com/huggingface/datasets/pull/850.patch'</span>} | |
| >> URL: https://github.com/huggingface/datasets/issues/<span class="hljs-number">2773</span> | |
| >> Pull request: <span class="hljs-literal">None</span> | |
| >> URL: https://github.com/huggingface/datasets/pull/<span class="hljs-number">783</span> | |
| >> Pull request: {<span class="hljs-string">'url'</span>: <span class="hljs-string">'https://api.github.com/repos/huggingface/datasets/pulls/783'</span>, <span class="hljs-string">'html_url'</span>: <span class="hljs-string">'https://github.com/huggingface/datasets/pull/783'</span>, <span class="hljs-string">'diff_url'</span>: <span class="hljs-string">'https://github.com/huggingface/datasets/pull/783.diff'</span>, <span class="hljs-string">'patch_url'</span>: <span class="hljs-string">'https://github.com/huggingface/datasets/pull/783.patch'</span>}`,wrap:!1}}),Us=new h({props:{code:"aXNzdWVzX2RhdGFzZXQlMjAlM0QlMjBpc3N1ZXNfZGF0YXNldC5tYXAoJTBBJTIwJTIwJTIwJTIwbGFtYmRhJTIweCUzQSUyMCU3QiUyMmlzX3B1bGxfcmVxdWVzdCUyMiUzQSUyMEZhbHNlJTIwaWYlMjB4JTVCJTIycHVsbF9yZXF1ZXN0JTIyJTVEJTIwaXMlMjBOb25lJTIwZWxzZSUyMFRydWUlN0QlMEEp",highlighted:`issues_dataset = issues_dataset.<span class="hljs-built_in">map</span>( | |
| <span class="hljs-keyword">lambda</span> x: {<span class="hljs-string">"is_pull_request"</span>: <span class="hljs-literal">False</span> <span class="hljs-keyword">if</span> x[<span class="hljs-string">"pull_request"</span>] <span class="hljs-keyword">is</span> <span class="hljs-literal">None</span> <span class="hljs-keyword">else</span> <span class="hljs-literal">True</span>} | |
| )`,wrap:!1}}),Z=new ua({props:{$$slots:{default:[ft]},$$scope:{ctx:j}}}),gs=new Ma({props:{title:"Aumentando o conjunto de dados",local:"aumentando-o-conjunto-de-dados",headingTag:"h2"}}),xs=new h({props:{code:"aXNzdWVfbnVtYmVyJTIwJTNEJTIwMjc5MiUwQXVybCUyMCUzRCUyMGYlMjJodHRwcyUzQSUyRiUyRmFwaS5naXRodWIuY29tJTJGcmVwb3MlMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGaXNzdWVzJTJGJTdCaXNzdWVfbnVtYmVyJTdEJTJGY29tbWVudHMlMjIlMEFyZXNwb25zZSUyMCUzRCUyMHJlcXVlc3RzLmdldCh1cmwlMkMlMjBoZWFkZXJzJTNEaGVhZGVycyklMEFyZXNwb25zZS5qc29uKCk=",highlighted:`issue_number = <span class="hljs-number">2792</span> | |
| url = <span class="hljs-string">f"https://api.github.com/repos/huggingface/datasets/issues/<span class="hljs-subst">{issue_number}</span>/comments"</span> | |
| response = requests.get(url, headers=headers) | |
| response.json()`,wrap:!1}}),Zs=new h({props:{code:"JTVCJTdCJ3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnJlcG9zJTJGaHVnZ2luZ2ZhY2UlMkZkYXRhc2V0cyUyRmlzc3VlcyUyRmNvbW1lbnRzJTJGODk3NTk0MTI4JyUyQyUwQSUyMCUyMCdodG1sX3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZnaXRodWIuY29tJTJGaHVnZ2luZ2ZhY2UlMkZkYXRhc2V0cyUyRnB1bGwlMkYyNzkyJTIzaXNzdWVjb21tZW50LTg5NzU5NDEyOCclMkMlMEElMjAlMjAnaXNzdWVfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmFwaS5naXRodWIuY29tJTJGcmVwb3MlMkZodWdnaW5nZmFjZSUyRmRhdGFzZXRzJTJGaXNzdWVzJTJGMjc5MiclMkMlMEElMjAlMjAnaWQnJTNBJTIwODk3NTk0MTI4JTJDJTBBJTIwJTIwJ25vZGVfaWQnJTNBJTIwJ0lDX2t3RE9EdW56cHM0MWdETVEnJTJDJTBBJTIwJTIwJ3VzZXInJTNBJTIwJTdCJ2xvZ2luJyUzQSUyMCdiaGF2aXR2eWFtYWxpayclMkMlMEElMjAlMjAlMjAnaWQnJTNBJTIwMTk3MTg4MTglMkMlMEElMjAlMjAlMjAnbm9kZV9pZCclM0ElMjAnTURRNlZYTmxjakU1TnpFNE9ERTQnJTJDJTBBJTIwJTIwJTIwJ2F2YXRhcl91cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGYXZhdGFycy5naXRodWJ1c2VyY29udGVudC5jb20lMkZ1JTJGMTk3MTg4MTglM0Z2JTNENCclMkMlMEElMjAlMjAlMjAnZ3JhdmF0YXJfaWQnJTNBJTIwJyclMkMlMEElMjAlMjAlMjAndXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmFwaS5naXRodWIuY29tJTJGdXNlcnMlMkZiaGF2aXR2eWFtYWxpayclMkMlMEElMjAlMjAlMjAnaHRtbF91cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGZ2l0aHViLmNvbSUyRmJoYXZpdHZ5YW1hbGlrJyUyQyUwQSUyMCUyMCUyMCdmb2xsb3dlcnNfdXJsJyUzQSUyMCdodHRwcyUzQSUyRiUyRmFwaS5naXRodWIuY29tJTJGdXNlcnMlMkZiaGF2aXR2eWFtYWxpayUyRmZvbGxvd2VycyclMkMlMEElMjAlMjAlMjAnZm9sbG93aW5nX3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnVzZXJzJTJGYmhhdml0dnlhbWFsaWslMkZmb2xsb3dpbmclN0IlMkZvdGhlcl91c2VyJTdEJyUyQyUwQSUyMCUyMCUyMCdnaXN0c191cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGYXBpLmdpdGh1Yi5jb20lMkZ1c2VycyUyRmJoYXZpdHZ5YW1hbGlrJTJGZ2lzdHMlN0IlMkZnaXN0X2lkJTdEJyUyQyUwQSUyMCUyMCUyMCdzdGFycmVkX3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnVzZXJzJTJGYmhhdml0dnlhbWFsaWslMkZzdGFycmVkJTdCJTJGb3duZXIlN0QlN0IlMkZyZXBvJTdEJyUyQyUwQSUyMCUyMCUyMCdzdWJzY3JpcHRpb25zX3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnVzZXJzJTJGYmhhdml0dnlhbWFsaWslMkZzdWJzY3JpcHRpb25zJyUyQyUwQSUyMCUyMCUyMCdvcmdhbml6YXRpb25zX3VybCclM0E
lMjAnaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnVzZXJzJTJGYmhhdml0dnlhbWFsaWslMkZvcmdzJyUyQyUwQSUyMCUyMCUyMCdyZXBvc191cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGYXBpLmdpdGh1Yi5jb20lMkZ1c2VycyUyRmJoYXZpdHZ5YW1hbGlrJTJGcmVwb3MnJTJDJTBBJTIwJTIwJTIwJ2V2ZW50c191cmwnJTNBJTIwJ2h0dHBzJTNBJTJGJTJGYXBpLmdpdGh1Yi5jb20lMkZ1c2VycyUyRmJoYXZpdHZ5YW1hbGlrJTJGZXZlbnRzJTdCJTJGcHJpdmFjeSU3RCclMkMlMEElMjAlMjAlMjAncmVjZWl2ZWRfZXZlbnRzX3VybCclM0ElMjAnaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnVzZXJzJTJGYmhhdml0dnlhbWFsaWslMkZyZWNlaXZlZF9ldmVudHMnJTJDJTBBJTIwJTIwJTIwJ3R5cGUnJTNBJTIwJ1VzZXInJTJDJTBBJTIwJTIwJTIwJ3NpdGVfYWRtaW4nJTNBJTIwRmFsc2UlN0QlMkMlMEElMjAlMjAnY3JlYXRlZF9hdCclM0ElMjAnMjAyMS0wOC0xMlQxMiUzQTIxJTNBNTJaJyUyQyUwQSUyMCUyMCd1cGRhdGVkX2F0JyUzQSUyMCcyMDIxLTA4LTEyVDEyJTNBMzElM0ExN1onJTJDJTBBJTIwJTIwJ2F1dGhvcl9hc3NvY2lhdGlvbiclM0ElMjAnQ09OVFJJQlVUT1InJTJDJTBBJTIwJTIwJ2JvZHknJTNBJTIwJTIyJTQwYWxiZXJ0dmlsbGFub3ZhJTIwbXklMjB0ZXN0cyUyMGFyZSUyMGZhaWxpbmclMjBoZXJlJTNBJTVDciU1Q24lNjAlNjAlNjAlNUNyJTVDbmRhdGFzZXRfbmFtZSUyMCUzRCUyMCdnb29hcSclNUNyJTVDbiU1Q3IlNUNuJTIwJTIwJTIwJTIwZGVmJTIwdGVzdF9sb2FkX2RhdGFzZXQoc2VsZiUyQyUyMGRhdGFzZXRfbmFtZSklM0ElNUNyJTVDbiUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMGNvbmZpZ3MlMjAlM0QlMjBzZWxmLmRhdGFzZXRfdGVzdGVyLmxvYWRfYWxsX2NvbmZpZ3MoZGF0YXNldF9uYW1lJTJDJTIwaXNfbG9jYWwlM0RUcnVlKSU1QiUzQTElNUQlNUNyJTVDbiUzRSUyMCUyMCUyMCUyMCUyMCUyMCUyMHNlbGYuZGF0YXNldF90ZXN0ZXIuY2hlY2tfbG9hZF9kYXRhc2V0KGRhdGFzZXRfbmFtZSUyQyUyMGNvbmZpZ3MlMkMlMjBpc19sb2NhbCUzRFRydWUlMkMlMjB1c2VfbG9jYWxfZHVtbXlfZGF0YSUzRFRydWUpJTVDciU1Q24lNUNyJTVDbnRlc3RzJTJGdGVzdF9kYXRhc2V0X2NvbW1vbi5weSUzQTIzNCUzQSUyMCU1Q3IlNUNuXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMCU1Q3IlNUNudGVzdHMlMkZ0ZXN0X2RhdGFzZXRfY29tbW9uLnB5JTNBMTg3JTNBJTIwaW4lMjBjaGVja19sb2FkX2RhdGFzZXQlNUNyJTVDbiUyMCUyMCUyMCUyMHNlbGYucGFyZW50LmFzc2VydFRydWUobGVuKGRhdGFzZXQlNUJzcGxpdCU1RCklMjAlM0UlMjAwKSU1Q3I
lNUNuRSUyMCUyMCUyMEFzc2VydGlvbkVycm9yJTNBJTIwRmFsc2UlMjBpcyUyMG5vdCUyMHRydWUlNUNyJTVDbiU2MCU2MCU2MCU1Q3IlNUNuV2hlbiUyMEklMjB0cnklMjBsb2FkaW5nJTIwZGF0YXNldCUyMG9uJTIwbG9jYWwlMjBtYWNoaW5lJTIwaXQlMjB3b3JrcyUyMGZpbmUuJTIwQW55JTIwc3VnZ2VzdGlvbnMlMjBvbiUyMGhvdyUyMGNhbiUyMEklMjBhdm9pZCUyMHRoaXMlMjBlcnJvciUzRiUyMiUyQyUwQSUyMCUyMCdwZXJmb3JtZWRfdmlhX2dpdGh1Yl9hcHAnJTNBJTIwTm9uZSU3RCU1RA==",highlighted:`[{<span class="hljs-string">'url'</span>: <span class="hljs-string">'https://api.github.com/repos/huggingface/datasets/issues/comments/897594128'</span>, | |
| <span class="hljs-string">'html_url'</span>: <span class="hljs-string">'https://github.com/huggingface/datasets/pull/2792#issuecomment-897594128'</span>, | |
| <span class="hljs-string">'issue_url'</span>: <span class="hljs-string">'https://api.github.com/repos/huggingface/datasets/issues/2792'</span>, | |
| <span class="hljs-string">'id'</span>: <span class="hljs-number">897594128</span>, | |
| <span class="hljs-string">'node_id'</span>: <span class="hljs-string">'IC_kwDODunzps41gDMQ'</span>, | |
| <span class="hljs-string">'user'</span>: {<span class="hljs-string">'login'</span>: <span class="hljs-string">'bhavitvyamalik'</span>, | |
| <span class="hljs-string">'id'</span>: <span class="hljs-number">19718818</span>, | |
| <span class="hljs-string">'node_id'</span>: <span class="hljs-string">'MDQ6VXNlcjE5NzE4ODE4'</span>, | |
| <span class="hljs-string">'avatar_url'</span>: <span class="hljs-string">'https://avatars.githubusercontent.com/u/19718818?v=4'</span>, | |
| <span class="hljs-string">'gravatar_id'</span>: <span class="hljs-string">''</span>, | |
| <span class="hljs-string">'url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik'</span>, | |
| <span class="hljs-string">'html_url'</span>: <span class="hljs-string">'https://github.com/bhavitvyamalik'</span>, | |
| <span class="hljs-string">'followers_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/followers'</span>, | |
| <span class="hljs-string">'following_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/following{/other_user}'</span>, | |
| <span class="hljs-string">'gists_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/gists{/gist_id}'</span>, | |
| <span class="hljs-string">'starred_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/starred{/owner}{/repo}'</span>, | |
| <span class="hljs-string">'subscriptions_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/subscriptions'</span>, | |
| <span class="hljs-string">'organizations_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/orgs'</span>, | |
| <span class="hljs-string">'repos_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/repos'</span>, | |
| <span class="hljs-string">'events_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/events{/privacy}'</span>, | |
| <span class="hljs-string">'received_events_url'</span>: <span class="hljs-string">'https://api.github.com/users/bhavitvyamalik/received_events'</span>, | |
| <span class="hljs-string">'type'</span>: <span class="hljs-string">'User'</span>, | |
| <span class="hljs-string">'site_admin'</span>: <span class="hljs-literal">False</span>}, | |
| <span class="hljs-string">'created_at'</span>: <span class="hljs-string">'2021-08-12T12:21:52Z'</span>, | |
| <span class="hljs-string">'updated_at'</span>: <span class="hljs-string">'2021-08-12T12:31:17Z'</span>, | |
| <span class="hljs-string">'author_association'</span>: <span class="hljs-string">'CONTRIBUTOR'</span>, | |
| <span class="hljs-string">'body'</span>: <span class="hljs-string">"@albertvillanova my tests are failing here:\\r\\n\`\`\`\\r\\ndataset_name = 'gooaq'\\r\\n\\r\\n def test_load_dataset(self, dataset_name):\\r\\n configs = self.dataset_tester.load_all_configs(dataset_name, is_local=True)[:1]\\r\\n> self.dataset_tester.check_load_dataset(dataset_name, configs, is_local=True, use_local_dummy_data=True)\\r\\n\\r\\ntests/test_dataset_common.py:234: \\r\\n_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ \\r\\ntests/test_dataset_common.py:187: in check_load_dataset\\r\\n self.parent.assertTrue(len(dataset[split]) > 0)\\r\\nE AssertionError: False is not true\\r\\n\`\`\`\\r\\nWhen I try loading dataset on local machine it works fine. Any suggestions on how can I avoid this error?"</span>, | |
| <span class="hljs-string">'performed_via_github_app'</span>: <span class="hljs-literal">None</span>}]`,wrap:!1}}),Rs=new h({props:{code:"ZGVmJTIwZ2V0X2NvbW1lbnRzKGlzc3VlX251bWJlciklM0ElMEElMjAlMjAlMjAlMjB1cmwlMjAlM0QlMjBmJTIyaHR0cHMlM0ElMkYlMkZhcGkuZ2l0aHViLmNvbSUyRnJlcG9zJTJGaHVnZ2luZ2ZhY2UlMkZkYXRhc2V0cyUyRmlzc3VlcyUyRiU3Qmlzc3VlX251bWJlciU3RCUyRmNvbW1lbnRzJTIyJTBBJTIwJTIwJTIwJTIwcmVzcG9uc2UlMjAlM0QlMjByZXF1ZXN0cy5nZXQodXJsJTJDJTIwaGVhZGVycyUzRGhlYWRlcnMpJTBBJTIwJTIwJTIwJTIwcmV0dXJuJTIwJTVCciU1QiUyMmJvZHklMjIlNUQlMjBmb3IlMjByJTIwaW4lMjByZXNwb25zZS5qc29uKCklNUQlMEElMEElMEElMjMlMjBUZXN0JTIwb3VyJTIwZnVuY3Rpb24lMjB3b3JrcyUyMGFzJTIwZXhwZWN0ZWQlMEFnZXRfY29tbWVudHMoMjc5Mik=",highlighted:`<span class="hljs-keyword">def</span> <span class="hljs-title function_">get_comments</span>(<span class="hljs-params">issue_number</span>): | |
| url = <span class="hljs-string">f"https://api.github.com/repos/huggingface/datasets/issues/<span class="hljs-subst">{issue_number}</span>/comments"</span> | |
| response = requests.get(url, headers=headers) | |
| <span class="hljs-keyword">return</span> [r[<span class="hljs-string">"body"</span>] <span class="hljs-keyword">for</span> r <span class="hljs-keyword">in</span> response.json()] | |
| <span class="hljs-comment"># Test our function works as expected</span> | |
| get_comments(<span class="hljs-number">2792</span>)`,wrap:!1}}),vs=new h({props:{code:"JTVCJTIyJTQwYWxiZXJ0dmlsbGFub3ZhJTIwbXklMjB0ZXN0cyUyMGFyZSUyMGZhaWxpbmclMjBoZXJlJTNBJTVDciU1Q24lNjAlNjAlNjAlNUNyJTVDbmRhdGFzZXRfbmFtZSUyMCUzRCUyMCdnb29hcSclNUNyJTVDbiU1Q3IlNUNuJTIwJTIwJTIwJTIwZGVmJTIwdGVzdF9sb2FkX2RhdGFzZXQoc2VsZiUyQyUyMGRhdGFzZXRfbmFtZSklM0ElNUNyJTVDbiUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMGNvbmZpZ3MlMjAlM0QlMjBzZWxmLmRhdGFzZXRfdGVzdGVyLmxvYWRfYWxsX2NvbmZpZ3MoZGF0YXNldF9uYW1lJTJDJTIwaXNfbG9jYWwlM0RUcnVlKSU1QiUzQTElNUQlNUNyJTVDbiUzRSUyMCUyMCUyMCUyMCUyMCUyMCUyMHNlbGYuZGF0YXNldF90ZXN0ZXIuY2hlY2tfbG9hZF9kYXRhc2V0KGRhdGFzZXRfbmFtZSUyQyUyMGNvbmZpZ3MlMkMlMjBpc19sb2NhbCUzRFRydWUlMkMlMjB1c2VfbG9jYWxfZHVtbXlfZGF0YSUzRFRydWUpJTVDciU1Q24lNUNyJTVDbnRlc3RzJTJGdGVzdF9kYXRhc2V0X2NvbW1vbi5weSUzQTIzNCUzQSUyMCU1Q3IlNUNuXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMF8lMjBfJTIwXyUyMCU1Q3IlNUNudGVzdHMlMkZ0ZXN0X2RhdGFzZXRfY29tbW9uLnB5JTNBMTg3JTNBJTIwaW4lMjBjaGVja19sb2FkX2RhdGFzZXQlNUNyJTVDbiUyMCUyMCUyMCUyMHNlbGYucGFyZW50LmFzc2VydFRydWUobGVuKGRhdGFzZXQlNUJzcGxpdCU1RCklMjAlM0UlMjAwKSU1Q3IlNUNuRSUyMCUyMCUyMEFzc2VydGlvbkVycm9yJTNBJTIwRmFsc2UlMjBpcyUyMG5vdCUyMHRydWUlNUNyJTVDbiU2MCU2MCU2MCU1Q3IlNUNuV2hlbiUyMEklMjB0cnklMjBsb2FkaW5nJTIwZGF0YXNldCUyMG9uJTIwbG9jYWwlMjBtYWNoaW5lJTIwaXQlMjB3b3JrcyUyMGZpbmUuJTIwQW55JTIwc3VnZ2VzdGlvbnMlMjBvbiUyMGhvdyUyMGNhbiUyMEklMjBhdm9pZCUyMHRoaXMlMjBlcnJvciUzRiUyMiU1RA==",highlighted:'[<span class="hljs-string">"@albertvillanova my tests are failing here:\\r\\n```\\r\\ndataset_name = 'gooaq'\\r\\n\\r\\n def test_load_dataset(self, dataset_name):\\r\\n configs = self.dataset_tester.load_all_configs(dataset_name, is_local=True)[:1]\\r\\n> self.dataset_tester.check_load_dataset(dataset_name, configs, is_local=True, use_local_dummy_data=True)\\r\\n\\r\\ntests/test_dataset_common.py:234: \\r\\n_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ 
_ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ _ \\r\\ntests/test_dataset_common.py:187: in check_load_dataset\\r\\n self.parent.assertTrue(len(dataset[split]) > 0)\\r\\nE AssertionError: False is not true\\r\\n```\\r\\nWhen I try loading dataset on local machine it works fine. Any suggestions on how can I avoid this error?"</span>]',wrap:!1}}),Xs=new h({props:{code:"JTIzJTIwRGVwZW5kaW5nJTIwb24lMjB5b3VyJTIwaW50ZXJuZXQlMjBjb25uZWN0aW9uJTJDJTIwdGhpcyUyMGNhbiUyMHRha2UlMjBhJTIwZmV3JTIwbWludXRlcy4uLiUwQWlzc3Vlc193aXRoX2NvbW1lbnRzX2RhdGFzZXQlMjAlM0QlMjBpc3N1ZXNfZGF0YXNldC5tYXAoJTBBJTIwJTIwJTIwJTIwbGFtYmRhJTIweCUzQSUyMCU3QiUyMmNvbW1lbnRzJTIyJTNBJTIwZ2V0X2NvbW1lbnRzKHglNUIlMjJudW1iZXIlMjIlNUQpJTdEJTBBKQ==",highlighted:`<span class="hljs-comment"># Depending on your internet connection, this can take a few minutes...</span> | |
| issues_with_comments_dataset = issues_dataset.<span class="hljs-built_in">map</span>( | |
| <span class="hljs-keyword">lambda</span> x: {<span class="hljs-string">"comments"</span>: get_comments(x[<span class="hljs-string">"number"</span>])} | |
| )`,wrap:!1}}),Ns=new h({props:{code:"aXNzdWVzX3dpdGhfY29tbWVudHNfZGF0YXNldC50b19qc29uKCUyMmlzc3Vlcy1kYXRhc2V0cy13aXRoLWNvbW1lbnRzLmpzb25sJTIyKQ==",highlighted:'issues_with_comments_dataset.to_json(<span class="hljs-string">"issues-datasets-with-comments.jsonl"</span>)',wrap:!1}}),_s=new Ma({props:{title:"Carregando o conjunto de dados para o Hugging Face Hub",local:"carregando-o-conjunto-de-dados-para-o-hugging-face-hub",headingTag:"h2"}}),ks=new Tt({props:{id:"HaN6qCr_Afc"}}),Vs=new h({props:{code:"ZnJvbSUyMGh1Z2dpbmdmYWNlX2h1YiUyMGltcG9ydCUyMGxpc3RfZGF0YXNldHMlMEElMEFhbGxfZGF0YXNldHMlMjAlM0QlMjBsaXN0X2RhdGFzZXRzKCklMEFwcmludChmJTIyTnVtYmVyJTIwb2YlMjBkYXRhc2V0cyUyMG9uJTIwSHViJTNBJTIwJTdCbGVuKGFsbF9kYXRhc2V0cyklN0QlMjIpJTBBcHJpbnQoYWxsX2RhdGFzZXRzJTVCMCU1RCk=",highlighted:`<span class="hljs-keyword">from</span> huggingface_hub <span class="hljs-keyword">import</span> list_datasets | |
| all_datasets = list_datasets() | |
| <span class="hljs-built_in">print</span>(<span class="hljs-string">f"Number of datasets on Hub: <span class="hljs-subst">{<span class="hljs-built_in">len</span>(all_datasets)}</span>"</span>) | |
| <span class="hljs-built_in">print</span>(all_datasets[<span class="hljs-number">0</span>])`,wrap:!1}}),$s=new h({props:{code:"TnVtYmVyJTIwb2YlMjBkYXRhc2V0cyUyMG9uJTIwSHViJTNBJTIwMTQ4NyUwQURhdGFzZXQlMjBOYW1lJTNBJTIwYWNyb255bV9pZGVudGlmaWNhdGlvbiUyQyUyMFRhZ3MlM0ElMjAlNUInYW5ub3RhdGlvbnNfY3JlYXRvcnMlM0FleHBlcnQtZ2VuZXJhdGVkJyUyQyUyMCdsYW5ndWFnZV9jcmVhdG9ycyUzQWZvdW5kJyUyQyUyMCdsYW5ndWFnZXMlM0FlbiclMkMlMjAnbGljZW5zZXMlM0FtaXQnJTJDJTIwJ211bHRpbGluZ3VhbGl0eSUzQW1vbm9saW5ndWFsJyUyQyUyMCdzaXplX2NhdGVnb3JpZXMlM0ExMEslM0NuJTNDMTAwSyclMkMlMjAnc291cmNlX2RhdGFzZXRzJTNBb3JpZ2luYWwnJTJDJTIwJ3Rhc2tfY2F0ZWdvcmllcyUzQXN0cnVjdHVyZS1wcmVkaWN0aW9uJyUyQyUyMCd0YXNrX2lkcyUzQXN0cnVjdHVyZS1wcmVkaWN0aW9uLW90aGVyLWFjcm9ueW0taWRlbnRpZmljYXRpb24nJTVE",highlighted:`Number of datasets on Hub: <span class="hljs-number">1487</span> | |
| Dataset Name: acronym_identification, Tags: [<span class="hljs-string">'annotations_creators:expert-generated'</span>, <span class="hljs-string">'language_creators:found'</span>, <span class="hljs-string">'languages:en'</span>, <span class="hljs-string">'licenses:mit'</span>, <span class="hljs-string">'multilinguality:monolingual'</span>, <span class="hljs-string">'size_categories:10K<n<100K'</span>, <span class="hljs-string">'source_datasets:original'</span>, <span class="hljs-string">'task_categories:structure-prediction'</span>, <span class="hljs-string">'task_ids:structure-prediction-other-acronym-identification'</span>]`,wrap:!1}}),Ws=new h({props:{code:"ZnJvbSUyMGh1Z2dpbmdmYWNlX2h1YiUyMGltcG9ydCUyMG5vdGVib29rX2xvZ2luJTBBJTBBbm90ZWJvb2tfbG9naW4oKQ==",highlighted:`<span class="hljs-keyword">from</span> huggingface_hub <span class="hljs-keyword">import</span> notebook_login | |
| notebook_login()`,wrap:!1}}),Qs=new h({props:{code:"aHVnZ2luZ2ZhY2UtY2xpJTIwbG9naW4=",highlighted:"huggingface-cli login",wrap:!1}}),Es=new h({props:{code:"ZnJvbSUyMGh1Z2dpbmdmYWNlX2h1YiUyMGltcG9ydCUyMGNyZWF0ZV9yZXBvJTBBJTBBcmVwb191cmwlMjAlM0QlMjBjcmVhdGVfcmVwbyhuYW1lJTNEJTIyZ2l0aHViLWlzc3VlcyUyMiUyQyUyMHJlcG9fdHlwZSUzRCUyMmRhdGFzZXQlMjIpJTBBcmVwb191cmw=",highlighted:`<span class="hljs-keyword">from</span> huggingface_hub <span class="hljs-keyword">import</span> create_repo | |
| repo_url = create_repo(name=<span class="hljs-string">"github-issues"</span>, repo_type=<span class="hljs-string">"dataset"</span>) | |
| repo_url`,wrap:!1}}),Ss=new h({props:{code:"J2h0dHBzJTNBJTJGJTJGaHVnZ2luZ2ZhY2UuY28lMkZkYXRhc2V0cyUyRmxld3R1biUyRmdpdGh1Yi1pc3N1ZXMn",highlighted:'<span class="hljs-string">'https://huggingface.co/datasets/lewtun/github-issues'</span>',wrap:!1}}),R=new ua({props:{$$slots:{default:[wt]},$$scope:{ctx:j}}}),Ls=new h({props:{code:"ZnJvbSUyMGh1Z2dpbmdmYWNlX2h1YiUyMGltcG9ydCUyMFJlcG9zaXRvcnklMEElMEFyZXBvJTIwJTNEJTIwUmVwb3NpdG9yeShsb2NhbF9kaXIlM0QlMjJnaXRodWItaXNzdWVzJTIyJTJDJTIwY2xvbmVfZnJvbSUzRHJlcG9fdXJsKSUwQSFjcCUyMGRhdGFzZXRzLWlzc3Vlcy13aXRoLWNvbW1lbnRzLmpzb25sJTIwZ2l0aHViLWlzc3VlcyUyRg==",highlighted:`<span class="hljs-keyword">from</span> huggingface_hub <span class="hljs-keyword">import</span> Repository | |
| repo = Repository(local_dir=<span class="hljs-string">"github-issues"</span>, clone_from=repo_url) | |
| !cp datasets-issues-<span class="hljs-keyword">with</span>-comments.jsonl github-issues/`,wrap:!1}}),Ps=new h({props:{code:"cmVwby5sZnNfdHJhY2soJTIyKi5qc29ubCUyMik=",highlighted:'repo.lfs_track(<span class="hljs-string">"*.jsonl"</span>)',wrap:!1}}),Ks=new h({props:{code:"cmVwby5wdXNoX3RvX2h1Yigp",highlighted:"repo.push_to_hub()",wrap:!1}}),ea=new h({props:{code:"cmVtb3RlX2RhdGFzZXQlMjAlM0QlMjBsb2FkX2RhdGFzZXQoJTIybGV3dHVuJTJGZ2l0aHViLWlzc3VlcyUyMiUyQyUyMHNwbGl0JTNEJTIydHJhaW4lMjIpJTBBcmVtb3RlX2RhdGFzZXQ=",highlighted:`remote_dataset = load_dataset(<span class="hljs-string">"lewtun/github-issues"</span>, split=<span class="hljs-string">"train"</span>) | |
| remote_dataset`,wrap:!1}}),la=new h({props:{code:"RGF0YXNldCglN0IlMEElMjAlMjAlMjAlMjBmZWF0dXJlcyUzQSUyMCU1Qid1cmwnJTJDJTIwJ3JlcG9zaXRvcnlfdXJsJyUyQyUyMCdsYWJlbHNfdXJsJyUyQyUyMCdjb21tZW50c191cmwnJTJDJTIwJ2V2ZW50c191cmwnJTJDJTIwJ2h0bWxfdXJsJyUyQyUyMCdpZCclMkMlMjAnbm9kZV9pZCclMkMlMjAnbnVtYmVyJyUyQyUyMCd0aXRsZSclMkMlMjAndXNlciclMkMlMjAnbGFiZWxzJyUyQyUyMCdzdGF0ZSclMkMlMjAnbG9ja2VkJyUyQyUyMCdhc3NpZ25lZSclMkMlMjAnYXNzaWduZWVzJyUyQyUyMCdtaWxlc3RvbmUnJTJDJTIwJ2NvbW1lbnRzJyUyQyUyMCdjcmVhdGVkX2F0JyUyQyUyMCd1cGRhdGVkX2F0JyUyQyUyMCdjbG9zZWRfYXQnJTJDJTIwJ2F1dGhvcl9hc3NvY2lhdGlvbiclMkMlMjAnYWN0aXZlX2xvY2tfcmVhc29uJyUyQyUyMCdwdWxsX3JlcXVlc3QnJTJDJTIwJ2JvZHknJTJDJTIwJ3BlcmZvcm1lZF92aWFfZ2l0aHViX2FwcCclMkMlMjAnaXNfcHVsbF9yZXF1ZXN0JyU1RCUyQyUwQSUyMCUyMCUyMCUyMG51bV9yb3dzJTNBJTIwMjg1NSUwQSU3RCk=",highlighted:`Dataset({ | |
| features: [<span class="hljs-string">'url'</span>, <span class="hljs-string">'repository_url'</span>, <span class="hljs-string">'labels_url'</span>, <span class="hljs-string">'comments_url'</span>, <span class="hljs-string">'events_url'</span>, <span class="hljs-string">'html_url'</span>, <span class="hljs-string">'id'</span>, <span class="hljs-string">'node_id'</span>, <span class="hljs-string">'number'</span>, <span class="hljs-string">'title'</span>, <span class="hljs-string">'user'</span>, <span class="hljs-string">'labels'</span>, <span class="hljs-string">'state'</span>, <span class="hljs-string">'locked'</span>, <span class="hljs-string">'assignee'</span>, <span class="hljs-string">'assignees'</span>, <span class="hljs-string">'milestone'</span>, <span class="hljs-string">'comments'</span>, <span class="hljs-string">'created_at'</span>, <span class="hljs-string">'updated_at'</span>, <span class="hljs-string">'closed_at'</span>, <span class="hljs-string">'author_association'</span>, <span class="hljs-string">'active_lock_reason'</span>, <span class="hljs-string">'pull_request'</span>, <span class="hljs-string">'body'</span>, <span class="hljs-string">'performed_via_github_app'</span>, <span class="hljs-string">'is_pull_request'</span>], | |
| num_rows: <span class="hljs-number">2855</span> | |
| })`,wrap:!1}}),I=new ua({props:{$$slots:{default:[xt]},$$scope:{ctx:j}}}),na=new Ma({props:{title:"Criando um cartão do datasets",local:"criando-um-cartão-do-datasets",headingTag:"h2"}}),_=new ua({props:{$$slots:{default:[Zt]},$$scope:{ctx:j}}}),k=new ua({props:{$$slots:{default:[Gt]},$$scope:{ctx:j}}}),da=new jt({props:{source:"https://github.com/huggingface/course/blob/main/chapters/pt/chapter5/5.mdx"}}),{c(){o=i("meta"),T=t(),r=i("p"),U=t(),d(z.$$.fragment),ya=t(),d(V.$$.fragment),ha=t(),$=i("p"),$.innerHTML=il,Ta=t(),B=i("ul"),B.innerHTML=pl,Ua=t(),H=i("p"),H.textContent=cl,ja=t(),d(W.$$.fragment),ba=t(),F=i("p"),F.innerHTML=rl,ga=t(),g=i("div"),g.innerHTML=dl,fa=t(),Q=i("p"),Q.textContent=ul,wa=t(),f=i("div"),f.innerHTML=ml,xa=t(),Y=i("p"),Y.innerHTML=Ml,Za=t(),E=i("p"),E.innerHTML=Jl,Ga=t(),d(S.$$.fragment),Ra=t(),A=i("p"),A.innerHTML=yl,va=t(),d(q.$$.fragment),Ia=t(),L=i("p"),L.innerHTML=hl,Xa=t(),d(D.$$.fragment),Ca=t(),d(P.$$.fragment),Na=t(),O=i("p"),O.innerHTML=Tl,_a=t(),d(K.$$.fragment),ka=t(),d(ss.$$.fragment),za=t(),as=i("p"),as.innerHTML=Ul,Va=t(),d(w.$$.fragment),$a=t(),es=i("p"),es.innerHTML=jl,Ba=t(),d(ls.$$.fragment),Ha=t(),d(x.$$.fragment),Wa=t(),ts=i("p"),ts.textContent=bl,Fa=t(),d(ns.$$.fragment),Qa=t(),os=i("p"),os.innerHTML=gl,Ya=t(),d(is.$$.fragment),Ea=t(),ps=i("p"),ps.innerHTML=fl,Sa=t(),d(cs.$$.fragment),Aa=t(),d(rs.$$.fragment),qa=t(),ds=i("p"),ds.innerHTML=wl,La=t(),us=i("blockquote"),us.innerHTML=xl,Da=t(),ms=i("p"),ms.textContent=Zl,Pa=t(),d(Ms.$$.fragment),Oa=t(),Js=i("p"),Js.innerHTML=Gl,Ka=t(),d(ys.$$.fragment),se=t(),d(hs.$$.fragment),ae=t(),Ts=i("p"),Ts.innerHTML=Rl,ee=t(),d(Us.$$.fragment),le=t(),d(Z.$$.fragment),te=t(),js=i("p"),js.textContent=vl,ne=t(),bs=i("p"),bs.textContent=Il,oe=t(),d(gs.$$.fragment),ie=t(),fs=i("p"),fs.textContent=Xl,pe=t(),G=i("div"),G.innerHTML=Cl,ce=t(),ws=i("p"),ws.innerHTML=Nl,re=t(),d(xs.$$.fragment),de=t(),d(Zs.$$.fragment),ue=t(),Gs=i("p"),Gs.innerHTML=_l,me=t(),d(Rs.$$.fragment),Me=t(),d(vs.$$.
fragment),Je=t(),Is=i("p"),Is.innerHTML=kl,ye=t(),d(Xs.$$.fragment),he=t(),Cs=i("p"),Cs.textContent=zl,Te=t(),d(Ns.$$.fragment),Ue=t(),d(_s.$$.fragment),je=t(),d(ks.$$.fragment),be=t(),zs=i("p"),zs.innerHTML=Vl,ge=t(),d(Vs.$$.fragment),fe=t(),d($s.$$.fragment),we=t(),Bs=i("p"),Bs.innerHTML=$l,xe=t(),Hs=i("p"),Hs.innerHTML=Bl,Ze=t(),d(Ws.$$.fragment),Ge=t(),Fs=i("p"),Fs.innerHTML=Hl,Re=t(),d(Qs.$$.fragment),ve=t(),Ys=i("p"),Ys.innerHTML=Wl,Ie=t(),d(Es.$$.fragment),Xe=t(),d(Ss.$$.fragment),Ce=t(),As=i("p"),As.innerHTML=Fl,Ne=t(),d(R.$$.fragment),_e=t(),qs=i("p"),qs.innerHTML=Ql,ke=t(),d(Ls.$$.fragment),ze=t(),Ds=i("p"),Ds.innerHTML=Yl,Ve=t(),d(Ps.$$.fragment),$e=t(),Os=i("p"),Os.innerHTML=El,Be=t(),d(Ks.$$.fragment),He=t(),sa=i("p"),sa.innerHTML=Sl,We=t(),v=i("div"),v.innerHTML=Al,Fe=t(),aa=i("p"),aa.innerHTML=ql,Qe=t(),d(ea.$$.fragment),Ye=t(),d(la.$$.fragment),Ee=t(),ta=i("p"),ta.innerHTML=Ll,Se=t(),d(I.$$.fragment),Ae=t(),d(na.$$.fragment),qe=t(),oa=i("p"),oa.textContent=Dl,Le=t(),ia=i("p"),ia.innerHTML=Pl,De=t(),pa=i("ol"),pa.innerHTML=Ol,Pe=t(),X=i("div"),X.innerHTML=Kl,Oe=t(),C=i("ol"),C.innerHTML=st,Ke=t(),ca=i("p"),ca.innerHTML=at,sl=t(),N=i("div"),N.innerHTML=et,al=t(),d(_.$$.fragment),el=t(),ra=i("p"),ra.textContent=lt,ll=t(),d(k.$$.fragment),tl=t(),d(da.$$.fragment),nl=t(),Ja=i("p"),this.h()},l(s){const 
a=yt("svelte-u9bgzb",document.head);o=p(a,"META",{name:!0,content:!0}),a.forEach(e),T=n(s),r=p(s,"P",{}),dt(r).forEach(e),U=n(s),u(z.$$.fragment,s),ya=n(s),u(V.$$.fragment,s),ha=n(s),$=p(s,"P",{"data-svelte-h":!0}),c($)!=="svelte-qzjzzu"&&($.innerHTML=il),Ta=n(s),B=p(s,"UL",{"data-svelte-h":!0}),c(B)!=="svelte-13fgdbo"&&(B.innerHTML=pl),Ua=n(s),H=p(s,"P",{"data-svelte-h":!0}),c(H)!=="svelte-1t92jpo"&&(H.textContent=cl),ja=n(s),u(W.$$.fragment,s),ba=n(s),F=p(s,"P",{"data-svelte-h":!0}),c(F)!=="svelte-724jk"&&(F.innerHTML=rl),ga=n(s),g=p(s,"DIV",{class:!0,"data-svelte-h":!0}),c(g)!=="svelte-1htetkm"&&(g.innerHTML=dl),fa=n(s),Q=p(s,"P",{"data-svelte-h":!0}),c(Q)!=="svelte-1abvgj5"&&(Q.textContent=ul),wa=n(s),f=p(s,"DIV",{class:!0,"data-svelte-h":!0}),c(f)!=="svelte-1jsgvzc"&&(f.innerHTML=ml),xa=n(s),Y=p(s,"P",{"data-svelte-h":!0}),c(Y)!=="svelte-jyvc3q"&&(Y.innerHTML=Ml),Za=n(s),E=p(s,"P",{"data-svelte-h":!0}),c(E)!=="svelte-2cc0nx"&&(E.innerHTML=Jl),Ga=n(s),u(S.$$.fragment,s),Ra=n(s),A=p(s,"P",{"data-svelte-h":!0}),c(A)!=="svelte-nc35xk"&&(A.innerHTML=yl),va=n(s),u(q.$$.fragment,s),Ia=n(s),L=p(s,"P",{"data-svelte-h":!0}),c(L)!=="svelte-1ag02sh"&&(L.innerHTML=hl),Xa=n(s),u(D.$$.fragment,s),Ca=n(s),u(P.$$.fragment,s),Na=n(s),O=p(s,"P",{"data-svelte-h":!0}),c(O)!=="svelte-1t5kbkx"&&(O.innerHTML=Tl),_a=n(s),u(K.$$.fragment,s),ka=n(s),u(ss.$$.fragment,s),za=n(s),as=p(s,"P",{"data-svelte-h":!0}),c(as)!=="svelte-15zd9ok"&&(as.innerHTML=Ul),Va=n(s),u(w.$$.fragment,s),$a=n(s),es=p(s,"P",{"data-svelte-h":!0}),c(es)!=="svelte-nznw16"&&(es.innerHTML=jl),Ba=n(s),u(ls.$$.fragment,s),Ha=n(s),u(x.$$.fragment,s),Wa=n(s),ts=p(s,"P",{"data-svelte-h":!0}),c(ts)!=="svelte-1u5zgji"&&(ts.textContent=bl),Fa=n(s),u(ns.$$.fragment,s),Qa=n(s),os=p(s,"P",{"data-svelte-h":!0}),c(os)!=="svelte-1enlzi5"&&(os.innerHTML=gl),Ya=n(s),u(is.$$.fragment,s),Ea=n(s),ps=p(s,"P",{"data-svelte-h":!0}),c(ps)!=="svelte-16hcfk7"&&(ps.innerHTML=fl),Sa=n(s),u(cs.$$.fragment,s),Aa=n(s),u(rs.$$.fragment,s),qa=n(s),ds
=p(s,"P",{"data-svelte-h":!0}),c(ds)!=="svelte-97971k"&&(ds.innerHTML=wl),La=n(s),us=p(s,"BLOCKQUOTE",{"data-svelte-h":!0}),c(us)!=="svelte-127vg01"&&(us.innerHTML=xl),Da=n(s),ms=p(s,"P",{"data-svelte-h":!0}),c(ms)!=="svelte-1uym4u1"&&(ms.textContent=Zl),Pa=n(s),u(Ms.$$.fragment,s),Oa=n(s),Js=p(s,"P",{"data-svelte-h":!0}),c(Js)!=="svelte-r1iiw0"&&(Js.innerHTML=Gl),Ka=n(s),u(ys.$$.fragment,s),se=n(s),u(hs.$$.fragment,s),ae=n(s),Ts=p(s,"P",{"data-svelte-h":!0}),c(Ts)!=="svelte-z4trhs"&&(Ts.innerHTML=Rl),ee=n(s),u(Us.$$.fragment,s),le=n(s),u(Z.$$.fragment,s),te=n(s),js=p(s,"P",{"data-svelte-h":!0}),c(js)!=="svelte-58dtlq"&&(js.textContent=vl),ne=n(s),bs=p(s,"P",{"data-svelte-h":!0}),c(bs)!=="svelte-p477r1"&&(bs.textContent=Il),oe=n(s),u(gs.$$.fragment,s),ie=n(s),fs=p(s,"P",{"data-svelte-h":!0}),c(fs)!=="svelte-18m93nm"&&(fs.textContent=Xl),pe=n(s),G=p(s,"DIV",{class:!0,"data-svelte-h":!0}),c(G)!=="svelte-1fxxwaz"&&(G.innerHTML=Cl),ce=n(s),ws=p(s,"P",{"data-svelte-h":!0}),c(ws)!=="svelte-1aq93c6"&&(ws.innerHTML=Nl),re=n(s),u(xs.$$.fragment,s),de=n(s),u(Zs.$$.fragment,s),ue=n(s),Gs=p(s,"P",{"data-svelte-h":!0}),c(Gs)!=="svelte-1m47af7"&&(Gs.innerHTML=_l),me=n(s),u(Rs.$$.fragment,s),Me=n(s),u(vs.$$.fragment,s),Je=n(s),Is=p(s,"P",{"data-svelte-h":!0}),c(Is)!=="svelte-an9xq1"&&(Is.innerHTML=kl),ye=n(s),u(Xs.$$.fragment,s),he=n(s),Cs=p(s,"P",{"data-svelte-h":!0}),c(Cs)!=="svelte-inkiuv"&&(Cs.textContent=zl),Te=n(s),u(Ns.$$.fragment,s),Ue=n(s),u(_s.$$.fragment,s),je=n(s),u(ks.$$.fragment,s),be=n(s),zs=p(s,"P",{"data-svelte-h":!0}),c(zs)!=="svelte-1pq8ng9"&&(zs.innerHTML=Vl),ge=n(s),u(Vs.$$.fragment,s),fe=n(s),u($s.$$.fragment,s),we=n(s),Bs=p(s,"P",{"data-svelte-h":!0}),c(Bs)!=="svelte-elk9an"&&(Bs.innerHTML=$l),xe=n(s),Hs=p(s,"P",{"data-svelte-h":!0}),c(Hs)!=="svelte-mwq422"&&(Hs.innerHTML=Bl),Ze=n(s),u(Ws.$$.fragment,s),Ge=n(s),Fs=p(s,"P",{"data-svelte-h":!0}),c(Fs)!=="svelte-3ay613"&&(Fs.innerHTML=Hl),Re=n(s),u(Qs.$$.fragment,s),ve=n(s),Ys=p(s,"P",{"data-svelte-h":!0}),c(Ys
)!=="svelte-1sk1cve"&&(Ys.innerHTML=Wl),Ie=n(s),u(Es.$$.fragment,s),Xe=n(s),u(Ss.$$.fragment,s),Ce=n(s),As=p(s,"P",{"data-svelte-h":!0}),c(As)!=="svelte-1b7m61j"&&(As.innerHTML=Fl),Ne=n(s),u(R.$$.fragment,s),_e=n(s),qs=p(s,"P",{"data-svelte-h":!0}),c(qs)!=="svelte-ksirvg"&&(qs.innerHTML=Ql),ke=n(s),u(Ls.$$.fragment,s),ze=n(s),Ds=p(s,"P",{"data-svelte-h":!0}),c(Ds)!=="svelte-946zbw"&&(Ds.innerHTML=Yl),Ve=n(s),u(Ps.$$.fragment,s),$e=n(s),Os=p(s,"P",{"data-svelte-h":!0}),c(Os)!=="svelte-uq1g87"&&(Os.innerHTML=El),Be=n(s),u(Ks.$$.fragment,s),He=n(s),sa=p(s,"P",{"data-svelte-h":!0}),c(sa)!=="svelte-ov0i84"&&(sa.innerHTML=Sl),We=n(s),v=p(s,"DIV",{class:!0,"data-svelte-h":!0}),c(v)!=="svelte-18puw29"&&(v.innerHTML=Al),Fe=n(s),aa=p(s,"P",{"data-svelte-h":!0}),c(aa)!=="svelte-1v7sua7"&&(aa.innerHTML=ql),Qe=n(s),u(ea.$$.fragment,s),Ye=n(s),u(la.$$.fragment,s),Ee=n(s),ta=p(s,"P",{"data-svelte-h":!0}),c(ta)!=="svelte-zqtc7l"&&(ta.innerHTML=Ll),Se=n(s),u(I.$$.fragment,s),Ae=n(s),u(na.$$.fragment,s),qe=n(s),oa=p(s,"P",{"data-svelte-h":!0}),c(oa)!=="svelte-dylmg9"&&(oa.textContent=Dl),Le=n(s),ia=p(s,"P",{"data-svelte-h":!0}),c(ia)!=="svelte-17tg70u"&&(ia.innerHTML=Pl),De=n(s),pa=p(s,"OL",{"data-svelte-h":!0}),c(pa)!=="svelte-gkbv46"&&(pa.innerHTML=Ol),Pe=n(s),X=p(s,"DIV",{class:!0,"data-svelte-h":!0}),c(X)!=="svelte-1gqifn5"&&(X.innerHTML=Kl),Oe=n(s),C=p(s,"OL",{start:!0,"data-svelte-h":!0}),c(C)!=="svelte-1u3mfkz"&&(C.innerHTML=st),Ke=n(s),ca=p(s,"P",{"data-svelte-h":!0}),c(ca)!=="svelte-1tv90dr"&&(ca.innerHTML=at),sl=n(s),N=p(s,"DIV",{class:!0,"data-svelte-h":!0}),c(N)!=="svelte-ct1wn8"&&(N.innerHTML=et),al=n(s),u(_.$$.fragment,s),el=n(s),ra=p(s,"P",{"data-svelte-h":!0}),c(ra)!=="svelte-k6tkf8"&&(ra.textContent=lt),ll=n(s),u(k.$$.fragment,s),tl=n(s),u(da.$$.fragment,s),nl=n(s),Ja=p(s,"P",{}),dt(Ja).forEach(e),this.h()},h(){b(o,"name","hf:doc:metadata"),b(o,"content",vt),b(g,"class","flex justify-center"),b(f,"class","flex justify-center"),b(G,"class","flex 
justify-center"),b(v,"class","flex justify-center"),b(X,"class","flex justify-center"),b(C,"start","2"),b(N,"class","flex justify-center")},m(s,a){ht(document.head,o),l(s,T,a),l(s,r,a),l(s,U,a),m(z,s,a),l(s,ya,a),m(V,s,a),l(s,ha,a),l(s,$,a),l(s,Ta,a),l(s,B,a),l(s,Ua,a),l(s,H,a),l(s,ja,a),m(W,s,a),l(s,ba,a),l(s,F,a),l(s,ga,a),l(s,g,a),l(s,fa,a),l(s,Q,a),l(s,wa,a),l(s,f,a),l(s,xa,a),l(s,Y,a),l(s,Za,a),l(s,E,a),l(s,Ga,a),m(S,s,a),l(s,Ra,a),l(s,A,a),l(s,va,a),m(q,s,a),l(s,Ia,a),l(s,L,a),l(s,Xa,a),m(D,s,a),l(s,Ca,a),m(P,s,a),l(s,Na,a),l(s,O,a),l(s,_a,a),m(K,s,a),l(s,ka,a),m(ss,s,a),l(s,za,a),l(s,as,a),l(s,Va,a),m(w,s,a),l(s,$a,a),l(s,es,a),l(s,Ba,a),m(ls,s,a),l(s,Ha,a),m(x,s,a),l(s,Wa,a),l(s,ts,a),l(s,Fa,a),m(ns,s,a),l(s,Qa,a),l(s,os,a),l(s,Ya,a),m(is,s,a),l(s,Ea,a),l(s,ps,a),l(s,Sa,a),m(cs,s,a),l(s,Aa,a),m(rs,s,a),l(s,qa,a),l(s,ds,a),l(s,La,a),l(s,us,a),l(s,Da,a),l(s,ms,a),l(s,Pa,a),m(Ms,s,a),l(s,Oa,a),l(s,Js,a),l(s,Ka,a),m(ys,s,a),l(s,se,a),m(hs,s,a),l(s,ae,a),l(s,Ts,a),l(s,ee,a),m(Us,s,a),l(s,le,a),m(Z,s,a),l(s,te,a),l(s,js,a),l(s,ne,a),l(s,bs,a),l(s,oe,a),m(gs,s,a),l(s,ie,a),l(s,fs,a),l(s,pe,a),l(s,G,a),l(s,ce,a),l(s,ws,a),l(s,re,a),m(xs,s,a),l(s,de,a),m(Zs,s,a),l(s,ue,a),l(s,Gs,a),l(s,me,a),m(Rs,s,a),l(s,Me,a),m(vs,s,a),l(s,Je,a),l(s,Is,a),l(s,ye,a),m(Xs,s,a),l(s,he,a),l(s,Cs,a),l(s,Te,a),m(Ns,s,a),l(s,Ue,a),m(_s,s,a),l(s,je,a),m(ks,s,a),l(s,be,a),l(s,zs,a),l(s,ge,a),m(Vs,s,a),l(s,fe,a),m($s,s,a),l(s,we,a),l(s,Bs,a),l(s,xe,a),l(s,Hs,a),l(s,Ze,a),m(Ws,s,a),l(s,Ge,a),l(s,Fs,a),l(s,Re,a),m(Qs,s,a),l(s,ve,a),l(s,Ys,a),l(s,Ie,a),m(Es,s,a),l(s,Xe,a),m(Ss,s,a),l(s,Ce,a),l(s,As,a),l(s,Ne,a),m(R,s,a),l(s,_e,a),l(s,qs,a),l(s,ke,a),m(Ls,s,a),l(s,ze,a),l(s,Ds,a),l(s,Ve,a),m(Ps,s,a),l(s,$e,a),l(s,Os,a),l(s,Be,a),m(Ks,s,a),l(s,He,a),l(s,sa,a),l(s,We,a),l(s,v,a),l(s,Fe,a),l(s,aa,a),l(s,Qe,a),m(ea,s,a),l(s,Ye,a),m(la,s,a),l(s,Ee,a),l(s,ta,a),l(s,Se,a),m(I,s,a),l(s,Ae,a),m(na,s,a),l(s,qe,a),l(s,oa,a),l(s,Le,a),l(s,ia,a),l(s,De,a),l(s,pa,a),l(s,Pe,a),l(s,X,a),l(s,Oe,a),l(s,C,a),l(s,K
e,a),l(s,ca,a),l(s,sl,a),l(s,N,a),l(s,al,a),m(_,s,a),l(s,el,a),l(s,ra,a),l(s,ll,a),m(k,s,a),l(s,tl,a),m(da,s,a),l(s,nl,a),l(s,Ja,a),ol=!0},p(s,[a]){const tt={};a&2&&(tt.$$scope={dirty:a,ctx:s}),w.$set(tt);const nt={};a&2&&(nt.$$scope={dirty:a,ctx:s}),x.$set(nt);const ot={};a&2&&(ot.$$scope={dirty:a,ctx:s}),Z.$set(ot);const it={};a&2&&(it.$$scope={dirty:a,ctx:s}),R.$set(it);const pt={};a&2&&(pt.$$scope={dirty:a,ctx:s}),I.$set(pt);const ct={};a&2&&(ct.$$scope={dirty:a,ctx:s}),_.$set(ct);const rt={};a&2&&(rt.$$scope={dirty:a,ctx:s}),k.$set(rt)},i(s){ol||(M(z.$$.fragment,s),M(V.$$.fragment,s),M(W.$$.fragment,s),M(S.$$.fragment,s),M(q.$$.fragment,s),M(D.$$.fragment,s),M(P.$$.fragment,s),M(K.$$.fragment,s),M(ss.$$.fragment,s),M(w.$$.fragment,s),M(ls.$$.fragment,s),M(x.$$.fragment,s),M(ns.$$.fragment,s),M(is.$$.fragment,s),M(cs.$$.fragment,s),M(rs.$$.fragment,s),M(Ms.$$.fragment,s),M(ys.$$.fragment,s),M(hs.$$.fragment,s),M(Us.$$.fragment,s),M(Z.$$.fragment,s),M(gs.$$.fragment,s),M(xs.$$.fragment,s),M(Zs.$$.fragment,s),M(Rs.$$.fragment,s),M(vs.$$.fragment,s),M(Xs.$$.fragment,s),M(Ns.$$.fragment,s),M(_s.$$.fragment,s),M(ks.$$.fragment,s),M(Vs.$$.fragment,s),M($s.$$.fragment,s),M(Ws.$$.fragment,s),M(Qs.$$.fragment,s),M(Es.$$.fragment,s),M(Ss.$$.fragment,s),M(R.$$.fragment,s),M(Ls.$$.fragment,s),M(Ps.$$.fragment,s),M(Ks.$$.fragment,s),M(ea.$$.fragment,s),M(la.$$.fragment,s),M(I.$$.fragment,s),M(na.$$.fragment,s),M(_.$$.fragment,s),M(k.$$.fragment,s),M(da.$$.fragment,s),ol=!0)},o(s){J(z.$$.fragment,s),J(V.$$.fragment,s),J(W.$$.fragment,s),J(S.$$.fragment,s),J(q.$$.fragment,s),J(D.$$.fragment,s),J(P.$$.fragment,s),J(K.$$.fragment,s),J(ss.$$.fragment,s),J(w.$$.fragment,s),J(ls.$$.fragment,s),J(x.$$.fragment,s),J(ns.$$.fragment,s),J(is.$$.fragment,s),J(cs.$$.fragment,s),J(rs.$$.fragment,s),J(Ms.$$.fragment,s),J(ys.$$.fragment,s),J(hs.$$.fragment,s),J(Us.$$.fragment,s),J(Z.$$.fragment,s),J(gs.$$.fragment,s),J(xs.$$.fragment,s),J(Zs.$$.fragment,s),J(Rs.$$.fragment,s),J(vs.$$.fragmen
t,s),J(Xs.$$.fragment,s),J(Ns.$$.fragment,s),J(_s.$$.fragment,s),J(ks.$$.fragment,s),J(Vs.$$.fragment,s),J($s.$$.fragment,s),J(Ws.$$.fragment,s),J(Qs.$$.fragment,s),J(Es.$$.fragment,s),J(Ss.$$.fragment,s),J(R.$$.fragment,s),J(Ls.$$.fragment,s),J(Ps.$$.fragment,s),J(Ks.$$.fragment,s),J(ea.$$.fragment,s),J(la.$$.fragment,s),J(I.$$.fragment,s),J(na.$$.fragment,s),J(_.$$.fragment,s),J(k.$$.fragment,s),J(da.$$.fragment,s),ol=!1},d(s){s&&(e(T),e(r),e(U),e(ya),e(ha),e($),e(Ta),e(B),e(Ua),e(H),e(ja),e(ba),e(F),e(ga),e(g),e(fa),e(Q),e(wa),e(f),e(xa),e(Y),e(Za),e(E),e(Ga),e(Ra),e(A),e(va),e(Ia),e(L),e(Xa),e(Ca),e(Na),e(O),e(_a),e(ka),e(za),e(as),e(Va),e($a),e(es),e(Ba),e(Ha),e(Wa),e(ts),e(Fa),e(Qa),e(os),e(Ya),e(Ea),e(ps),e(Sa),e(Aa),e(qa),e(ds),e(La),e(us),e(Da),e(ms),e(Pa),e(Oa),e(Js),e(Ka),e(se),e(ae),e(Ts),e(ee),e(le),e(te),e(js),e(ne),e(bs),e(oe),e(ie),e(fs),e(pe),e(G),e(ce),e(ws),e(re),e(de),e(ue),e(Gs),e(me),e(Me),e(Je),e(Is),e(ye),e(he),e(Cs),e(Te),e(Ue),e(je),e(be),e(zs),e(ge),e(fe),e(we),e(Bs),e(xe),e(Hs),e(Ze),e(Ge),e(Fs),e(Re),e(ve),e(Ys),e(Ie),e(Xe),e(Ce),e(As),e(Ne),e(_e),e(qs),e(ke),e(ze),e(Ds),e(Ve),e($e),e(Os),e(Be),e(He),e(sa),e(We),e(v),e(Fe),e(aa),e(Qe),e(Ye),e(Ee),e(ta),e(Se),e(Ae),e(qe),e(oa),e(Le),e(ia),e(De),e(pa),e(Pe),e(X),e(Oe),e(C),e(Ke),e(ca),e(sl),e(N),e(al),e(el),e(ra),e(ll),e(tl),e(nl),e(Ja)),e(o),y(z,s),y(V,s),y(W,s),y(S,s),y(q,s),y(D,s),y(P,s),y(K,s),y(ss,s),y(w,s),y(ls,s),y(x,s),y(ns,s),y(is,s),y(cs,s),y(rs,s),y(Ms,s),y(ys,s),y(hs,s),y(Us,s),y(Z,s),y(gs,s),y(xs,s),y(Zs,s),y(Rs,s),y(vs,s),y(Xs,s),y(Ns,s),y(_s,s),y(ks,s),y(Vs,s),y($s,s),y(Ws,s),y(Qs,s),y(Es,s),y(Ss,s),y(R,s),y(Ls,s),y(Ps,s),y(Ks,s),y(ea,s),y(la,s),y(I,s),y(na,s),y(_,s),y(k,s),y(da,s)}}}const vt='{"title":"Criando seu próprio dataset","local":"criando-seu-próprio-dataset","sections":[{"title":"Obtendo os dados","local":"obtendo-os-dados","sections":[],"depth":2},{"title":"Limpando os dados","local":"limpando-os-dados","sections":[],"depth":2},{"title":"Aumentando o conjunto de 
dados","local":"aumentando-o-conjunto-de-dados","sections":[],"depth":2},{"title":"Carregando o conjunto de dados para o Hugging Face Hub","local":"carregando-o-conjunto-de-dados-para-o-hugging-face-hub","sections":[],"depth":2},{"title":"Criando um cartão do datasets","local":"criando-um-cartão-do-datasets","sections":[],"depth":2}],"depth":1}';function It(j){return mt(()=>{new URLSearchParams(window.location.search).get("fw")}),[]}class $t extends Mt{constructor(o){super(),Jt(this,o,It,Rt,ut,{})}}export{$t as component}; | |
Xet Storage Details
- Size:
- 85.8 kB
- Xet hash:
- 1f6f318ab3c2b63b7bc15d6689c38817f8553e9c353efab6e4c720f078a58641
·
Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.