Buckets:
| import{s as dn,n as cn,o as mn}from"../chunks/scheduler.d75c11ed.js";import{S as hn,i as un,e as p,s as l,c as r,h as yn,a as i,d as a,b as n,f as Oe,g as d,j as o,k as f,l as Mn,m as e,n as c,t as m,o as h,p as u}from"../chunks/index.4ec9dfe9.js";import{C as fn,H as M,E as gn}from"../chunks/MermaidChart.svelte_svelte_type_style_lang.7f9223a4.js";import{C as y}from"../chunks/CodeBlock.438b04e1.js";import{C as xt}from"../chunks/CodeBlockFw.6e472e07.js";function jn(sl){let g,vt,Zt,Yt,$,Xt,C,Wt,k,tl="Your data can be stored in various places; they can be on your local machine’s disk, in a Github repository, and in in-memory data structures like Python dictionaries and Pandas DataFrames. Wherever a dataset is stored, 🤗 Datasets can help you load it.",Nt,R,al="This guide will show you how to load a dataset from:",zt,I,el="<li>The Hugging Face Hub</li> <li>Local files</li> <li>In-memory data</li> <li>Offline</li> <li>A specific slice of a split</li>",Qt,G,ll='For more details specific to loading other dataset modalities, take a look at the <a class="underline decoration-pink-400 decoration-2 font-semibold" href="./audio_load">load audio dataset guide</a>, the <a class="underline decoration-yellow-400 decoration-2 font-semibold" href="./image_load">load image dataset guide</a>, the <a class="underline decoration-blue-400 decoration-2 font-semibold" href="./video_load">load video dataset guide</a>, or the <a class="underline decoration-green-400 decoration-2 font-semibold" href="./nlp_load">load text dataset guide</a>.',Vt,_t,Ht,_,Bt,q,nl='You can also load a dataset from any dataset repository on the Hub! Begin by <a href="share#create-the-repository">creating a dataset repository</a> and upload your data files. Now you can use the <a href="/docs/datasets/pr_7933/en/package_reference/loading_methods#datasets.load_dataset">load_dataset()</a> function to load the dataset.',Lt,Z,pl='For example, try loading the files from this <a href="https://huggingface.co/datasets/lhoestq/demo1" rel="nofollow">demo repository</a> by providing the repository namespace and dataset name. This dataset repository contains CSV files, and the code below loads the dataset from the CSV files:',St,F,Et,x,il="Some datasets may have more than one version based on Git tags, branches, or commits. Use the <code>revision</code> parameter to specify the dataset version you want to load:",Dt,v,At,j,ol='<p>Refer to the <a href="./upload_dataset">Upload a dataset to the Hub</a> tutorial for more details on how to create a dataset repository on the Hub, and how to upload your data files.</p>',Pt,Y,rl="A dataset loads by default all the data into the <code>train</code> split, or checks for mentions or split names in the data files names (e.g. “train”, “test” and “validation”). Use the <code>data_files</code> parameter to map data files to splits like <code>train</code>, <code>validation</code> and <code>test</code>:",Kt,X,Ot,J,dl='<p>If you don’t specify which data files to use, <a href="/docs/datasets/pr_7933/en/package_reference/loading_methods#datasets.load_dataset">load_dataset()</a> will return all the data files. This can take a long time if you load a large dataset like C4, which is approximately 13TB of data.</p>',sa,W,cl="You can also load a specific subset of the files with the <code>data_files</code> or <code>data_dir</code> parameter. These parameters can accept a relative path which resolves to the base path corresponding to where the dataset is loaded from.",ta,N,aa,z,ml="The <code>split</code> parameter can also map a data file to a specific split:",ea,Q,la,V,na,H,hl='Datasets can be loaded from local files stored on your computer and from remote files. The datasets are most likely stored as a <code>csv</code>, <code>json</code>, <code>txt</code> or <code>parquet</code> file. The <a href="/docs/datasets/pr_7933/en/package_reference/loading_methods#datasets.load_dataset">load_dataset()</a> function can load each of these file types.',pa,B,ia,L,ul="🤗 Datasets can read a dataset made up of one or several CSV files (in this case, pass your CSV files as a list):",oa,S,ra,T,yl='<p>For more details, check out the <a href="tabular_load#csv-files">how to load tabular datasets from CSV files</a> guide.</p>',da,E,ca,D,Ml='JSON files are loaded directly with <a href="/docs/datasets/pr_7933/en/package_reference/loading_methods#datasets.load_dataset">load_dataset()</a> as shown below:',ma,A,ha,P,fl="JSON files have diverse formats, but we think the most efficient format is to have multiple JSON objects; each line represents an individual row of data. For example:",ua,K,ya,O,gl="Another JSON format you may encounter is a nested field, in which case you’ll need to specify the <code>field</code> argument as shown in the following:",Ma,ss,fa,ts,jl="To load remote JSON files via HTTP, pass the URLs instead:",ga,as,ja,es,Jl="While these are the most common JSON formats, you’ll see other datasets that are formatted differently. 🤗 Datasets recognizes these other formats and will fallback accordingly on the Python JSON loading methods to handle them.",Ja,ls,Ta,ns,Tl="Parquet files are stored in a columnar format, unlike row-based files like a CSV. Large datasets may be stored in a Parquet file because it is more efficient and faster at returning your query.",wa,ps,wl="To load a Parquet file:",ba,is,Ua,os,bl="To load remote Parquet files via HTTP, pass the URLs instead:",$a,rs,Ca,ds,ka,cs,Ul="Arrow files are stored in an in-memory columnar format, unlike row-based formats like CSV and uncompressed formats like Parquet.",Ra,ms,$l="To load an Arrow file:",Ia,hs,Ga,us,Cl="To load remote Arrow files via HTTP, pass the URLs instead:",_a,ys,qa,Ms,kl='Arrow is the file format used by 🤗 Datasets under the hood, therefore you can load a local Arrow file using <a href="/docs/datasets/pr_7933/en/package_reference/main_classes#datasets.Dataset.from_file">Dataset.from_file()</a> directly:',Za,fs,Fa,gs,Rl=`Unlike <a href="/docs/datasets/pr_7933/en/package_reference/loading_methods#datasets.load_dataset">load_dataset()</a>, <a href="/docs/datasets/pr_7933/en/package_reference/main_classes#datasets.Dataset.from_file">Dataset.from_file()</a> memory maps the Arrow file without preparing the dataset in the cache, saving you disk space. | |
| The cache directory to store intermediate processing results will be the Arrow file directory in that case.`,xa,js,Il="For now only the Arrow streaming format is supported. The Arrow IPC file format (also known as Feather V2) is not supported.",va,Js,Ya,Ts,Gl='<a href="https://www.hdfgroup.org/solutions/hdf5/" rel="nofollow">HDF5</a> files are commonly used for storing large amounts of numerical data in scientific computing and machine learning. Loading HDF5 files with 🤗 Datasets is similar to loading CSV files:',Xa,ws,Wa,bs,_l="Note that the HDF5 loader assumes that the file has “tabular” structure, i.e. that all datasets in the file have (the same number of) rows on their first dimension.",Na,Us,za,$s,ql='Read database contents with <a href="/docs/datasets/pr_7933/en/package_reference/main_classes#datasets.Dataset.from_sql">from_sql()</a> by specifying the URI to connect to your database. You can read both table names and queries:',Qa,Cs,Va,w,Zl='<p>For more details, check out the <a href="tabular_load#databases">how to load tabular datasets from SQL databases</a> guide.</p>',Ha,ks,Ba,Rs,Fl=`The <a href="https://github.com/webdataset/webdataset" rel="nofollow">WebDataset</a> format is based on TAR archives and is suitable for big image datasets. | |
| Because of their size, WebDatasets are generally loaded in streaming mode (using <code>streaming=True</code>).`,La,Is,xl="You can load a WebDataset like this:",Sa,Gs,Ea,_s,vl="To load remote WebDatasets via HTTP, pass the URLs instead:",Da,qs,Aa,Zs,Pa,Fs,Yl="When a dataset is made of several files (that we call “shards”), it is possible to significantly speed up the dataset downloading and preparation step.",Ka,xs,Xl=`You can choose how many processes you’d like to use to prepare a dataset in parallel using <code>num_proc</code>. | |
| In this case, each process is given a subset of shards to prepare:`,Oa,vs,se,Ys,te,Xs,Wl='🤗 Datasets will also allow you to create a <a href="/docs/datasets/pr_7933/en/package_reference/main_classes#datasets.Dataset">Dataset</a> directly from in-memory data structures like Python dictionaries and Pandas DataFrames.',ae,Ws,ee,Ns,Nl='Load Python dictionaries with <a href="/docs/datasets/pr_7933/en/package_reference/main_classes#datasets.Dataset.from_dict">from_dict()</a>:',le,zs,ne,Qs,pe,Vs,zl="Load a list of Python dictionaries with <code>from_list()</code>:",ie,Hs,oe,Bs,re,Ls,Ql='Create a dataset from a Python generator with <a href="/docs/datasets/pr_7933/en/package_reference/main_classes#datasets.Dataset.from_generator">from_generator()</a>:',de,Ss,ce,Es,Vl="This approach supports loading data larger than available memory.",me,Ds,Hl="You can also define a sharded dataset by passing lists to <code>gen_kwargs</code>:",he,As,ue,Ps,ye,Ks,Bl='Load Pandas DataFrames with <a href="/docs/datasets/pr_7933/en/package_reference/main_classes#datasets.Dataset.from_pandas">from_pandas()</a>:',Me,Os,fe,b,Ll='<p>For more details, check out the <a href="tabular_load#pandas-dataframes">how to load tabular datasets from Pandas DataFrames</a> guide.</p>',ge,st,je,tt,Sl="Even if you don’t have an internet connection, it is still possible to load a dataset. As long as you’ve downloaded a dataset from the Hub repository before, it should be cached. This means you can reload the dataset from the cache and use it offline.",Je,at,El="If you know you won’t have internet access, you can run 🤗 Datasets in full offline mode. This saves time because instead of waiting for the Dataset builder download to time out, 🤗 Datasets will look directly in the cache. Set the environment variable <code>HF_HUB_OFFLINE</code> to <code>1</code> to enable full offline mode.",Te,et,we,lt,Dl='You can also choose only to load specific slices of a split. There are two options for slicing a split: using strings or the <a href="/docs/datasets/pr_7933/en/package_reference/builder_classes#datasets.ReadInstruction">ReadInstruction</a> API. Strings are more compact and readable for simple cases, while <a href="/docs/datasets/pr_7933/en/package_reference/builder_classes#datasets.ReadInstruction">ReadInstruction</a> is easier to use with variable slicing parameters.',be,nt,Al="Concatenate a <code>train</code> and <code>test</code> split by:",Ue,pt,$e,it,Pl="Select specific rows of the <code>train</code> split:",Ce,ot,ke,rt,Kl="Or select a percentage of a split with:",Re,dt,Ie,ct,Ol="Select a combination of percentages from each split:",Ge,mt,_e,ht,sn="Finally, you can even create cross-validated splits. The example below creates 10-fold cross-validated splits. Each validation dataset is a 10% chunk, and the training dataset makes up the remaining complementary 90% chunk:",qe,ut,Ze,yt,Fe,Mt,tn="The default behavior is to round the boundaries to the nearest integer for datasets where the requested slice boundaries do not divide evenly by 100. As shown below, some slices may contain more examples than others. For instance, if the following train split includes 999 records, then:",xe,ft,ve,gt,an="If you want equal sized splits, use <code>pct1_dropremainder</code> rounding instead. This treats the specified percentage boundaries as multiples of 1%.",Ye,jt,Xe,U,en="<p><code>pct1_dropremainder</code> rounding may truncate the last examples in a dataset if the number of examples in your dataset don’t divide evenly by 100.</p>",We,qt,Ne,Jt,ze,Tt,ln="Sometimes, you may get unexpected results when you load a dataset. Two of the most common issues you may encounter are manually downloading a dataset and specifying features of a dataset.",Qe,wt,Ve,bt,nn='When you create a dataset from local files, the <a href="/docs/datasets/pr_7933/en/package_reference/main_classes#datasets.Features">Features</a> are automatically inferred by <a href="https://arrow.apache.org/docs/" rel="nofollow">Apache Arrow</a>. However, the dataset’s features may not always align with your expectations, or you may want to define the features yourself. The following example shows how you can add custom labels with the <a href="/docs/datasets/pr_7933/en/package_reference/main_classes#datasets.ClassLabel">ClassLabel</a> feature.',He,Ut,pn='Start by defining your own labels with the <a href="/docs/datasets/pr_7933/en/package_reference/main_classes#datasets.Features">Features</a> class:',Be,$t,Le,Ct,on='Next, specify the <code>features</code> parameter in <a href="/docs/datasets/pr_7933/en/package_reference/loading_methods#datasets.load_dataset">load_dataset()</a> with the features you just created:',Se,kt,Ee,Rt,rn="Now when you look at your dataset features, you can see it uses the custom labels you defined:",De,It,Ae,Gt,Pe,Ft,Ke;return $=new fn({props:{containerStyle:"float: right; margin-left: 10px; display: inline-flex; position: relative; z-index: 10;"}}),C=new M({props:{title:"Load",local:"load",headingTag:"h1"}}),_=new M({props:{title:"Hugging Face Hub",local:"hugging-face-hub",headingTag:"h2"}}),F=new y({props:{code:"ZnJvbSUyMGRhdGFzZXRzJTIwaW1wb3J0JTIwbG9hZF9kYXRhc2V0JTBBZGF0YXNldCUyMCUzRCUyMGxvYWRfZGF0YXNldCglMjJsaG9lc3RxJTJGZGVtbzElMjIp",highlighted:`<span class="hljs-meta">>>> </span><span class="hljs-keyword">from</span> datasets <span class="hljs-keyword">import</span> load_dataset | |
| <span class="hljs-meta">>>> </span>dataset = load_dataset(<span class="hljs-string">"lhoestq/demo1"</span>)`,wrap:!1}}),v=new y({props:{code:"ZGF0YXNldCUyMCUzRCUyMGxvYWRfZGF0YXNldCglMEElMjAlMjAlMjJsaG9lc3RxJTJGY3VzdG9tX3NxdWFkJTIyJTJDJTBBJTIwJTIwcmV2aXNpb24lM0QlMjJtYWluJTIyJTIwJTIwJTIzJTIwdGFnJTIwbmFtZSUyQyUyMG9yJTIwYnJhbmNoJTIwbmFtZSUyQyUyMG9yJTIwY29tbWl0JTIwaGFzaCUwQSk=",highlighted:`<span class="hljs-meta">>>> </span>dataset = load_dataset( | |
| <span class="hljs-meta">... </span> <span class="hljs-string">"lhoestq/custom_squad"</span>, | |
| <span class="hljs-meta">... </span> revision=<span class="hljs-string">"main"</span> <span class="hljs-comment"># tag name, or branch name, or commit hash</span> | |
| <span class="hljs-meta">... </span>)`,wrap:!1}}),X=new y({props:{code:"ZGF0YV9maWxlcyUyMCUzRCUyMCU3QiUyMnRyYWluJTIyJTNBJTIwJTIydHJhaW4uY3N2JTIyJTJDJTIwJTIydGVzdCUyMiUzQSUyMCUyMnRlc3QuY3N2JTIyJTdEJTBBZGF0YXNldCUyMCUzRCUyMGxvYWRfZGF0YXNldCglMjJuYW1lc3BhY2UlMkZ5b3VyX2RhdGFzZXRfbmFtZSUyMiUyQyUyMGRhdGFfZmlsZXMlM0RkYXRhX2ZpbGVzKQ==",highlighted:`<span class="hljs-meta">>>> </span>data_files = {<span class="hljs-string">"train"</span>: <span class="hljs-string">"train.csv"</span>, <span class="hljs-string">"test"</span>: <span class="hljs-string">"test.csv"</span>} | |
| <span class="hljs-meta">>>> </span>dataset = load_dataset(<span class="hljs-string">"namespace/your_dataset_name"</span>, data_files=data_files)`,wrap:!1}}),N=new y({props:{code:"ZnJvbSUyMGRhdGFzZXRzJTIwaW1wb3J0JTIwbG9hZF9kYXRhc2V0JTBBJTBBYzRfc3Vic2V0JTIwJTNEJTIwbG9hZF9kYXRhc2V0KCUyMmFsbGVuYWklMkZjNCUyMiUyQyUyMGRhdGFfZmlsZXMlM0QlMjJlbiUyRmM0LXRyYWluLjAwMDAqLW9mLTAxMDI0Lmpzb24uZ3olMjIpJTBBJTBBYzRfc3Vic2V0JTIwJTNEJTIwbG9hZF9kYXRhc2V0KCUyMmFsbGVuYWklMkZjNCUyMiUyQyUyMGRhdGFfZGlyJTNEJTIyZW4lMjIp",highlighted:`<span class="hljs-meta">>>> </span><span class="hljs-keyword">from</span> datasets <span class="hljs-keyword">import</span> load_dataset | |
| <span class="hljs-comment"># load files that match the grep pattern</span> | |
| <span class="hljs-meta">>>> </span>c4_subset = load_dataset(<span class="hljs-string">"allenai/c4"</span>, data_files=<span class="hljs-string">"en/c4-train.0000*-of-01024.json.gz"</span>) | |
| <span class="hljs-comment"># load dataset from the en directory on the Hub</span> | |
| <span class="hljs-meta">>>> </span>c4_subset = load_dataset(<span class="hljs-string">"allenai/c4"</span>, data_dir=<span class="hljs-string">"en"</span>)`,wrap:!1}}),Q=new y({props:{code:"ZGF0YV9maWxlcyUyMCUzRCUyMCU3QiUyMnZhbGlkYXRpb24lMjIlM0ElMjAlMjJlbiUyRmM0LXZhbGlkYXRpb24uKi5qc29uLmd6JTIyJTdEJTBBYzRfdmFsaWRhdGlvbiUyMCUzRCUyMGxvYWRfZGF0YXNldCglMjJhbGxlbmFpJTJGYzQlMjIlMkMlMjBkYXRhX2ZpbGVzJTNEZGF0YV9maWxlcyUyQyUyMHNwbGl0JTNEJTIydmFsaWRhdGlvbiUyMik=",highlighted:`<span class="hljs-meta">>>> </span>data_files = {<span class="hljs-string">"validation"</span>: <span class="hljs-string">"en/c4-validation.*.json.gz"</span>} | |
| <span class="hljs-meta">>>> </span>c4_validation = load_dataset(<span class="hljs-string">"allenai/c4"</span>, data_files=data_files, split=<span class="hljs-string">"validation"</span>)`,wrap:!1}}),V=new M({props:{title:"Local and remote files",local:"local-and-remote-files",headingTag:"h2"}}),B=new M({props:{title:"CSV",local:"csv",headingTag:"h3"}}),S=new y({props:{code:"ZnJvbSUyMGRhdGFzZXRzJTIwaW1wb3J0JTIwbG9hZF9kYXRhc2V0JTBBZGF0YXNldCUyMCUzRCUyMGxvYWRfZGF0YXNldCglMjJjc3YlMjIlMkMlMjBkYXRhX2ZpbGVzJTNEJTIybXlfZmlsZS5jc3YlMjIp",highlighted:`<span class="hljs-meta">>>> </span><span class="hljs-keyword">from</span> datasets <span class="hljs-keyword">import</span> load_dataset | |
| <span class="hljs-meta">>>> </span>dataset = load_dataset(<span class="hljs-string">"csv"</span>, data_files=<span class="hljs-string">"my_file.csv"</span>)`,wrap:!1}}),E=new M({props:{title:"JSON",local:"json",headingTag:"h3"}}),A=new y({props:{code:"ZnJvbSUyMGRhdGFzZXRzJTIwaW1wb3J0JTIwbG9hZF9kYXRhc2V0JTBBZGF0YXNldCUyMCUzRCUyMGxvYWRfZGF0YXNldCglMjJqc29uJTIyJTJDJTIwZGF0YV9maWxlcyUzRCUyMm15X2ZpbGUuanNvbiUyMik=",highlighted:`<span class="hljs-meta">>>> </span><span class="hljs-keyword">from</span> datasets <span class="hljs-keyword">import</span> load_dataset | |
| <span class="hljs-meta">>>> </span>dataset = load_dataset(<span class="hljs-string">"json"</span>, data_files=<span class="hljs-string">"my_file.json"</span>)`,wrap:!1}}),K=new y({props:{code:"JTdCJTIyYSUyMiUzQSUyMDElMkMlMjAlMjJiJTIyJTNBJTIwMi4wJTJDJTIwJTIyYyUyMiUzQSUyMCUyMmZvbyUyMiUyQyUyMCUyMmQlMjIlM0ElMjBmYWxzZSU3RCUwQSU3QiUyMmElMjIlM0ElMjA0JTJDJTIwJTIyYiUyMiUzQSUyMC01LjUlMkMlMjAlMjJjJTIyJTNBJTIwbnVsbCUyQyUyMCUyMmQlMjIlM0ElMjB0cnVlJTdE",highlighted:`<span class="hljs-punctuation">{</span><span class="hljs-attr">"a"</span><span class="hljs-punctuation">:</span> <span class="hljs-number">1</span><span class="hljs-punctuation">,</span> <span class="hljs-attr">"b"</span><span class="hljs-punctuation">:</span> <span class="hljs-number">2.0</span><span class="hljs-punctuation">,</span> <span class="hljs-attr">"c"</span><span class="hljs-punctuation">:</span> <span class="hljs-string">"foo"</span><span class="hljs-punctuation">,</span> <span class="hljs-attr">"d"</span><span class="hljs-punctuation">:</span> <span class="hljs-literal"><span class="hljs-keyword">false</span></span><span class="hljs-punctuation">}</span> | |
| <span class="hljs-punctuation">{</span><span class="hljs-attr">"a"</span><span class="hljs-punctuation">:</span> <span class="hljs-number">4</span><span class="hljs-punctuation">,</span> <span class="hljs-attr">"b"</span><span class="hljs-punctuation">:</span> <span class="hljs-number">-5.5</span><span class="hljs-punctuation">,</span> <span class="hljs-attr">"c"</span><span class="hljs-punctuation">:</span> <span class="hljs-literal"><span class="hljs-keyword">null</span></span><span class="hljs-punctuation">,</span> <span class="hljs-attr">"d"</span><span class="hljs-punctuation">:</span> <span class="hljs-literal"><span class="hljs-keyword">true</span></span><span class="hljs-punctuation">}</span>`,wrap:!1}}),ss=new y({props:{code:"JTBBZnJvbSUyMGRhdGFzZXRzJTIwaW1wb3J0JTIwbG9hZF9kYXRhc2V0JTBBZGF0YXNldCUyMCUzRCUyMGxvYWRfZGF0YXNldCglMjJqc29uJTIyJTJDJTIwZGF0YV9maWxlcyUzRCUyMm15X2ZpbGUuanNvbiUyMiUyQyUyMGZpZWxkJTNEJTIyZGF0YSUyMik=",highlighted:`{<span class="hljs-string">"version"</span>: <span class="hljs-string">"0.1.0"</span>, | |
| <span class="hljs-string">"data"</span>: [{<span class="hljs-string">"a"</span>: <span class="hljs-number">1</span>, <span class="hljs-string">"b"</span>: <span class="hljs-number">2.0</span>, <span class="hljs-string">"c"</span>: <span class="hljs-string">"foo"</span>, <span class="hljs-string">"d"</span>: false}, | |
| {<span class="hljs-string">"a"</span>: <span class="hljs-number">4</span>, <span class="hljs-string">"b"</span>: -<span class="hljs-number">5.5</span>, <span class="hljs-string">"c"</span>: null, <span class="hljs-string">"d"</span>: true}] | |
| } | |
| <span class="hljs-meta">>>> </span><span class="hljs-keyword">from</span> datasets <span class="hljs-keyword">import</span> load_dataset | |
| <span class="hljs-meta">>>> </span>dataset = load_dataset(<span class="hljs-string">"json"</span>, data_files=<span class="hljs-string">"my_file.json"</span>, field=<span class="hljs-string">"data"</span>)`,wrap:!1}}),as=new y({props:{code:"YmFzZV91cmwlMjAlM0QlMjAlMjJodHRwcyUzQSUyRiUyRnJhanB1cmthci5naXRodWIuaW8lMkZTUXVBRC1leHBsb3JlciUyRmRhdGFzZXQlMkYlMjIlMEFkYXRhc2V0JTIwJTNEJTIwbG9hZF9kYXRhc2V0KCUyMmpzb24lMjIlMkMlMjBkYXRhX2ZpbGVzJTNEJTdCJTIydHJhaW4lMjIlM0ElMjBiYXNlX3VybCUyMCUyQiUyMCUyMnRyYWluLXYxLjEuanNvbiUyMiUyQyUyMCUyMnZhbGlkYXRpb24lMjIlM0ElMjBiYXNlX3VybCUyMCUyQiUyMCUyMmRldi12MS4xLmpzb24lMjIlN0QlMkMlMjBmaWVsZCUzRCUyMmRhdGElMjIp",highlighted:`<span class="hljs-meta">>>> </span>base_url = <span class="hljs-string">"https://rajpurkar.github.io/SQuAD-explorer/dataset/"</span> | |
| <span class="hljs-meta">>>> </span>dataset = load_dataset(<span class="hljs-string">"json"</span>, data_files={<span class="hljs-string">"train"</span>: base_url + <span class="hljs-string">"train-v1.1.json"</span>, <span class="hljs-string">"validation"</span>: base_url + <span class="hljs-string">"dev-v1.1.json"</span>}, field=<span class="hljs-string">"data"</span>)`,wrap:!1}}),ls=new M({props:{title:"Parquet",local:"parquet",headingTag:"h3"}}),is=new y({props:{code:"ZnJvbSUyMGRhdGFzZXRzJTIwaW1wb3J0JTIwbG9hZF9kYXRhc2V0JTBBZGF0YXNldCUyMCUzRCUyMGxvYWRfZGF0YXNldCglMjJwYXJxdWV0JTIyJTJDJTIwZGF0YV9maWxlcyUzRCU3Qid0cmFpbiclM0ElMjAndHJhaW4ucGFycXVldCclMkMlMjAndGVzdCclM0ElMjAndGVzdC5wYXJxdWV0JyU3RCk=",highlighted:`<span class="hljs-meta">>>> </span><span class="hljs-keyword">from</span> datasets <span class="hljs-keyword">import</span> load_dataset | |
| <span class="hljs-meta">>>> </span>dataset = load_dataset(<span class="hljs-string">"parquet"</span>, data_files={<span class="hljs-string">'train'</span>: <span class="hljs-string">'train.parquet'</span>, <span class="hljs-string">'test'</span>: <span class="hljs-string">'test.parquet'</span>})`,wrap:!1}}),rs=new y({props:{code:"YmFzZV91cmwlMjAlM0QlMjAlMjJodHRwcyUzQSUyRiUyRmh1Z2dpbmdmYWNlLmNvJTJGZGF0YXNldHMlMkZ3aWtpbWVkaWElMkZ3aWtpcGVkaWElMkZyZXNvbHZlJTJGbWFpbiUyRjIwMjMxMTAxLmFiJTJGJTIyJTBBZGF0YV9maWxlcyUyMCUzRCUyMCU3QiUyMnRyYWluJTIyJTNBJTIwYmFzZV91cmwlMjAlMkIlMjAlMjJ0cmFpbi0wMDAwMC1vZi0wMDAwMS5wYXJxdWV0JTIyJTdEJTBBd2lraSUyMCUzRCUyMGxvYWRfZGF0YXNldCglMjJwYXJxdWV0JTIyJTJDJTIwZGF0YV9maWxlcyUzRGRhdGFfZmlsZXMlMkMlMjBzcGxpdCUzRCUyMnRyYWluJTIyKQ==",highlighted:`<span class="hljs-meta">>>> </span>base_url = <span class="hljs-string">"https://huggingface.co/datasets/wikimedia/wikipedia/resolve/main/20231101.ab/"</span> | |
| <span class="hljs-meta">>>> </span>data_files = {<span class="hljs-string">"train"</span>: base_url + <span class="hljs-string">"train-00000-of-00001.parquet"</span>} | |
| <span class="hljs-meta">>>> </span>wiki = load_dataset(<span class="hljs-string">"parquet"</span>, data_files=data_files, split=<span class="hljs-string">"train"</span>)`,wrap:!1}}),ds=new M({props:{title:"Arrow",local:"arrow",headingTag:"h3"}}),hs=new y({props:{code:"ZnJvbSUyMGRhdGFzZXRzJTIwaW1wb3J0JTIwbG9hZF9kYXRhc2V0JTBBZGF0YXNldCUyMCUzRCUyMGxvYWRfZGF0YXNldCglMjJhcnJvdyUyMiUyQyUyMGRhdGFfZmlsZXMlM0QlN0IndHJhaW4nJTNBJTIwJ3RyYWluLmFycm93JyUyQyUyMCd0ZXN0JyUzQSUyMCd0ZXN0LmFycm93JyU3RCk=",highlighted:`<span class="hljs-meta">>>> </span><span class="hljs-keyword">from</span> datasets <span class="hljs-keyword">import</span> load_dataset | |
| <span class="hljs-meta">>>> </span>dataset = load_dataset(<span class="hljs-string">"arrow"</span>, data_files={<span class="hljs-string">'train'</span>: <span class="hljs-string">'train.arrow'</span>, <span class="hljs-string">'test'</span>: <span class="hljs-string">'test.arrow'</span>})`,wrap:!1}}),ys=new y({props:{code:"YmFzZV91cmwlMjAlM0QlMjAlMjJodHRwcyUzQSUyRiUyRmh1Z2dpbmdmYWNlLmNvJTJGZGF0YXNldHMlMkZjcm9pc3NhbnRsbG0lMkZjcm9pc3NhbnRfZGF0YXNldCUyRnJlc29sdmUlMkZtYWluJTJGZW5nbGlzaF82NjBCXzExJTJGJTIyJTBBZGF0YV9maWxlcyUyMCUzRCUyMCU3QiUyMnRyYWluJTIyJTNBJTIwYmFzZV91cmwlMjAlMkIlMjAlMjJ0cmFpbiUyRmRhdGEtMDAwMDAtb2YtMDAwODAuYXJyb3clMjIlN0QlMEF3aWtpJTIwJTNEJTIwbG9hZF9kYXRhc2V0KCUyMmFycm93JTIyJTJDJTIwZGF0YV9maWxlcyUzRGRhdGFfZmlsZXMlMkMlMjBzcGxpdCUzRCUyMnRyYWluJTIyKQ==",highlighted:`<span class="hljs-meta">>>> </span>base_url = <span class="hljs-string">"https://huggingface.co/datasets/croissantllm/croissant_dataset/resolve/main/english_660B_11/"</span> | |
| <span class="hljs-meta">>>> </span>data_files = {<span class="hljs-string">"train"</span>: base_url + <span class="hljs-string">"train/data-00000-of-00080.arrow"</span>} | |
| <span class="hljs-meta">>>> </span>wiki = load_dataset(<span class="hljs-string">"arrow"</span>, data_files=data_files, split=<span class="hljs-string">"train"</span>)`,wrap:!1}}),fs=new y({props:{code:"ZnJvbSUyMGRhdGFzZXRzJTIwaW1wb3J0JTIwRGF0YXNldCUwQWRhdGFzZXQlMjAlM0QlMjBEYXRhc2V0LmZyb21fZmlsZSglMjJkYXRhLmFycm93JTIyKQ==",highlighted:`<span class="hljs-meta">>>> </span><span class="hljs-keyword">from</span> datasets <span class="hljs-keyword">import</span> Dataset | |
| <span class="hljs-meta">>>> </span>dataset = Dataset.from_file(<span class="hljs-string">"data.arrow"</span>)`,wrap:!1}}),Js=new M({props:{title:"HDF5 files",local:"hdf5-files",headingTag:"h2"}}),ws=new y({props:{code:"ZnJvbSUyMGRhdGFzZXRzJTIwaW1wb3J0JTIwbG9hZF9kYXRhc2V0JTBBZGF0YXNldCUyMCUzRCUyMGxvYWRfZGF0YXNldCglMjJoZGY1JTIyJTJDJTIwZGF0YV9maWxlcyUzRCUyMmRhdGEuaDUlMjIp",highlighted:`<span class="hljs-meta">>>> </span><span class="hljs-keyword">from</span> datasets <span class="hljs-keyword">import</span> load_dataset | |
| <span class="hljs-meta">>>> </span>dataset = load_dataset(<span class="hljs-string">"hdf5"</span>, data_files=<span class="hljs-string">"data.h5"</span>)`,wrap:!1}}),Us=new M({props:{title:"SQL",local:"sql",headingTag:"h3"}}),Cs=new y({props:{code:"ZnJvbSUyMGRhdGFzZXRzJTIwaW1wb3J0JTIwRGF0YXNldCUwQWRhdGFzZXQlMjAlM0QlMjBEYXRhc2V0LmZyb21fc3FsKCUyMmRhdGFfdGFibGVfbmFtZSUyMiUyQyUyMGNvbiUzRCUyMnNxbGl0ZSUzQSUyRiUyRiUyRnNxbGl0ZV9maWxlLmRiJTIyKSUwQWRhdGFzZXQlMjAlM0QlMjBEYXRhc2V0LmZyb21fc3FsKCUyMlNFTEVDVCUyMHRleHQlMjBGUk9NJTIwdGFibGUlMjBXSEVSRSUyMGxlbmd0aCh0ZXh0KSUyMCUzRSUyMDEwMCUyMExJTUlUJTIwMTAlMjIlMkMlMjBjb24lM0QlMjJzcWxpdGUlM0ElMkYlMkYlMkZzcWxpdGVfZmlsZS5kYiUyMik=",highlighted:`<span class="hljs-meta">>>> </span><span class="hljs-keyword">from</span> datasets <span class="hljs-keyword">import</span> Dataset | |
| <span class="hljs-comment"># load entire table</span> | |
| <span class="hljs-meta">>>> </span>dataset = Dataset.from_sql(<span class="hljs-string">"data_table_name"</span>, con=<span class="hljs-string">"sqlite:///sqlite_file.db"</span>) | |
| <span class="hljs-comment"># load from query</span> | |
| <span class="hljs-meta">>>> </span>dataset = Dataset.from_sql(<span class="hljs-string">"SELECT text FROM table WHERE length(text) > 100 LIMIT 10"</span>, con=<span class="hljs-string">"sqlite:///sqlite_file.db"</span>)`,wrap:!1}}),ks=new M({props:{title:"WebDataset",local:"webdataset",headingTag:"h3"}}),Gs=new y({props:{code:"ZnJvbSUyMGRhdGFzZXRzJTIwaW1wb3J0JTIwbG9hZF9kYXRhc2V0JTBBcGF0aCUyMCUzRCUyMCUyMnBhdGglMkZ0byUyRnRyYWluJTJGKi50YXIlMjIlMEFkYXRhc2V0JTIwJTNEJTIwbG9hZF9kYXRhc2V0KCUyMndlYmRhdGFzZXQlMjIlMkMlMjBkYXRhX2ZpbGVzJTNEJTdCJTIydHJhaW4lMjIlM0ElMjBwYXRoJTdEJTJDJTIwc3BsaXQlM0QlMjJ0cmFpbiUyMiUyQyUyMHN0cmVhbWluZyUzRFRydWUp",highlighted:`<span class="hljs-meta">>>> </span><span class="hljs-keyword">from</span> datasets <span class="hljs-keyword">import</span> load_dataset | |
| >>> | |
| <span class="hljs-meta">>>> </span>path = <span class="hljs-string">"path/to/train/*.tar"</span> | |
| <span class="hljs-meta">>>> </span>dataset = load_dataset(<span class="hljs-string">"webdataset"</span>, data_files={<span class="hljs-string">"train"</span>: path}, split=<span class="hljs-string">"train"</span>, streaming=<span class="hljs-literal">True</span>)`,wrap:!1}}),qs=new y({props:{code:"ZnJvbSUyMGRhdGFzZXRzJTIwaW1wb3J0JTIwbG9hZF9kYXRhc2V0JTBBYmFzZV91cmwlMjAlM0QlMjAlMjJodHRwcyUzQSUyRiUyRmh1Z2dpbmdmYWNlLmNvJTJGZGF0YXNldHMlMkZsaG9lc3RxJTJGc21hbGwtcHVibGF5bmV0LXdkcyUyRnJlc29sdmUlMkZtYWluJTJGcHVibGF5bmV0LXRyYWluLSU3QmklM0EwNmQlN0QudGFyJTIyJTBBdXJscyUyMCUzRCUyMCU1QmJhc2VfdXJsLmZvcm1hdChpJTNEaSklMjBmb3IlMjBpJTIwaW4lMjByYW5nZSg0KSU1RCUwQWRhdGFzZXQlMjAlM0QlMjBsb2FkX2RhdGFzZXQoJTIyd2ViZGF0YXNldCUyMiUyQyUyMGRhdGFfZmlsZXMlM0QlN0IlMjJ0cmFpbiUyMiUzQSUyMHVybHMlN0QlMkMlMjBzcGxpdCUzRCUyMnRyYWluJTIyJTJDJTIwc3RyZWFtaW5nJTNEVHJ1ZSk=",highlighted:`<span class="hljs-meta">>>> </span><span class="hljs-keyword">from</span> datasets <span class="hljs-keyword">import</span> load_dataset | |
| >>> | |
| <span class="hljs-meta">>>> </span>base_url = <span class="hljs-string">"https://huggingface.co/datasets/lhoestq/small-publaynet-wds/resolve/main/publaynet-train-{i:06d}.tar"</span> | |
| <span class="hljs-meta">>>> </span>urls = [base_url.<span class="hljs-built_in">format</span>(i=i) <span class="hljs-keyword">for</span> i <span class="hljs-keyword">in</span> <span class="hljs-built_in">range</span>(<span class="hljs-number">4</span>)] | |
| <span class="hljs-meta">>>> </span>dataset = load_dataset(<span class="hljs-string">"webdataset"</span>, data_files={<span class="hljs-string">"train"</span>: urls}, split=<span class="hljs-string">"train"</span>, streaming=<span class="hljs-literal">True</span>)`,wrap:!1}}),Zs=new M({props:{title:"Multiprocessing",local:"multiprocessing",headingTag:"h2"}}),vs=new y({props:{code:"ZnJvbSUyMGRhdGFzZXRzJTIwaW1wb3J0JTIwbG9hZF9kYXRhc2V0JTBBJTBBaW1hZ2VuZXQlMjAlM0QlMjBsb2FkX2RhdGFzZXQoJTIydGltbSUyRmltYWdlbmV0LTFrLXdkcyUyMiUyQyUyMG51bV9wcm9jJTNEOCklMEFtbF9saWJyaXNwZWVjaF9zcGFuaXNoJTIwJTNEJTIwbG9hZF9kYXRhc2V0KCUyMmZhY2Vib29rJTJGbXVsdGlsaW5ndWFsX2xpYnJpc3BlZWNoJTIyJTJDJTIwJTIyc3BhbmlzaCUyMiUyQyUyMG51bV9wcm9jJTNEOCk=",highlighted:`<span class="hljs-keyword">from</span> datasets <span class="hljs-keyword">import</span> load_dataset | |
| imagenet = load_dataset(<span class="hljs-string">"timm/imagenet-1k-wds"</span>, num_proc=<span class="hljs-number">8</span>) | |
| ml_librispeech_spanish = load_dataset(<span class="hljs-string">"facebook/multilingual_librispeech"</span>, <span class="hljs-string">"spanish"</span>, num_proc=<span class="hljs-number">8</span>)`,wrap:!1}}),Ys=new M({props:{title:"In-memory data",local:"in-memory-data",headingTag:"h2"}}),Ws=new M({props:{title:"Python dictionary",local:"python-dictionary",headingTag:"h3"}}),zs=new y({props:{code:"ZnJvbSUyMGRhdGFzZXRzJTIwaW1wb3J0JTIwRGF0YXNldCUwQW15X2RpY3QlMjAlM0QlMjAlN0IlMjJhJTIyJTNBJTIwJTVCMSUyQyUyMDIlMkMlMjAzJTVEJTdEJTBBZGF0YXNldCUyMCUzRCUyMERhdGFzZXQuZnJvbV9kaWN0KG15X2RpY3Qp",highlighted:`<span class="hljs-meta">>>> </span><span class="hljs-keyword">from</span> datasets <span class="hljs-keyword">import</span> Dataset | |
| <span class="hljs-meta">>>> </span>my_dict = {<span class="hljs-string">"a"</span>: [<span class="hljs-number">1</span>, <span class="hljs-number">2</span>, <span class="hljs-number">3</span>]} | |
| <span class="hljs-meta">>>> </span>dataset = Dataset.from_dict(my_dict)`,wrap:!1}}),Qs=new M({props:{title:"Python list of dictionaries",local:"python-list-of-dictionaries",headingTag:"h3"}}),Hs=new y({props:{code:"ZnJvbSUyMGRhdGFzZXRzJTIwaW1wb3J0JTIwRGF0YXNldCUwQW15X2xpc3QlMjAlM0QlMjAlNUIlN0IlMjJhJTIyJTNBJTIwMSU3RCUyQyUyMCU3QiUyMmElMjIlM0ElMjAyJTdEJTJDJTIwJTdCJTIyYSUyMiUzQSUyMDMlN0QlNUQlMEFkYXRhc2V0JTIwJTNEJTIwRGF0YXNldC5mcm9tX2xpc3QobXlfbGlzdCk=",highlighted:`<span class="hljs-meta">>>> </span><span class="hljs-keyword">from</span> datasets <span class="hljs-keyword">import</span> Dataset | |
| <span class="hljs-meta">>>> </span>my_list = [{<span class="hljs-string">"a"</span>: <span class="hljs-number">1</span>}, {<span class="hljs-string">"a"</span>: <span class="hljs-number">2</span>}, {<span class="hljs-string">"a"</span>: <span class="hljs-number">3</span>}] | |
| <span class="hljs-meta">>>> </span>dataset = Dataset.from_list(my_list)`,wrap:!1}}),Bs=new M({props:{title:"Python generator",local:"python-generator",headingTag:"h3"}}),Ss=new y({props:{code:"ZnJvbSUyMGRhdGFzZXRzJTIwaW1wb3J0JTIwRGF0YXNldCUwQWRlZiUyMG15X2dlbigpJTNBJTBBJTIwJTIwJTIwJTIwZm9yJTIwaSUyMGluJTIwcmFuZ2UoMSUyQyUyMDQpJTNBJTBBJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIweWllbGQlMjAlN0IlMjJhJTIyJTNBJTIwaSU3RCUwQWRhdGFzZXQlMjAlM0QlMjBEYXRhc2V0LmZyb21fZ2VuZXJhdG9yKG15X2dlbik=",highlighted:`<span class="hljs-meta">>>> </span><span class="hljs-keyword">from</span> datasets <span class="hljs-keyword">import</span> Dataset | |
| <span class="hljs-meta">>>> </span><span class="hljs-keyword">def</span> <span class="hljs-title function_">my_gen</span>(): | |
| <span class="hljs-meta">... </span> <span class="hljs-keyword">for</span> i <span class="hljs-keyword">in</span> <span class="hljs-built_in">range</span>(<span class="hljs-number">1</span>, <span class="hljs-number">4</span>): | |
| <span class="hljs-meta">... </span> <span class="hljs-keyword">yield</span> {<span class="hljs-string">"a"</span>: i} | |
| ... | |
| <span class="hljs-meta">>>> </span>dataset = Dataset.from_generator(my_gen)`,wrap:!1}}),As=new y({props:{code:"ZGVmJTIwZ2VuKHNoYXJkcyklM0ElMEElMjAlMjAlMjAlMjBmb3IlMjBzaGFyZCUyMGluJTIwc2hhcmRzJTNBJTBBJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwd2l0aCUyMG9wZW4oc2hhcmQpJTIwYXMlMjBmJTNBJTBBJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwJTIwZm9yJTIwbGluZSUyMGluJTIwZiUzQSUwQSUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMCUyMHlpZWxkJTIwJTdCJTIybGluZSUyMiUzQSUyMGxpbmUlN0QlMEFzaGFyZHMlMjAlM0QlMjAlNUJmJTIyZGF0YSU3QmklN0QudHh0JTIyJTIwZm9yJTIwaSUyMGluJTIwcmFuZ2UoMzIpJTVEJTBBZHMlMjAlM0QlMjBJdGVyYWJsZURhdGFzZXQuZnJvbV9nZW5lcmF0b3IoZ2VuJTJDJTIwZ2VuX2t3YXJncyUzRCU3QiUyMnNoYXJkcyUyMiUzQSUyMHNoYXJkcyU3RCklMEFkcyUyMCUzRCUyMGRzLnNodWZmbGUoc2VlZCUzRDQyJTJDJTIwYnVmZmVyX3NpemUlM0QxMF8wMDApJTIwJTIwJTIzJTIwc2h1ZmZsZXMlMjB0aGUlMjBzaGFyZHMlMjBvcmRlciUyMCUyQiUyMHVzZXMlMjBhJTIwc2h1ZmZsZSUyMGJ1ZmZlciUwQWZyb20lMjB0b3JjaC51dGlscy5kYXRhJTIwaW1wb3J0JTIwRGF0YUxvYWRlciUwQWRhdGFsb2FkZXIlMjAlM0QlMjBEYXRhTG9hZGVyKGRzLndpdGhfZm9ybWF0KCUyMnRvcmNoJTIyKSUyQyUyMG51bV93b3JrZXJzJTNENCklMjAlMjAlMjMlMjBnaXZlJTIwZWFjaCUyMHdvcmtlciUyMGElMjBzdWJzZXQlMjBvZiUyMDMyJTJGNCUzRDglMjBzaGFyZHM=",highlighted:`<span class="hljs-meta">>>> </span><span class="hljs-keyword">def</span> <span class="hljs-title function_">gen</span>(<span class="hljs-params">shards</span>): | |
| <span class="hljs-meta">... </span> <span class="hljs-keyword">for</span> shard <span class="hljs-keyword">in</span> shards: | |
| <span class="hljs-meta">... </span> <span class="hljs-keyword">with</span> <span class="hljs-built_in">open</span>(shard) <span class="hljs-keyword">as</span> f: | |
| <span class="hljs-meta">... </span> <span class="hljs-keyword">for</span> line <span class="hljs-keyword">in</span> f: | |
| <span class="hljs-meta">... </span> <span class="hljs-keyword">yield</span> {<span class="hljs-string">"line"</span>: line} | |
| ... | |
| <span class="hljs-meta">>>> </span>shards = [<span class="hljs-string">f"data<span class="hljs-subst">{i}</span>.txt"</span> <span class="hljs-keyword">for</span> i <span class="hljs-keyword">in</span> <span class="hljs-built_in">range</span>(<span class="hljs-number">32</span>)] | |
| <span class="hljs-meta">>>> </span>ds = IterableDataset.from_generator(gen, gen_kwargs={<span class="hljs-string">"shards"</span>: shards}) | |
| <span class="hljs-meta">>>> </span>ds = ds.shuffle(seed=<span class="hljs-number">42</span>, buffer_size=<span class="hljs-number">10_000</span>) <span class="hljs-comment"># shuffles the shards order + uses a shuffle buffer</span> | |
| <span class="hljs-meta">>>> </span><span class="hljs-keyword">from</span> torch.utils.data <span class="hljs-keyword">import</span> DataLoader | |
| <span class="hljs-meta">>>> </span>dataloader = DataLoader(ds.with_format(<span class="hljs-string">"torch"</span>), num_workers=<span class="hljs-number">4</span>) <span class="hljs-comment"># give each worker a subset of 32/4=8 shards</span>`,wrap:!1}}),Ps=new M({props:{title:"Pandas DataFrame",local:"pandas-dataframe",headingTag:"h3"}}),Os=new y({props:{code:"ZnJvbSUyMGRhdGFzZXRzJTIwaW1wb3J0JTIwRGF0YXNldCUwQWltcG9ydCUyMHBhbmRhcyUyMGFzJTIwcGQlMEFkZiUyMCUzRCUyMHBkLkRhdGFGcmFtZSglN0IlMjJhJTIyJTNBJTIwJTVCMSUyQyUyMDIlMkMlMjAzJTVEJTdEKSUwQWRhdGFzZXQlMjAlM0QlMjBEYXRhc2V0LmZyb21fcGFuZGFzKGRmKQ==",highlighted:`<span class="hljs-meta">>>> </span><span class="hljs-keyword">from</span> datasets <span class="hljs-keyword">import</span> Dataset | |
| <span class="hljs-meta">>>> </span><span class="hljs-keyword">import</span> pandas <span class="hljs-keyword">as</span> pd | |
| <span class="hljs-meta">>>> </span>df = pd.DataFrame({<span class="hljs-string">"a"</span>: [<span class="hljs-number">1</span>, <span class="hljs-number">2</span>, <span class="hljs-number">3</span>]}) | |
| <span class="hljs-meta">>>> </span>dataset = Dataset.from_pandas(df)`,wrap:!1}}),st=new M({props:{title:"Offline",local:"offline",headingTag:"h2"}}),et=new M({props:{title:"Slice splits",local:"slice-splits",headingTag:"h2"}}),pt=new xt({props:{group1:{id:"stringapi",code:"dHJhaW5fdGVzdF9kcyUyMCUzRCUyMGRhdGFzZXRzLmxvYWRfZGF0YXNldCglMjJhamliYXdhLTIwMjMlMkZHZW5lcmFsLVN0b3JpZXMtQ29sbGVjdGlvbiUyMiUyQyUyMHNwbGl0JTNEJTIydHJhaW4lMkJ0ZXN0JTIyKQ==",highlighted:'<span class="hljs-meta">>>> </span>train_test_ds = datasets.load_dataset(<span class="hljs-string">"ajibawa-2023/General-Stories-Collection"</span>, split=<span class="hljs-string">"train+test"</span>)'},group2:{id:"readinstruction",code:"cmklMjAlM0QlMjBkYXRhc2V0cy5SZWFkSW5zdHJ1Y3Rpb24oJTIydHJhaW4lMjIpJTIwJTJCJTIwZGF0YXNldHMuUmVhZEluc3RydWN0aW9uKCUyMnRlc3QlMjIpJTBBdHJhaW5fdGVzdF9kcyUyMCUzRCUyMGRhdGFzZXRzLmxvYWRfZGF0YXNldCglMjJhamliYXdhLTIwMjMlMkZHZW5lcmFsLVN0b3JpZXMtQ29sbGVjdGlvbiUyMiUyQyUyMHNwbGl0JTNEcmkp",highlighted:`<span class="hljs-meta">>>> </span>ri = datasets.ReadInstruction(<span class="hljs-string">"train"</span>) + datasets.ReadInstruction(<span class="hljs-string">"test"</span>) | |
| <span class="hljs-meta">>>> </span>train_test_ds = datasets.load_dataset(<span class="hljs-string">"ajibawa-2023/General-Stories-Collection"</span>, split=ri)`},wrap:!1}}),ot=new xt({props:{group1:{id:"stringapi",code:"dHJhaW5fMTBfMjBfZHMlMjAlM0QlMjBkYXRhc2V0cy5sb2FkX2RhdGFzZXQoJTIyYWppYmF3YS0yMDIzJTJGR2VuZXJhbC1TdG9yaWVzLUNvbGxlY3Rpb24lMjIlMkMlMjBzcGxpdCUzRCUyMnRyYWluJTVCMTAlM0EyMCU1RCUyMik=",highlighted:'<span class="hljs-meta">>>> </span>train_10_20_ds = datasets.load_dataset(<span class="hljs-string">"ajibawa-2023/General-Stories-Collection"</span>, split=<span class="hljs-string">"train[10:20]"</span>)'},group2:{id:"readinstruction",code:"dHJhaW5fMTBfMjBfZHMlMjAlM0QlMjBkYXRhc2V0cy5sb2FkX2RhdGFzZXQoJTIycm9qYWd0YXAlMkZib29rY29ycHVzJTIyJTJDJTIwc3BsaXQlM0RkYXRhc2V0cy5SZWFkSW5zdHJ1Y3Rpb24oJTIydHJhaW4lMjIlMkMlMjBmcm9tXyUzRDEwJTJDJTIwdG8lM0QyMCUyQyUyMHVuaXQlM0QlMjJhYnMlMjIpKQ==",highlighted:'<span class="hljs-meta">>>> </span>train_10_20_ds = datasets.load_dataset(<span class="hljs-string">"rojagtap/bookcorpus"</span>, split=datasets.ReadInstruction(<span class="hljs-string">"train"</span>, from_=<span class="hljs-number">10</span>, to=<span class="hljs-number">20</span>, unit=<span class="hljs-string">"abs"</span>))'},wrap:!1}}),dt=new xt({props:{group1:{id:"stringapi",code:"dHJhaW5fMTBwY3RfZHMlMjAlM0QlMjBkYXRhc2V0cy5sb2FkX2RhdGFzZXQoJTIyYWppYmF3YS0yMDIzJTJGR2VuZXJhbC1TdG9yaWVzLUNvbGxlY3Rpb24lMjIlMkMlMjBzcGxpdCUzRCUyMnRyYWluJTVCJTNBMTAlMjUlNUQlMjIp",highlighted:'<span class="hljs-meta">>>> </span>train_10pct_ds = datasets.load_dataset(<span class="hljs-string">"ajibawa-2023/General-Stories-Collection"</span>, split=<span class="hljs-string">"train[:10%]"</span>)'},group2:{id:"readinstruction",code:"dHJhaW5fMTBfMjBfZHMlMjAlM0QlMjBkYXRhc2V0cy5sb2FkX2RhdGFzZXQoJTIyYWppYmF3YS0yMDIzJTJGR2VuZXJhbC1TdG9yaWVzLUNvbGxlY3Rpb24lMjIlMkMlMjBzcGxpdCUzRGRhdGFzZXRzLlJlYWRJbnN0cnVjdGlvbiglMjJ0cmFpbiUyMiUyQyUyMHRvJTNEMTAlMkMlMjB1bml0JTNEJTIyJTI1JTIyKSk=",highlighted:'<span class="hljs-meta">>>> </span>train_10_20_ds = datasets.load_dataset(<span class="hljs-string">"ajibawa-2023/General-Stories-Collection"</span>, split=datasets.ReadInstruction(<span class="hljs-string">"train"</span>, to=<span class="hljs-number">10</span>, unit=<span class="hljs-string">"%"</span>))'},wrap:!1}}),mt=new xt({props:{group1:{id:"stringapi",code:"dHJhaW5fMTBfODBwY3RfZHMlMjAlM0QlMjBkYXRhc2V0cy5sb2FkX2RhdGFzZXQoJTIyYWppYmF3YS0yMDIzJTJGR2VuZXJhbC1TdG9yaWVzLUNvbGxlY3Rpb24lMjIlMkMlMjBzcGxpdCUzRCUyMnRyYWluJTVCJTNBMTAlMjUlNUQlMkJ0cmFpbiU1Qi04MCUyNSUzQSU1RCUyMik=",highlighted:'<span class="hljs-meta">>>> </span>train_10_80pct_ds = datasets.load_dataset(<span class="hljs-string">"ajibawa-2023/General-Stories-Collection"</span>, split=<span class="hljs-string">"train[:10%]+train[-80%:]"</span>)'},group2:{id:"readinstruction",code:"cmklMjAlM0QlMjAoZGF0YXNldHMuUmVhZEluc3RydWN0aW9uKCUyMnRyYWluJTIyJTJDJTIwdG8lM0QxMCUyQyUyMHVuaXQlM0QlMjIlMjUlMjIpJTIwJTJCJTIwZGF0YXNldHMuUmVhZEluc3RydWN0aW9uKCUyMnRyYWluJTIyJTJDJTIwZnJvbV8lM0QtODAlMkMlMjB1bml0JTNEJTIyJTI1JTIyKSklMEF0cmFpbl8xMF84MHBjdF9kcyUyMCUzRCUyMGRhdGFzZXRzLmxvYWRfZGF0YXNldCglMjJhamliYXdhLTIwMjMlMkZHZW5lcmFsLVN0b3JpZXMtQ29sbGVjdGlvbiUyMiUyQyUyMHNwbGl0JTNEcmkp",highlighted:`<span class="hljs-meta">>>> </span>ri = (datasets.ReadInstruction(<span class="hljs-string">"train"</span>, to=<span class="hljs-number">10</span>, unit=<span class="hljs-string">"%"</span>) + datasets.ReadInstruction(<span class="hljs-string">"train"</span>, from_=-<span class="hljs-number">80</span>, unit=<span class="hljs-string">"%"</span>)) | |
| <span class="hljs-meta">>>> </span>train_10_80pct_ds = datasets.load_dataset(<span class="hljs-string">"ajibawa-2023/General-Stories-Collection"</span>, split=ri)`},wrap:!1}}),ut=new xt({props:{group1:{id:"stringapi",code:"dmFsX2RzJTIwJTNEJTIwZGF0YXNldHMubG9hZF9kYXRhc2V0KCUyMmFqaWJhd2EtMjAyMyUyRkdlbmVyYWwtU3Rvcmllcy1Db2xsZWN0aW9uJTIyJTJDJTIwc3BsaXQlM0QlNUJmJTIydHJhaW4lNUIlN0JrJTdEJTI1JTNBJTdCayUyQjEwJTdEJTI1JTVEJTIyJTIwZm9yJTIwayUyMGluJTIwcmFuZ2UoMCUyQyUyMDEwMCUyQyUyMDEwKSU1RCklMEF0cmFpbl9kcyUyMCUzRCUyMGRhdGFzZXRzLmxvYWRfZGF0YXNldCglMjJhamliYXdhLTIwMjMlMkZHZW5lcmFsLVN0b3JpZXMtQ29sbGVjdGlvbiUyMiUyQyUyMHNwbGl0JTNEJTVCZiUyMnRyYWluJTVCJTNBJTdCayU3RCUyNSU1RCUyQnRyYWluJTVCJTdCayUyQjEwJTdEJTI1JTNBJTVEJTIyJTIwZm9yJTIwayUyMGluJTIwcmFuZ2UoMCUyQyUyMDEwMCUyQyUyMDEwKSU1RCk=",highlighted:`<span class="hljs-meta">>>> </span>val_ds = datasets.load_dataset(<span class="hljs-string">"ajibawa-2023/General-Stories-Collection"</span>, split=[<span class="hljs-string">f"train[<span class="hljs-subst">{k}</span>%:<span class="hljs-subst">{k+<span class="hljs-number">10</span>}</span>%]"</span> <span class="hljs-keyword">for</span> k <span class="hljs-keyword">in</span> <span class="hljs-built_in">range</span>(<span class="hljs-number">0</span>, <span class="hljs-number">100</span>, <span class="hljs-number">10</span>)]) | |
| <span class="hljs-meta">>>> </span>train_ds = datasets.load_dataset(<span class="hljs-string">"ajibawa-2023/General-Stories-Collection"</span>, split=[<span class="hljs-string">f"train[:<span class="hljs-subst">{k}</span>%]+train[<span class="hljs-subst">{k+<span class="hljs-number">10</span>}</span>%:]"</span> <span class="hljs-keyword">for</span> k <span class="hljs-keyword">in</span> <span class="hljs-built_in">range</span>(<span class="hljs-number">0</span>, <span class="hljs-number">100</span>, <span class="hljs-number">10</span>)])`},group2:{id:"readinstruction",code:"dmFsX2RzJTIwJTNEJTIwZGF0YXNldHMubG9hZF9kYXRhc2V0KCUyMmFqaWJhd2EtMjAyMyUyRkdlbmVyYWwtU3Rvcmllcy1Db2xsZWN0aW9uJTIyJTJDJTIwJTVCZGF0YXNldHMuUmVhZEluc3RydWN0aW9uKCUyMnRyYWluJTIyJTJDJTIwZnJvbV8lM0RrJTJDJTIwdG8lM0RrJTJCMTAlMkMlMjB1bml0JTNEJTIyJTI1JTIyKSUyMGZvciUyMGslMjBpbiUyMHJhbmdlKDAlMkMlMjAxMDAlMkMlMjAxMCklNUQpJTBBdHJhaW5fZHMlMjAlM0QlMjBkYXRhc2V0cy5sb2FkX2RhdGFzZXQoJTIyYWppYmF3YS0yMDIzJTJGR2VuZXJhbC1TdG9yaWVzLUNvbGxlY3Rpb24lMjIlMkMlMjAlNUIoZGF0YXNldHMuUmVhZEluc3RydWN0aW9uKCUyMnRyYWluJTIyJTJDJTIwdG8lM0RrJTJDJTIwdW5pdCUzRCUyMiUyNSUyMiklMjAlMkIlMjBkYXRhc2V0cy5SZWFkSW5zdHJ1Y3Rpb24oJTIydHJhaW4lMjIlMkMlMjBmcm9tXyUzRGslMkIxMCUyQyUyMHVuaXQlM0QlMjIlMjUlMjIpKSUyMGZvciUyMGslMjBpbiUyMHJhbmdlKDAlMkMlMjAxMDAlMkMlMjAxMCklNUQp",highlighted:`<span class="hljs-meta">>>> </span>val_ds = datasets.load_dataset(<span class="hljs-string">"ajibawa-2023/General-Stories-Collection"</span>, [datasets.ReadInstruction(<span class="hljs-string">"train"</span>, from_=k, to=k+<span class="hljs-number">10</span>, unit=<span class="hljs-string">"%"</span>) <span class="hljs-keyword">for</span> k <span class="hljs-keyword">in</span> <span class="hljs-built_in">range</span>(<span class="hljs-number">0</span>, <span class="hljs-number">100</span>, <span class="hljs-number">10</span>)]) | |
| <span class="hljs-meta">>>> </span>train_ds = datasets.load_dataset(<span class="hljs-string">"ajibawa-2023/General-Stories-Collection"</span>, [(datasets.ReadInstruction(<span class="hljs-string">"train"</span>, to=k, unit=<span class="hljs-string">"%"</span>) + datasets.ReadInstruction(<span class="hljs-string">"train"</span>, from_=k+<span class="hljs-number">10</span>, unit=<span class="hljs-string">"%"</span>)) <span class="hljs-keyword">for</span> k <span class="hljs-keyword">in</span> <span class="hljs-built_in">range</span>(<span class="hljs-number">0</span>, <span class="hljs-number">100</span>, <span class="hljs-number">10</span>)])`},wrap:!1}}),yt=new M({props:{title:"Percent slicing and rounding",local:"percent-slicing-and-rounding",headingTag:"h3"}}),ft=new y({props:{code:"dHJhaW5fNTBfNTJfZHMlMjAlM0QlMjBkYXRhc2V0cy5sb2FkX2RhdGFzZXQoJTIyYWppYmF3YS0yMDIzJTJGR2VuZXJhbC1TdG9yaWVzLUNvbGxlY3Rpb24lMjIlMkMlMjBzcGxpdCUzRCUyMnRyYWluJTVCNTAlMjUlM0E1MiUyNSU1RCUyMiklMEF0cmFpbl81Ml81NF9kcyUyMCUzRCUyMGRhdGFzZXRzLmxvYWRfZGF0YXNldCglMjJhamliYXdhLTIwMjMlMkZHZW5lcmFsLVN0b3JpZXMtQ29sbGVjdGlvbiUyMiUyQyUyMHNwbGl0JTNEJTIydHJhaW4lNUI1MiUyNSUzQTU0JTI1JTVEJTIyKQ==",highlighted:`<span class="hljs-comment"># 19 records, from 500 (included) to 519 (excluded).</span> | |
| <span class="hljs-meta">>>> </span>train_50_52_ds = datasets.load_dataset(<span class="hljs-string">"ajibawa-2023/General-Stories-Collection"</span>, split=<span class="hljs-string">"train[50%:52%]"</span>) | |
| <span class="hljs-comment"># 20 records, from 519 (included) to 539 (excluded).</span> | |
| <span class="hljs-meta">>>> </span>train_52_54_ds = datasets.load_dataset(<span class="hljs-string">"ajibawa-2023/General-Stories-Collection"</span>, split=<span class="hljs-string">"train[52%:54%]"</span>)`,wrap:!1}}),jt=new y({props:{code:"dHJhaW5fNTBfNTJwY3QxX2RzJTIwJTNEJTIwZGF0YXNldHMubG9hZF9kYXRhc2V0KCUyMmFqaWJhd2EtMjAyMyUyRkdlbmVyYWwtU3Rvcmllcy1Db2xsZWN0aW9uJTIyJTJDJTIwc3BsaXQlM0RkYXRhc2V0cy5SZWFkSW5zdHJ1Y3Rpb24oJTIydHJhaW4lMjIlMkMlMjBmcm9tXyUzRDUwJTJDJTIwdG8lM0Q1MiUyQyUyMHVuaXQlM0QlMjIlMjUlMjIlMkMlMjByb3VuZGluZyUzRCUyMnBjdDFfZHJvcHJlbWFpbmRlciUyMikpJTBBdHJhaW5fNTJfNTRwY3QxX2RzJTIwJTNEJTIwZGF0YXNldHMubG9hZF9kYXRhc2V0KCUyMmFqaWJhd2EtMjAyMyUyRkdlbmVyYWwtU3Rvcmllcy1Db2xsZWN0aW9uJTIyJTJDJTIwc3BsaXQlM0RkYXRhc2V0cy5SZWFkSW5zdHJ1Y3Rpb24oJTIydHJhaW4lMjIlMkNmcm9tXyUzRDUyJTJDJTIwdG8lM0Q1NCUyQyUyMHVuaXQlM0QlMjIlMjUlMjIlMkMlMjByb3VuZGluZyUzRCUyMnBjdDFfZHJvcHJlbWFpbmRlciUyMikpJTBBdHJhaW5fNTBfNTJwY3QxX2RzJTIwJTNEJTIwZGF0YXNldHMubG9hZF9kYXRhc2V0KCUyMmFqaWJhd2EtMjAyMyUyRkdlbmVyYWwtU3Rvcmllcy1Db2xsZWN0aW9uJTIyJTJDJTIwc3BsaXQlM0QlMjJ0cmFpbiU1QjUwJTI1JTNBNTIlMjUlNUQocGN0MV9kcm9wcmVtYWluZGVyKSUyMiklMEF0cmFpbl81Ml81NHBjdDFfZHMlMjAlM0QlMjBkYXRhc2V0cy5sb2FkX2RhdGFzZXQoJTIyYWppYmF3YS0yMDIzJTJGR2VuZXJhbC1TdG9yaWVzLUNvbGxlY3Rpb24lMjIlMkMlMjBzcGxpdCUzRCUyMnRyYWluJTVCNTIlMjUlM0E1NCUyNSU1RChwY3QxX2Ryb3ByZW1haW5kZXIpJTIyKQ==",highlighted:`<span class="hljs-comment"># 18 records, from 450 (included) to 468 (excluded).</span> | |
| <span class="hljs-meta">>>> </span>train_50_52pct1_ds = datasets.load_dataset(<span class="hljs-string">"ajibawa-2023/General-Stories-Collection"</span>, split=datasets.ReadInstruction(<span class="hljs-string">"train"</span>, from_=<span class="hljs-number">50</span>, to=<span class="hljs-number">52</span>, unit=<span class="hljs-string">"%"</span>, rounding=<span class="hljs-string">"pct1_dropremainder"</span>)) | |
| <span class="hljs-comment"># 18 records, from 468 (included) to 486 (excluded).</span> | |
| <span class="hljs-meta">>>> </span>train_52_54pct1_ds = datasets.load_dataset(<span class="hljs-string">"ajibawa-2023/General-Stories-Collection"</span>, split=datasets.ReadInstruction(<span class="hljs-string">"train"</span>,from_=<span class="hljs-number">52</span>, to=<span class="hljs-number">54</span>, unit=<span class="hljs-string">"%"</span>, rounding=<span class="hljs-string">"pct1_dropremainder"</span>)) | |
| <span class="hljs-comment"># Or equivalently:</span> | |
| <span class="hljs-meta">>>> </span>train_50_52pct1_ds = datasets.load_dataset(<span class="hljs-string">"ajibawa-2023/General-Stories-Collection"</span>, split=<span class="hljs-string">"train[50%:52%](pct1_dropremainder)"</span>) | |
| <span class="hljs-meta">>>> </span>train_52_54pct1_ds = datasets.load_dataset(<span class="hljs-string">"ajibawa-2023/General-Stories-Collection"</span>, split=<span class="hljs-string">"train[52%:54%](pct1_dropremainder)"</span>)`,wrap:!1}}),Jt=new M({props:{title:"Troubleshooting",local:"troubleshooting",headingTag:"h2"}}),wt=new M({props:{title:"Specify features",local:"specify-features",headingTag:"h3"}}),$t=new y({props:{code:"Y2xhc3NfbmFtZXMlMjAlM0QlMjAlNUIlMjJzYWRuZXNzJTIyJTJDJTIwJTIyam95JTIyJTJDJTIwJTIybG92ZSUyMiUyQyUyMCUyMmFuZ2VyJTIyJTJDJTIwJTIyZmVhciUyMiUyQyUyMCUyMnN1cnByaXNlJTIyJTVEJTBBZW1vdGlvbl9mZWF0dXJlcyUyMCUzRCUyMEZlYXR1cmVzKCU3Qid0ZXh0JyUzQSUyMFZhbHVlKCdzdHJpbmcnKSUyQyUyMCdsYWJlbCclM0ElMjBDbGFzc0xhYmVsKG5hbWVzJTNEY2xhc3NfbmFtZXMpJTdEKQ==",highlighted:`<span class="hljs-meta">>>> </span>class_names = [<span class="hljs-string">"sadness"</span>, <span class="hljs-string">"joy"</span>, <span class="hljs-string">"love"</span>, <span class="hljs-string">"anger"</span>, <span class="hljs-string">"fear"</span>, <span class="hljs-string">"surprise"</span>] | |
| <span class="hljs-meta">>>> </span>emotion_features = Features({<span class="hljs-string">'text'</span>: Value(<span class="hljs-string">'string'</span>), <span class="hljs-string">'label'</span>: ClassLabel(names=class_names)})`,wrap:!1}}),kt=new y({props:{code:"ZGF0YXNldCUyMCUzRCUyMGxvYWRfZGF0YXNldCgnY3N2JyUyQyUyMGRhdGFfZmlsZXMlM0RmaWxlX2RpY3QlMkMlMjBkZWxpbWl0ZXIlM0QnJTNCJyUyQyUyMGNvbHVtbl9uYW1lcyUzRCU1Qid0ZXh0JyUyQyUyMCdsYWJlbCclNUQlMkMlMjBmZWF0dXJlcyUzRGVtb3Rpb25fZmVhdHVyZXMp",highlighted:'<span class="hljs-meta">>>> </span>dataset = load_dataset(<span class="hljs-string">'csv'</span>, data_files=file_dict, delimiter=<span class="hljs-string">';'</span>, column_names=[<span class="hljs-string">'text'</span>, <span class="hljs-string">'label'</span>], features=emotion_features)',wrap:!1}}),It=new y({props:{code:"ZGF0YXNldCU1Qid0cmFpbiclNUQuZmVhdHVyZXM=",highlighted:`<span class="hljs-meta">>>> </span>dataset[<span class="hljs-string">'train'</span>].features | |
| {<span class="hljs-string">'text'</span>: Value(<span class="hljs-string">'string'</span>), | |
| <span class="hljs-string">'label'</span>: ClassLabel(names=[<span class="hljs-string">'sadness'</span>, <span class="hljs-string">'joy'</span>, <span class="hljs-string">'love'</span>, <span class="hljs-string">'anger'</span>, <span class="hljs-string">'fear'</span>, <span class="hljs-string">'surprise'</span>])}`,wrap:!1}}),Gt=new gn({props:{source:"https://github.com/huggingface/datasets/blob/main/docs/source/loading.mdx"}}),{c(){g=p("meta"),vt=l(),Zt=p("p"),Yt=l(),r($.$$.fragment),Xt=l(),r(C.$$.fragment),Wt=l(),k=p("p"),k.textContent=tl,Nt=l(),R=p("p"),R.textContent=al,zt=l(),I=p("ul"),I.innerHTML=el,Qt=l(),G=p("p"),G.innerHTML=ll,Vt=l(),_t=p("a"),Ht=l(),r(_.$$.fragment),Bt=l(),q=p("p"),q.innerHTML=nl,Lt=l(),Z=p("p"),Z.innerHTML=pl,St=l(),r(F.$$.fragment),Et=l(),x=p("p"),x.innerHTML=il,Dt=l(),r(v.$$.fragment),At=l(),j=p("blockquote"),j.innerHTML=ol,Pt=l(),Y=p("p"),Y.innerHTML=rl,Kt=l(),r(X.$$.fragment),Ot=l(),J=p("blockquote"),J.innerHTML=dl,sa=l(),W=p("p"),W.innerHTML=cl,ta=l(),r(N.$$.fragment),aa=l(),z=p("p"),z.innerHTML=ml,ea=l(),r(Q.$$.fragment),la=l(),r(V.$$.fragment),na=l(),H=p("p"),H.innerHTML=hl,pa=l(),r(B.$$.fragment),ia=l(),L=p("p"),L.textContent=ul,oa=l(),r(S.$$.fragment),ra=l(),T=p("blockquote"),T.innerHTML=yl,da=l(),r(E.$$.fragment),ca=l(),D=p("p"),D.innerHTML=Ml,ma=l(),r(A.$$.fragment),ha=l(),P=p("p"),P.textContent=fl,ua=l(),r(K.$$.fragment),ya=l(),O=p("p"),O.innerHTML=gl,Ma=l(),r(ss.$$.fragment),fa=l(),ts=p("p"),ts.textContent=jl,ga=l(),r(as.$$.fragment),ja=l(),es=p("p"),es.textContent=Jl,Ja=l(),r(ls.$$.fragment),Ta=l(),ns=p("p"),ns.textContent=Tl,wa=l(),ps=p("p"),ps.textContent=wl,ba=l(),r(is.$$.fragment),Ua=l(),os=p("p"),os.textContent=bl,$a=l(),r(rs.$$.fragment),Ca=l(),r(ds.$$.fragment),ka=l(),cs=p("p"),cs.textContent=Ul,Ra=l(),ms=p("p"),ms.textContent=$l,Ia=l(),r(hs.$$.fragment),Ga=l(),us=p("p"),us.textContent=Cl,_a=l(),r(ys.$$.fragment),qa=l(),Ms=p("p"),Ms.innerHTML=kl,Za=l(),r(fs.$$.fragment),Fa=l(),gs=p("p"),gs.innerHTML=Rl,xa=l(),js=p("p"),js.textContent=Il,va=l(),r(Js.$$.fragment),Ya=l(),Ts=p("p"),Ts.innerHTML=Gl,Xa=l(),r(ws.$$.fragment),Wa=l(),bs=p("p"),bs.textContent=_l,Na=l(),r(Us.$$.fragment),za=l(),$s=p("p"),$s.innerHTML=ql,Qa=l(),r(Cs.$$.fragment),Va=l(),w=p("blockquote"),w.innerHTML=Zl,Ha=l(),r(ks.$$.fragment),Ba=l(),Rs=p("p"),Rs.innerHTML=Fl,La=l(),Is=p("p"),Is.textContent=xl,Sa=l(),r(Gs.$$.fragment),Ea=l(),_s=p("p"),_s.textContent=vl,Da=l(),r(qs.$$.fragment),Aa=l(),r(Zs.$$.fragment),Pa=l(),Fs=p("p"),Fs.textContent=Yl,Ka=l(),xs=p("p"),xs.innerHTML=Xl,Oa=l(),r(vs.$$.fragment),se=l(),r(Ys.$$.fragment),te=l(),Xs=p("p"),Xs.innerHTML=Wl,ae=l(),r(Ws.$$.fragment),ee=l(),Ns=p("p"),Ns.innerHTML=Nl,le=l(),r(zs.$$.fragment),ne=l(),r(Qs.$$.fragment),pe=l(),Vs=p("p"),Vs.innerHTML=zl,ie=l(),r(Hs.$$.fragment),oe=l(),r(Bs.$$.fragment),re=l(),Ls=p("p"),Ls.innerHTML=Ql,de=l(),r(Ss.$$.fragment),ce=l(),Es=p("p"),Es.textContent=Vl,me=l(),Ds=p("p"),Ds.innerHTML=Hl,he=l(),r(As.$$.fragment),ue=l(),r(Ps.$$.fragment),ye=l(),Ks=p("p"),Ks.innerHTML=Bl,Me=l(),r(Os.$$.fragment),fe=l(),b=p("blockquote"),b.innerHTML=Ll,ge=l(),r(st.$$.fragment),je=l(),tt=p("p"),tt.textContent=Sl,Je=l(),at=p("p"),at.innerHTML=El,Te=l(),r(et.$$.fragment),we=l(),lt=p("p"),lt.innerHTML=Dl,be=l(),nt=p("p"),nt.innerHTML=Al,Ue=l(),r(pt.$$.fragment),$e=l(),it=p("p"),it.innerHTML=Pl,Ce=l(),r(ot.$$.fragment),ke=l(),rt=p("p"),rt.textContent=Kl,Re=l(),r(dt.$$.fragment),Ie=l(),ct=p("p"),ct.textContent=Ol,Ge=l(),r(mt.$$.fragment),_e=l(),ht=p("p"),ht.textContent=sn,qe=l(),r(ut.$$.fragment),Ze=l(),r(yt.$$.fragment),Fe=l(),Mt=p("p"),Mt.textContent=tn,xe=l(),r(ft.$$.fragment),ve=l(),gt=p("p"),gt.innerHTML=an,Ye=l(),r(jt.$$.fragment),Xe=l(),U=p("blockquote"),U.innerHTML=en,We=l(),qt=p("a"),Ne=l(),r(Jt.$$.fragment),ze=l(),Tt=p("p"),Tt.textContent=ln,Qe=l(),r(wt.$$.fragment),Ve=l(),bt=p("p"),bt.innerHTML=nn,He=l(),Ut=p("p"),Ut.innerHTML=pn,Be=l(),r($t.$$.fragment),Le=l(),Ct=p("p"),Ct.innerHTML=on,Se=l(),r(kt.$$.fragment),Ee=l(),Rt=p("p"),Rt.textContent=rn,De=l(),r(It.$$.fragment),Ae=l(),r(Gt.$$.fragment),Pe=l(),Ft=p("p"),this.h()},l(s){const t=yn("svelte-u9bgzb",document.head);g=i(t,"META",{name:!0,content:!0}),t.forEach(a),vt=n(s),Zt=i(s,"P",{}),Oe(Zt).forEach(a),Yt=n(s),d($.$$.fragment,s),Xt=n(s),d(C.$$.fragment,s),Wt=n(s),k=i(s,"P",{"data-svelte-h":!0}),o(k)!=="svelte-hbh3ke"&&(k.textContent=tl),Nt=n(s),R=i(s,"P",{"data-svelte-h":!0}),o(R)!=="svelte-ta2xky"&&(R.textContent=al),zt=n(s),I=i(s,"UL",{"data-svelte-h":!0}),o(I)!=="svelte-1iircxu"&&(I.innerHTML=el),Qt=n(s),G=i(s,"P",{"data-svelte-h":!0}),o(G)!=="svelte-1q7o0xf"&&(G.innerHTML=ll),Vt=n(s),_t=i(s,"A",{id:!0}),Oe(_t).forEach(a),Ht=n(s),d(_.$$.fragment,s),Bt=n(s),q=i(s,"P",{"data-svelte-h":!0}),o(q)!=="svelte-1e20l51"&&(q.innerHTML=nl),Lt=n(s),Z=i(s,"P",{"data-svelte-h":!0}),o(Z)!=="svelte-fqsv5w"&&(Z.innerHTML=pl),St=n(s),d(F.$$.fragment,s),Et=n(s),x=i(s,"P",{"data-svelte-h":!0}),o(x)!=="svelte-1iyrlkm"&&(x.innerHTML=il),Dt=n(s),d(v.$$.fragment,s),At=n(s),j=i(s,"BLOCKQUOTE",{class:!0,"data-svelte-h":!0}),o(j)!=="svelte-8z2p39"&&(j.innerHTML=ol),Pt=n(s),Y=i(s,"P",{"data-svelte-h":!0}),o(Y)!=="svelte-16ovrtc"&&(Y.innerHTML=rl),Kt=n(s),d(X.$$.fragment,s),Ot=n(s),J=i(s,"BLOCKQUOTE",{class:!0,"data-svelte-h":!0}),o(J)!=="svelte-11v68ph"&&(J.innerHTML=dl),sa=n(s),W=i(s,"P",{"data-svelte-h":!0}),o(W)!=="svelte-1i8sy5n"&&(W.innerHTML=cl),ta=n(s),d(N.$$.fragment,s),aa=n(s),z=i(s,"P",{"data-svelte-h":!0}),o(z)!=="svelte-11muxs5"&&(z.innerHTML=ml),ea=n(s),d(Q.$$.fragment,s),la=n(s),d(V.$$.fragment,s),na=n(s),H=i(s,"P",{"data-svelte-h":!0}),o(H)!=="svelte-1n3so6b"&&(H.innerHTML=hl),pa=n(s),d(B.$$.fragment,s),ia=n(s),L=i(s,"P",{"data-svelte-h":!0}),o(L)!=="svelte-fg4kbu"&&(L.textContent=ul),oa=n(s),d(S.$$.fragment,s),ra=n(s),T=i(s,"BLOCKQUOTE",{class:!0,"data-svelte-h":!0}),o(T)!=="svelte-tpewfq"&&(T.innerHTML=yl),da=n(s),d(E.$$.fragment,s),ca=n(s),D=i(s,"P",{"data-svelte-h":!0}),o(D)!=="svelte-gi9r9"&&(D.innerHTML=Ml),ma=n(s),d(A.$$.fragment,s),ha=n(s),P=i(s,"P",{"data-svelte-h":!0}),o(P)!=="svelte-lihevk"&&(P.textContent=fl),ua=n(s),d(K.$$.fragment,s),ya=n(s),O=i(s,"P",{"data-svelte-h":!0}),o(O)!=="svelte-uf74g6"&&(O.innerHTML=gl),Ma=n(s),d(ss.$$.fragment,s),fa=n(s),ts=i(s,"P",{"data-svelte-h":!0}),o(ts)!=="svelte-sv3kzg"&&(ts.textContent=jl),ga=n(s),d(as.$$.fragment,s),ja=n(s),es=i(s,"P",{"data-svelte-h":!0}),o(es)!=="svelte-xpufyl"&&(es.textContent=Jl),Ja=n(s),d(ls.$$.fragment,s),Ta=n(s),ns=i(s,"P",{"data-svelte-h":!0}),o(ns)!=="svelte-1iqvf3b"&&(ns.textContent=Tl),wa=n(s),ps=i(s,"P",{"data-svelte-h":!0}),o(ps)!=="svelte-h7czyc"&&(ps.textContent=wl),ba=n(s),d(is.$$.fragment,s),Ua=n(s),os=i(s,"P",{"data-svelte-h":!0}),o(os)!=="svelte-u11d8o"&&(os.textContent=bl),$a=n(s),d(rs.$$.fragment,s),Ca=n(s),d(ds.$$.fragment,s),ka=n(s),cs=i(s,"P",{"data-svelte-h":!0}),o(cs)!=="svelte-1hx1xv3"&&(cs.textContent=Ul),Ra=n(s),ms=i(s,"P",{"data-svelte-h":!0}),o(ms)!=="svelte-ma1qmh"&&(ms.textContent=$l),Ia=n(s),d(hs.$$.fragment,s),Ga=n(s),us=i(s,"P",{"data-svelte-h":!0}),o(us)!=="svelte-ttm9cj"&&(us.textContent=Cl),_a=n(s),d(ys.$$.fragment,s),qa=n(s),Ms=i(s,"P",{"data-svelte-h":!0}),o(Ms)!=="svelte-uhhmkw"&&(Ms.innerHTML=kl),Za=n(s),d(fs.$$.fragment,s),Fa=n(s),gs=i(s,"P",{"data-svelte-h":!0}),o(gs)!=="svelte-1doqc0y"&&(gs.innerHTML=Rl),xa=n(s),js=i(s,"P",{"data-svelte-h":!0}),o(js)!=="svelte-kab5dk"&&(js.textContent=Il),va=n(s),d(Js.$$.fragment,s),Ya=n(s),Ts=i(s,"P",{"data-svelte-h":!0}),o(Ts)!=="svelte-evm8bo"&&(Ts.innerHTML=Gl),Xa=n(s),d(ws.$$.fragment,s),Wa=n(s),bs=i(s,"P",{"data-svelte-h":!0}),o(bs)!=="svelte-1bmsagx"&&(bs.textContent=_l),Na=n(s),d(Us.$$.fragment,s),za=n(s),$s=i(s,"P",{"data-svelte-h":!0}),o($s)!=="svelte-vbtv89"&&($s.innerHTML=ql),Qa=n(s),d(Cs.$$.fragment,s),Va=n(s),w=i(s,"BLOCKQUOTE",{class:!0,"data-svelte-h":!0}),o(w)!=="svelte-1chq07d"&&(w.innerHTML=Zl),Ha=n(s),d(ks.$$.fragment,s),Ba=n(s),Rs=i(s,"P",{"data-svelte-h":!0}),o(Rs)!=="svelte-l9fgjb"&&(Rs.innerHTML=Fl),La=n(s),Is=i(s,"P",{"data-svelte-h":!0}),o(Is)!=="svelte-1e5cszd"&&(Is.textContent=xl),Sa=n(s),d(Gs.$$.fragment,s),Ea=n(s),_s=i(s,"P",{"data-svelte-h":!0}),o(_s)!=="svelte-12ynio"&&(_s.textContent=vl),Da=n(s),d(qs.$$.fragment,s),Aa=n(s),d(Zs.$$.fragment,s),Pa=n(s),Fs=i(s,"P",{"data-svelte-h":!0}),o(Fs)!=="svelte-1fk76jc"&&(Fs.textContent=Yl),Ka=n(s),xs=i(s,"P",{"data-svelte-h":!0}),o(xs)!=="svelte-eorgcn"&&(xs.innerHTML=Xl),Oa=n(s),d(vs.$$.fragment,s),se=n(s),d(Ys.$$.fragment,s),te=n(s),Xs=i(s,"P",{"data-svelte-h":!0}),o(Xs)!=="svelte-w04aqg"&&(Xs.innerHTML=Wl),ae=n(s),d(Ws.$$.fragment,s),ee=n(s),Ns=i(s,"P",{"data-svelte-h":!0}),o(Ns)!=="svelte-1ldlw3a"&&(Ns.innerHTML=Nl),le=n(s),d(zs.$$.fragment,s),ne=n(s),d(Qs.$$.fragment,s),pe=n(s),Vs=i(s,"P",{"data-svelte-h":!0}),o(Vs)!=="svelte-ajhscl"&&(Vs.innerHTML=zl),ie=n(s),d(Hs.$$.fragment,s),oe=n(s),d(Bs.$$.fragment,s),re=n(s),Ls=i(s,"P",{"data-svelte-h":!0}),o(Ls)!=="svelte-1pmayqr"&&(Ls.innerHTML=Ql),de=n(s),d(Ss.$$.fragment,s),ce=n(s),Es=i(s,"P",{"data-svelte-h":!0}),o(Es)!=="svelte-1plr9ti"&&(Es.textContent=Vl),me=n(s),Ds=i(s,"P",{"data-svelte-h":!0}),o(Ds)!=="svelte-i7ma5m"&&(Ds.innerHTML=Hl),he=n(s),d(As.$$.fragment,s),ue=n(s),d(Ps.$$.fragment,s),ye=n(s),Ks=i(s,"P",{"data-svelte-h":!0}),o(Ks)!=="svelte-1d1eten"&&(Ks.innerHTML=Bl),Me=n(s),d(Os.$$.fragment,s),fe=n(s),b=i(s,"BLOCKQUOTE",{class:!0,"data-svelte-h":!0}),o(b)!=="svelte-1nyi9vo"&&(b.innerHTML=Ll),ge=n(s),d(st.$$.fragment,s),je=n(s),tt=i(s,"P",{"data-svelte-h":!0}),o(tt)!=="svelte-z93cul"&&(tt.textContent=Sl),Je=n(s),at=i(s,"P",{"data-svelte-h":!0}),o(at)!=="svelte-1ryoreq"&&(at.innerHTML=El),Te=n(s),d(et.$$.fragment,s),we=n(s),lt=i(s,"P",{"data-svelte-h":!0}),o(lt)!=="svelte-j07ugg"&&(lt.innerHTML=Dl),be=n(s),nt=i(s,"P",{"data-svelte-h":!0}),o(nt)!=="svelte-1ctwwfa"&&(nt.innerHTML=Al),Ue=n(s),d(pt.$$.fragment,s),$e=n(s),it=i(s,"P",{"data-svelte-h":!0}),o(it)!=="svelte-luua70"&&(it.innerHTML=Pl),Ce=n(s),d(ot.$$.fragment,s),ke=n(s),rt=i(s,"P",{"data-svelte-h":!0}),o(rt)!=="svelte-a2ozuk"&&(rt.textContent=Kl),Re=n(s),d(dt.$$.fragment,s),Ie=n(s),ct=i(s,"P",{"data-svelte-h":!0}),o(ct)!=="svelte-1k7wt2n"&&(ct.textContent=Ol),Ge=n(s),d(mt.$$.fragment,s),_e=n(s),ht=i(s,"P",{"data-svelte-h":!0}),o(ht)!=="svelte-17uck7y"&&(ht.textContent=sn),qe=n(s),d(ut.$$.fragment,s),Ze=n(s),d(yt.$$.fragment,s),Fe=n(s),Mt=i(s,"P",{"data-svelte-h":!0}),o(Mt)!=="svelte-281shm"&&(Mt.textContent=tn),xe=n(s),d(ft.$$.fragment,s),ve=n(s),gt=i(s,"P",{"data-svelte-h":!0}),o(gt)!=="svelte-ofjevf"&&(gt.innerHTML=an),Ye=n(s),d(jt.$$.fragment,s),Xe=n(s),U=i(s,"BLOCKQUOTE",{class:!0,"data-svelte-h":!0}),o(U)!=="svelte-1fqy32a"&&(U.innerHTML=en),We=n(s),qt=i(s,"A",{id:!0}),Oe(qt).forEach(a),Ne=n(s),d(Jt.$$.fragment,s),ze=n(s),Tt=i(s,"P",{"data-svelte-h":!0}),o(Tt)!=="svelte-1ycmr6d"&&(Tt.textContent=ln),Qe=n(s),d(wt.$$.fragment,s),Ve=n(s),bt=i(s,"P",{"data-svelte-h":!0}),o(bt)!=="svelte-glx4ms"&&(bt.innerHTML=nn),He=n(s),Ut=i(s,"P",{"data-svelte-h":!0}),o(Ut)!=="svelte-1sv4qhf"&&(Ut.innerHTML=pn),Be=n(s),d($t.$$.fragment,s),Le=n(s),Ct=i(s,"P",{"data-svelte-h":!0}),o(Ct)!=="svelte-17zvwot"&&(Ct.innerHTML=on),Se=n(s),d(kt.$$.fragment,s),Ee=n(s),Rt=i(s,"P",{"data-svelte-h":!0}),o(Rt)!=="svelte-60x7wj"&&(Rt.textContent=rn),De=n(s),d(It.$$.fragment,s),Ae=n(s),d(Gt.$$.fragment,s),Pe=n(s),Ft=i(s,"P",{}),Oe(Ft).forEach(a),this.h()},h(){f(g,"name","hf:doc:metadata"),f(g,"content",Jn),f(_t,"id","load-from-the-hub"),f(j,"class","tip"),f(J,"class","warning"),f(T,"class","tip"),f(w,"class","tip"),f(b,"class","tip"),f(U,"class","warning"),f(qt,"id","troubleshoot")},m(s,t){Mn(document.head,g),e(s,vt,t),e(s,Zt,t),e(s,Yt,t),c($,s,t),e(s,Xt,t),c(C,s,t),e(s,Wt,t),e(s,k,t),e(s,Nt,t),e(s,R,t),e(s,zt,t),e(s,I,t),e(s,Qt,t),e(s,G,t),e(s,Vt,t),e(s,_t,t),e(s,Ht,t),c(_,s,t),e(s,Bt,t),e(s,q,t),e(s,Lt,t),e(s,Z,t),e(s,St,t),c(F,s,t),e(s,Et,t),e(s,x,t),e(s,Dt,t),c(v,s,t),e(s,At,t),e(s,j,t),e(s,Pt,t),e(s,Y,t),e(s,Kt,t),c(X,s,t),e(s,Ot,t),e(s,J,t),e(s,sa,t),e(s,W,t),e(s,ta,t),c(N,s,t),e(s,aa,t),e(s,z,t),e(s,ea,t),c(Q,s,t),e(s,la,t),c(V,s,t),e(s,na,t),e(s,H,t),e(s,pa,t),c(B,s,t),e(s,ia,t),e(s,L,t),e(s,oa,t),c(S,s,t),e(s,ra,t),e(s,T,t),e(s,da,t),c(E,s,t),e(s,ca,t),e(s,D,t),e(s,ma,t),c(A,s,t),e(s,ha,t),e(s,P,t),e(s,ua,t),c(K,s,t),e(s,ya,t),e(s,O,t),e(s,Ma,t),c(ss,s,t),e(s,fa,t),e(s,ts,t),e(s,ga,t),c(as,s,t),e(s,ja,t),e(s,es,t),e(s,Ja,t),c(ls,s,t),e(s,Ta,t),e(s,ns,t),e(s,wa,t),e(s,ps,t),e(s,ba,t),c(is,s,t),e(s,Ua,t),e(s,os,t),e(s,$a,t),c(rs,s,t),e(s,Ca,t),c(ds,s,t),e(s,ka,t),e(s,cs,t),e(s,Ra,t),e(s,ms,t),e(s,Ia,t),c(hs,s,t),e(s,Ga,t),e(s,us,t),e(s,_a,t),c(ys,s,t),e(s,qa,t),e(s,Ms,t),e(s,Za,t),c(fs,s,t),e(s,Fa,t),e(s,gs,t),e(s,xa,t),e(s,js,t),e(s,va,t),c(Js,s,t),e(s,Ya,t),e(s,Ts,t),e(s,Xa,t),c(ws,s,t),e(s,Wa,t),e(s,bs,t),e(s,Na,t),c(Us,s,t),e(s,za,t),e(s,$s,t),e(s,Qa,t),c(Cs,s,t),e(s,Va,t),e(s,w,t),e(s,Ha,t),c(ks,s,t),e(s,Ba,t),e(s,Rs,t),e(s,La,t),e(s,Is,t),e(s,Sa,t),c(Gs,s,t),e(s,Ea,t),e(s,_s,t),e(s,Da,t),c(qs,s,t),e(s,Aa,t),c(Zs,s,t),e(s,Pa,t),e(s,Fs,t),e(s,Ka,t),e(s,xs,t),e(s,Oa,t),c(vs,s,t),e(s,se,t),c(Ys,s,t),e(s,te,t),e(s,Xs,t),e(s,ae,t),c(Ws,s,t),e(s,ee,t),e(s,Ns,t),e(s,le,t),c(zs,s,t),e(s,ne,t),c(Qs,s,t),e(s,pe,t),e(s,Vs,t),e(s,ie,t),c(Hs,s,t),e(s,oe,t),c(Bs,s,t),e(s,re,t),e(s,Ls,t),e(s,de,t),c(Ss,s,t),e(s,ce,t),e(s,Es,t),e(s,me,t),e(s,Ds,t),e(s,he,t),c(As,s,t),e(s,ue,t),c(Ps,s,t),e(s,ye,t),e(s,Ks,t),e(s,Me,t),c(Os,s,t),e(s,fe,t),e(s,b,t),e(s,ge,t),c(st,s,t),e(s,je,t),e(s,tt,t),e(s,Je,t),e(s,at,t),e(s,Te,t),c(et,s,t),e(s,we,t),e(s,lt,t),e(s,be,t),e(s,nt,t),e(s,Ue,t),c(pt,s,t),e(s,$e,t),e(s,it,t),e(s,Ce,t),c(ot,s,t),e(s,ke,t),e(s,rt,t),e(s,Re,t),c(dt,s,t),e(s,Ie,t),e(s,ct,t),e(s,Ge,t),c(mt,s,t),e(s,_e,t),e(s,ht,t),e(s,qe,t),c(ut,s,t),e(s,Ze,t),c(yt,s,t),e(s,Fe,t),e(s,Mt,t),e(s,xe,t),c(ft,s,t),e(s,ve,t),e(s,gt,t),e(s,Ye,t),c(jt,s,t),e(s,Xe,t),e(s,U,t),e(s,We,t),e(s,qt,t),e(s,Ne,t),c(Jt,s,t),e(s,ze,t),e(s,Tt,t),e(s,Qe,t),c(wt,s,t),e(s,Ve,t),e(s,bt,t),e(s,He,t),e(s,Ut,t),e(s,Be,t),c($t,s,t),e(s,Le,t),e(s,Ct,t),e(s,Se,t),c(kt,s,t),e(s,Ee,t),e(s,Rt,t),e(s,De,t),c(It,s,t),e(s,Ae,t),c(Gt,s,t),e(s,Pe,t),e(s,Ft,t),Ke=!0},p:cn,i(s){Ke||(m($.$$.fragment,s),m(C.$$.fragment,s),m(_.$$.fragment,s),m(F.$$.fragment,s),m(v.$$.fragment,s),m(X.$$.fragment,s),m(N.$$.fragment,s),m(Q.$$.fragment,s),m(V.$$.fragment,s),m(B.$$.fragment,s),m(S.$$.fragment,s),m(E.$$.fragment,s),m(A.$$.fragment,s),m(K.$$.fragment,s),m(ss.$$.fragment,s),m(as.$$.fragment,s),m(ls.$$.fragment,s),m(is.$$.fragment,s),m(rs.$$.fragment,s),m(ds.$$.fragment,s),m(hs.$$.fragment,s),m(ys.$$.fragment,s),m(fs.$$.fragment,s),m(Js.$$.fragment,s),m(ws.$$.fragment,s),m(Us.$$.fragment,s),m(Cs.$$.fragment,s),m(ks.$$.fragment,s),m(Gs.$$.fragment,s),m(qs.$$.fragment,s),m(Zs.$$.fragment,s),m(vs.$$.fragment,s),m(Ys.$$.fragment,s),m(Ws.$$.fragment,s),m(zs.$$.fragment,s),m(Qs.$$.fragment,s),m(Hs.$$.fragment,s),m(Bs.$$.fragment,s),m(Ss.$$.fragment,s),m(As.$$.fragment,s),m(Ps.$$.fragment,s),m(Os.$$.fragment,s),m(st.$$.fragment,s),m(et.$$.fragment,s),m(pt.$$.fragment,s),m(ot.$$.fragment,s),m(dt.$$.fragment,s),m(mt.$$.fragment,s),m(ut.$$.fragment,s),m(yt.$$.fragment,s),m(ft.$$.fragment,s),m(jt.$$.fragment,s),m(Jt.$$.fragment,s),m(wt.$$.fragment,s),m($t.$$.fragment,s),m(kt.$$.fragment,s),m(It.$$.fragment,s),m(Gt.$$.fragment,s),Ke=!0)},o(s){h($.$$.fragment,s),h(C.$$.fragment,s),h(_.$$.fragment,s),h(F.$$.fragment,s),h(v.$$.fragment,s),h(X.$$.fragment,s),h(N.$$.fragment,s),h(Q.$$.fragment,s),h(V.$$.fragment,s),h(B.$$.fragment,s),h(S.$$.fragment,s),h(E.$$.fragment,s),h(A.$$.fragment,s),h(K.$$.fragment,s),h(ss.$$.fragment,s),h(as.$$.fragment,s),h(ls.$$.fragment,s),h(is.$$.fragment,s),h(rs.$$.fragment,s),h(ds.$$.fragment,s),h(hs.$$.fragment,s),h(ys.$$.fragment,s),h(fs.$$.fragment,s),h(Js.$$.fragment,s),h(ws.$$.fragment,s),h(Us.$$.fragment,s),h(Cs.$$.fragment,s),h(ks.$$.fragment,s),h(Gs.$$.fragment,s),h(qs.$$.fragment,s),h(Zs.$$.fragment,s),h(vs.$$.fragment,s),h(Ys.$$.fragment,s),h(Ws.$$.fragment,s),h(zs.$$.fragment,s),h(Qs.$$.fragment,s),h(Hs.$$.fragment,s),h(Bs.$$.fragment,s),h(Ss.$$.fragment,s),h(As.$$.fragment,s),h(Ps.$$.fragment,s),h(Os.$$.fragment,s),h(st.$$.fragment,s),h(et.$$.fragment,s),h(pt.$$.fragment,s),h(ot.$$.fragment,s),h(dt.$$.fragment,s),h(mt.$$.fragment,s),h(ut.$$.fragment,s),h(yt.$$.fragment,s),h(ft.$$.fragment,s),h(jt.$$.fragment,s),h(Jt.$$.fragment,s),h(wt.$$.fragment,s),h($t.$$.fragment,s),h(kt.$$.fragment,s),h(It.$$.fragment,s),h(Gt.$$.fragment,s),Ke=!1},d(s){s&&(a(vt),a(Zt),a(Yt),a(Xt),a(Wt),a(k),a(Nt),a(R),a(zt),a(I),a(Qt),a(G),a(Vt),a(_t),a(Ht),a(Bt),a(q),a(Lt),a(Z),a(St),a(Et),a(x),a(Dt),a(At),a(j),a(Pt),a(Y),a(Kt),a(Ot),a(J),a(sa),a(W),a(ta),a(aa),a(z),a(ea),a(la),a(na),a(H),a(pa),a(ia),a(L),a(oa),a(ra),a(T),a(da),a(ca),a(D),a(ma),a(ha),a(P),a(ua),a(ya),a(O),a(Ma),a(fa),a(ts),a(ga),a(ja),a(es),a(Ja),a(Ta),a(ns),a(wa),a(ps),a(ba),a(Ua),a(os),a($a),a(Ca),a(ka),a(cs),a(Ra),a(ms),a(Ia),a(Ga),a(us),a(_a),a(qa),a(Ms),a(Za),a(Fa),a(gs),a(xa),a(js),a(va),a(Ya),a(Ts),a(Xa),a(Wa),a(bs),a(Na),a(za),a($s),a(Qa),a(Va),a(w),a(Ha),a(Ba),a(Rs),a(La),a(Is),a(Sa),a(Ea),a(_s),a(Da),a(Aa),a(Pa),a(Fs),a(Ka),a(xs),a(Oa),a(se),a(te),a(Xs),a(ae),a(ee),a(Ns),a(le),a(ne),a(pe),a(Vs),a(ie),a(oe),a(re),a(Ls),a(de),a(ce),a(Es),a(me),a(Ds),a(he),a(ue),a(ye),a(Ks),a(Me),a(fe),a(b),a(ge),a(je),a(tt),a(Je),a(at),a(Te),a(we),a(lt),a(be),a(nt),a(Ue),a($e),a(it),a(Ce),a(ke),a(rt),a(Re),a(Ie),a(ct),a(Ge),a(_e),a(ht),a(qe),a(Ze),a(Fe),a(Mt),a(xe),a(ve),a(gt),a(Ye),a(Xe),a(U),a(We),a(qt),a(Ne),a(ze),a(Tt),a(Qe),a(Ve),a(bt),a(He),a(Ut),a(Be),a(Le),a(Ct),a(Se),a(Ee),a(Rt),a(De),a(Ae),a(Pe),a(Ft)),a(g),u($,s),u(C,s),u(_,s),u(F,s),u(v,s),u(X,s),u(N,s),u(Q,s),u(V,s),u(B,s),u(S,s),u(E,s),u(A,s),u(K,s),u(ss,s),u(as,s),u(ls,s),u(is,s),u(rs,s),u(ds,s),u(hs,s),u(ys,s),u(fs,s),u(Js,s),u(ws,s),u(Us,s),u(Cs,s),u(ks,s),u(Gs,s),u(qs,s),u(Zs,s),u(vs,s),u(Ys,s),u(Ws,s),u(zs,s),u(Qs,s),u(Hs,s),u(Bs,s),u(Ss,s),u(As,s),u(Ps,s),u(Os,s),u(st,s),u(et,s),u(pt,s),u(ot,s),u(dt,s),u(mt,s),u(ut,s),u(yt,s),u(ft,s),u(jt,s),u(Jt,s),u(wt,s),u($t,s),u(kt,s),u(It,s),u(Gt,s)}}}const Jn='{"title":"Load","local":"load","sections":[{"title":"Hugging Face Hub","local":"hugging-face-hub","sections":[],"depth":2},{"title":"Local and remote files","local":"local-and-remote-files","sections":[{"title":"CSV","local":"csv","sections":[],"depth":3},{"title":"JSON","local":"json","sections":[],"depth":3},{"title":"Parquet","local":"parquet","sections":[],"depth":3},{"title":"Arrow","local":"arrow","sections":[],"depth":3}],"depth":2},{"title":"HDF5 files","local":"hdf5-files","sections":[{"title":"SQL","local":"sql","sections":[],"depth":3},{"title":"WebDataset","local":"webdataset","sections":[],"depth":3}],"depth":2},{"title":"Multiprocessing","local":"multiprocessing","sections":[],"depth":2},{"title":"In-memory data","local":"in-memory-data","sections":[{"title":"Python dictionary","local":"python-dictionary","sections":[],"depth":3},{"title":"Python list of dictionaries","local":"python-list-of-dictionaries","sections":[],"depth":3},{"title":"Python generator","local":"python-generator","sections":[],"depth":3},{"title":"Pandas DataFrame","local":"pandas-dataframe","sections":[],"depth":3}],"depth":2},{"title":"Offline","local":"offline","sections":[],"depth":2},{"title":"Slice splits","local":"slice-splits","sections":[{"title":"Percent slicing and rounding","local":"percent-slicing-and-rounding","sections":[],"depth":3}],"depth":2},{"title":"Troubleshooting","local":"troubleshooting","sections":[{"title":"Specify features","local":"specify-features","sections":[],"depth":3}],"depth":2}],"depth":1}';function Tn(sl){return mn(()=>{new URLSearchParams(window.location.search).get("fw")}),[]}class kn extends hn{constructor(g){super(),un(this,g,Tn,jn,dn,{})}}export{kn as component}; | |
Xet Storage Details
- Size:
- 73.5 kB
- Xet hash:
- e03e6ec21546df31569a4d93e7dfe697f9dab7e3da245b546e5faa6505a35a66
·
Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.