Buckets:

99 GB
58,246 files
Updated 3 months ago
NameSize
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000661.jsonl.zst2.27 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000662.jsonl.zst2.4 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000664.jsonl.zst2.71 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000665.jsonl.zst2.15 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000667.jsonl.zst2.88 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000668.jsonl.zst2.19 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000669.jsonl.zst2.66 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000670.jsonl.zst2.25 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000671.jsonl.zst2.43 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000672.jsonl.zst1.86 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000673.jsonl.zst2.15 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000675.jsonl.zst2.32 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000677.jsonl.zst2.37 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000678.jsonl.zst2.3 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000679.jsonl.zst2.37 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000680.jsonl.zst1.92 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000681.jsonl.zst2.4 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000682.jsonl.zst2.64 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000683.jsonl.zst2.07 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000684.jsonl.zst2.32 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000685.jsonl.zst2.09 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000686.jsonl.zst2.21 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000687.jsonl.zst2.18 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000689.jsonl.zst2.44 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000690.jsonl.zst2.2 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000691.jsonl.zst3.12 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000692.jsonl.zst2.27 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000693.jsonl.zst2.39 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000694.jsonl.zst2.45 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000695.jsonl.zst2.34 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000696.jsonl.zst2.51 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000699.jsonl.zst1.17 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000700.jsonl.zst2.29 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000701.jsonl.zst2.21 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000702.jsonl.zst2.15 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000703.jsonl.zst1.85 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000704.jsonl.zst1.96 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000705.jsonl.zst2.28 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000706.jsonl.zst2.23 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000707.jsonl.zst2.6 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0013__shard_00000708.jsonl.zst1.71 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000000.jsonl.zst2.01 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000001.jsonl.zst2.01 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000002.jsonl.zst1.99 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000003.jsonl.zst1.84 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000004.jsonl.zst1.77 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000005.jsonl.zst2.33 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000006.jsonl.zst1.98 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000007.jsonl.zst1.94 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000008.jsonl.zst2.16 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000009.jsonl.zst2.09 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000010.jsonl.zst2.09 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000011.jsonl.zst2.33 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000012.jsonl.zst1.91 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000013.jsonl.zst1.68 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000014.jsonl.zst2.35 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000015.jsonl.zst2.39 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000016.jsonl.zst2.02 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000017.jsonl.zst1.82 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000018.jsonl.zst2.07 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000019.jsonl.zst1.73 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000020.jsonl.zst2.24 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000021.jsonl.zst2.25 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000022.jsonl.zst2.14 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000023.jsonl.zst1.79 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000024.jsonl.zst1.78 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000025.jsonl.zst2.16 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000026.jsonl.zst2.27 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000027.jsonl.zst2.28 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000028.jsonl.zst1.69 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000029.jsonl.zst1.97 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000030.jsonl.zst2.07 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000031.jsonl.zst2.09 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000032.jsonl.zst2.18 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000033.jsonl.zst2 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000034.jsonl.zst1.87 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000035.jsonl.zst2.25 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000036.jsonl.zst1.8 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000037.jsonl.zst1.67 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000038.jsonl.zst2.07 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000039.jsonl.zst2.09 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000040.jsonl.zst1.71 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000041.jsonl.zst1.82 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000042.jsonl.zst1.94 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000043.jsonl.zst2.02 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000044.jsonl.zst2.03 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000045.jsonl.zst2.4 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000046.jsonl.zst1.9 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000047.jsonl.zst2.08 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000048.jsonl.zst1.79 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000049.jsonl.zst2.01 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000050.jsonl.zst2.03 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000051.jsonl.zst2.1 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000052.jsonl.zst1.92 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000053.jsonl.zst1.95 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000054.jsonl.zst2.1 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000055.jsonl.zst2.09 MB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000056.jsonl.zst944 kB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000057.jsonl.zst791 kB
xet
soc127__phase1_pool_shared__common_crawl__part_004__data__common_crawl-science_math_and_technology-0014__shard_00000058.jsonl.zst713 kB
xet
Total size
99 GB
Files
58,246
Last updated
Mar 23
Pre-warmed CDN
US EU US EU

Contributors