Norah / tokenized_norah /dataset_info.json
Visdom9's picture
Pushing fine-tuned Norah model
3254881
{
"builder_name": "parquet",
"citation": "",
"config_name": "default",
"dataset_name": "oasst1",
"dataset_size": 106034902,
"description": "",
"download_checksums": {
"hf://datasets/OpenAssistant/oasst1@fdf72ae0827c1cda404aff25b6603abec9e3399b/data/train-00000-of-00001-b42a775f407cee45.parquet": {
"num_bytes": 39516251,
"checksum": null
},
"hf://datasets/OpenAssistant/oasst1@fdf72ae0827c1cda404aff25b6603abec9e3399b/data/validation-00000-of-00001-134b8fd0c89408b6.parquet": {
"num_bytes": 2080179,
"checksum": null
}
},
"download_size": 41596430,
"features": {
"labels": {
"feature": {
"dtype": "int64",
"_type": "Value"
},
"_type": "Sequence"
},
"input_ids": {
"feature": {
"dtype": "int32",
"_type": "Value"
},
"_type": "Sequence"
},
"attention_mask": {
"feature": {
"dtype": "int8",
"_type": "Value"
},
"_type": "Sequence"
}
},
"homepage": "",
"license": "",
"size_in_bytes": 147631332,
"splits": {
"train": {
"name": "train",
"num_bytes": 100770129,
"num_examples": 84437,
"dataset_name": "oasst1"
},
"validation": {
"name": "validation",
"num_bytes": 5264773,
"num_examples": 4401,
"dataset_name": "oasst1"
}
},
"version": {
"version_str": "0.0.0",
"major": 0,
"minor": 0,
"patch": 0
}
}