| { | |
| "raw_selected_examples": 25000, | |
| "kept_examples": 25000, | |
| "filtered_examples_total": 0, | |
| "filtered_examples_empty_problem_or_response": 0, | |
| "filtered_examples_missing_stage3_tokens": 0, | |
| "examples_with_non_empty_stage2": 25000, | |
| "examples_with_non_empty_stage3": 25000, | |
| "samples_with_valid_answer_spans": 25000, | |
| "samples_with_numeric_answers": 24867, | |
| "samples_excluded_or_degraded": 0, | |
| "samples_truncated_to_max_seq_length": 0, | |
| "samples_with_answer_span_truncated": 0, | |
| "train_eval_partition_strategy": "single_split_shuffle_then_dedup_by_problem_answer_signature", | |
| "train_eval_split_source": "train", | |
| "train_examples_written": 22500, | |
| "eval_examples_written": 1760, | |
| "eval_candidates_dropped_signature_overlap": 740, | |
| "dataset_name": "metamath_qa", | |
| "upstream_split": "train", | |
| "dataset_seed": 11, | |
| "preprocessing_settings": { | |
| "cache_dir": "./.cache/hf_datasets", | |
| "eval_fraction": 0.1, | |
| "max_seq_length": 4096, | |
| "seed": 11, | |
| "split": "train", | |
| "subset_size": 25000 | |
| }, | |
| "selected_sample_ids_hash": "70022c80c635901076a799be6fe83ba924bad908c0b242c2a746a23ceb3e86e3", | |
| "selected_sample_count": 25000, | |
| "train_sample_ids_hash": "dd0fd108e819feee53926d4a57f1857e1aa5515d1595fbb3a9ac2be292a8f746", | |
| "eval_sample_ids_hash": "ce705200861db74727559b9a50b132eddf4d365c4375a076eaa1c89c5d2c7ee8", | |
| "train_sample_count": 22500, | |
| "eval_sample_count": 1760, | |
| "dataset_fingerprint": "3e24605ae1a046959bfb217607e9dfb2f6cfc41609949391757d19a77050cdb6", | |
| "dataset_split": "train", | |
| "dataset_subset_size": 25000, | |
| "dataset_eval_fraction": 0.1 | |
| } |