leideng/QCFuse / data /final_data /ruler_blend_metadata.json
leideng's picture
download
raw
1.86 kB
{
"script_version": "qcfuse-ruler-v1-10k-cache-count",
"tasks": {
"vt": {
"output": "ruler_vt.jsonl",
"template": "Find all variables that are assigned the value {query} in the text above."
},
"niah_multiquery": {
"output": "ruler_mq.jsonl",
"template": "What are all the special magic numbers for {query} mentioned in the provided text?"
},
"niah_multivalue": {
"output": "ruler_mv.jsonl",
"template": "What are all the special magic numbers for {query} mentioned in the provided text?"
}
},
"raw_save_dir": "/data/ldeng/code/kvbridge/QCFuse/data/ruler_raw/421fbba47bd64a20",
"raw_config": {
"script_version": "qcfuse-ruler-v1-10k-cache-count",
"ruler_git_rev": "ab17b7853df4e0a30b78cd5d2b463ac7dff6ee13",
"generator_source_hashes": {
"niah.py": "eef12b62d5fcc177df307f26c4722b57229fc8955cfa0c48ece37a1f95a4223e",
"variable_tracking.py": "7e221ff8a276a21ca1320d64cb9ab12e5b2dc6978b56e16fa1dfbaa0816c27b8"
},
"subset": "validation",
"tokenizer_path": "/public/models/Qwen3-8B",
"tokenizer_type": "hf",
"model_template_type": "base",
"ruler_max_seq_length": 11264,
"raw_num_samples": 1000,
"seed": 42
},
"final_num_samples_per_task": 200,
"raw_num_samples_per_task": 1000,
"chunk_size": 512,
"target_num_chunks": 20,
"target_context_tokens": 10240,
"ruler_max_seq_length": 11264,
"stats_by_task": {
"vt": {
"kept": 200,
"skipped_short": 0,
"skipped_missing_evidence": 0,
"skipped_bad_fields": 0
},
"niah_multiquery": {
"kept": 200,
"skipped_short": 6,
"skipped_missing_evidence": 0,
"skipped_bad_fields": 0
},
"niah_multivalue": {
"kept": 200,
"skipped_short": 3,
"skipped_missing_evidence": 0,
"skipped_bad_fields": 0
}
}
}

Xet Storage Details

Size:
1.86 kB
·
Xet hash:
987594f71da9969846a5c5736c5bda1da605384707ec6cd9b72098f0250e79ed

Xet efficiently stores files, intelligently splitting them into unique chunks and accelerating uploads and downloads. More info.