| {"step": 2500, "acc_step": 0, "data_loader_state": {"it_state": {"start_token": 4371, "it_state": {"it_state": {"root_dir": "/scratch/dyvm6xra/dyvm6xrauseryuhao/dataset/Pretraining_Dataset", "sources": {"data1": 1.0}, "source_to_state": {"data1": {"file_path": "/scratch/dyvm6xra/dyvm6xrauseryuhao/dataset/Pretraining_Dataset/data1/data1.chunk.00.jsonl", "position": 44372642, "block_size": 8, "offset": 7, "current_iter": 1}}, "rng_state": {"bit_generator": "PCG64", "state": {"state": 98717493748280879239644659893389689105, "inc": 53245743019587277358203950863334653629}, "has_uint32": 0, "uinteger": 0}}, "add_bos": true, "add_eos": true, "name": "hf", "path": "/scratch/dyvm6xra/dyvm6xrauseryuhao/dream-training/Qwen2.5-7B-dcp"}, "output_seq_len": 4096, "n_views": 2}, "seq_idx": 452, "rng_state": {"bit_generator": "PCG64", "state": {"state": 73407772541118432696768880670808056645, "inc": 19761753544780285878460645500694854795}, "has_uint32": 1, "uinteger": 1182720522}, "batch_size": 1, "prefetch_size": 1024}, "scheduler": {"base_lrs": [1e-05], "last_epoch": 2500, "verbose": false, "_step_count": 2501, "_get_lr_called_within_step": false, "_last_lr": [5e-06], "lr_lambdas": [{}]}} |