| { | |
| "best_global_step": null, | |
| "best_metric": null, | |
| "best_model_checkpoint": null, | |
| "epoch": 9.9697933227345, | |
| "eval_steps": 500, | |
| "global_step": 3140, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 1.0, | |
| "grad_norm": 76.48739624023438, | |
| "learning_rate": 1e-05, | |
| "loss": 36.0195, | |
| "step": 315 | |
| }, | |
| { | |
| "epoch": 1.0, | |
| "eval_loss": 27.172119140625, | |
| "eval_map": 0.1432, | |
| "eval_map_50": 0.279, | |
| "eval_map_75": 0.1349, | |
| "eval_map_car": 0.2849, | |
| "eval_map_large": 0.8516, | |
| "eval_map_medium": 0.3117, | |
| "eval_map_person": 0.0014, | |
| "eval_map_small": 0.0688, | |
| "eval_mar_1": 0.0714, | |
| "eval_mar_10": 0.1887, | |
| "eval_mar_100": 0.2291, | |
| "eval_mar_100_car": 0.4372, | |
| "eval_mar_100_person": 0.0209, | |
| "eval_mar_large": 0.9133, | |
| "eval_mar_medium": 0.4115, | |
| "eval_mar_small": 0.1605, | |
| "eval_runtime": 2499.781, | |
| "eval_samples_per_second": 1.193, | |
| "eval_steps_per_second": 0.149, | |
| "step": 315 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "grad_norm": 59.644962310791016, | |
| "learning_rate": 1e-05, | |
| "loss": 28.6156, | |
| "step": 630 | |
| }, | |
| { | |
| "epoch": 2.0, | |
| "eval_loss": 25.287906646728516, | |
| "eval_map": 0.1597, | |
| "eval_map_50": 0.2996, | |
| "eval_map_75": 0.1521, | |
| "eval_map_car": 0.3147, | |
| "eval_map_large": 0.8789, | |
| "eval_map_medium": 0.337, | |
| "eval_map_person": 0.0046, | |
| "eval_map_small": 0.0779, | |
| "eval_mar_1": 0.078, | |
| "eval_mar_10": 0.2055, | |
| "eval_mar_100": 0.2497, | |
| "eval_mar_100_car": 0.4628, | |
| "eval_mar_100_person": 0.0367, | |
| "eval_mar_large": 0.9173, | |
| "eval_mar_medium": 0.4386, | |
| "eval_mar_small": 0.1825, | |
| "eval_runtime": 2155.178, | |
| "eval_samples_per_second": 1.383, | |
| "eval_steps_per_second": 0.173, | |
| "step": 630 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "grad_norm": 73.48206329345703, | |
| "learning_rate": 1e-05, | |
| "loss": 26.5961, | |
| "step": 945 | |
| }, | |
| { | |
| "epoch": 3.0, | |
| "eval_loss": 24.46408462524414, | |
| "eval_map": 0.1679, | |
| "eval_map_50": 0.3171, | |
| "eval_map_75": 0.1572, | |
| "eval_map_car": 0.326, | |
| "eval_map_large": 0.8921, | |
| "eval_map_medium": 0.3481, | |
| "eval_map_person": 0.0098, | |
| "eval_map_small": 0.0817, | |
| "eval_mar_1": 0.0809, | |
| "eval_mar_10": 0.2137, | |
| "eval_mar_100": 0.259, | |
| "eval_mar_100_car": 0.473, | |
| "eval_mar_100_person": 0.045, | |
| "eval_mar_large": 0.9229, | |
| "eval_mar_medium": 0.4441, | |
| "eval_mar_small": 0.193, | |
| "eval_runtime": 2435.3923, | |
| "eval_samples_per_second": 1.224, | |
| "eval_steps_per_second": 0.153, | |
| "step": 945 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "grad_norm": 76.99701690673828, | |
| "learning_rate": 1e-05, | |
| "loss": 25.435, | |
| "step": 1260 | |
| }, | |
| { | |
| "epoch": 4.0, | |
| "eval_loss": 24.101743698120117, | |
| "eval_map": 0.1701, | |
| "eval_map_50": 0.3217, | |
| "eval_map_75": 0.1577, | |
| "eval_map_car": 0.329, | |
| "eval_map_large": 0.9002, | |
| "eval_map_medium": 0.3562, | |
| "eval_map_person": 0.0112, | |
| "eval_map_small": 0.0815, | |
| "eval_mar_1": 0.0816, | |
| "eval_mar_10": 0.2169, | |
| "eval_mar_100": 0.2601, | |
| "eval_mar_100_car": 0.469, | |
| "eval_mar_100_person": 0.0512, | |
| "eval_mar_large": 0.9272, | |
| "eval_mar_medium": 0.4479, | |
| "eval_mar_small": 0.1929, | |
| "eval_runtime": 2506.8205, | |
| "eval_samples_per_second": 1.189, | |
| "eval_steps_per_second": 0.149, | |
| "step": 1260 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "grad_norm": 49.34306335449219, | |
| "learning_rate": 1e-05, | |
| "loss": 24.7221, | |
| "step": 1575 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "eval_loss": 23.55514907836914, | |
| "eval_map": 0.1738, | |
| "eval_map_50": 0.3286, | |
| "eval_map_75": 0.162, | |
| "eval_map_car": 0.3357, | |
| "eval_map_large": 0.8986, | |
| "eval_map_medium": 0.3615, | |
| "eval_map_person": 0.0119, | |
| "eval_map_small": 0.0855, | |
| "eval_mar_1": 0.0833, | |
| "eval_mar_10": 0.2226, | |
| "eval_mar_100": 0.2717, | |
| "eval_mar_100_car": 0.4836, | |
| "eval_mar_100_person": 0.0597, | |
| "eval_mar_large": 0.9276, | |
| "eval_mar_medium": 0.462, | |
| "eval_mar_small": 0.2053, | |
| "eval_runtime": 2773.607, | |
| "eval_samples_per_second": 1.075, | |
| "eval_steps_per_second": 0.134, | |
| "step": 1575 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "grad_norm": 131.27320861816406, | |
| "learning_rate": 1e-05, | |
| "loss": 24.1639, | |
| "step": 1890 | |
| }, | |
| { | |
| "epoch": 6.0, | |
| "eval_loss": 23.345670700073242, | |
| "eval_map": 0.1761, | |
| "eval_map_50": 0.3319, | |
| "eval_map_75": 0.1641, | |
| "eval_map_car": 0.3412, | |
| "eval_map_large": 0.9016, | |
| "eval_map_medium": 0.3606, | |
| "eval_map_person": 0.0111, | |
| "eval_map_small": 0.0891, | |
| "eval_mar_1": 0.0838, | |
| "eval_mar_10": 0.2249, | |
| "eval_mar_100": 0.267, | |
| "eval_mar_100_car": 0.4749, | |
| "eval_mar_100_person": 0.059, | |
| "eval_mar_large": 0.9265, | |
| "eval_mar_medium": 0.4539, | |
| "eval_mar_small": 0.2003, | |
| "eval_runtime": 2907.3675, | |
| "eval_samples_per_second": 1.025, | |
| "eval_steps_per_second": 0.128, | |
| "step": 1890 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "grad_norm": 67.19497680664062, | |
| "learning_rate": 1e-05, | |
| "loss": 23.581, | |
| "step": 2205 | |
| }, | |
| { | |
| "epoch": 7.0, | |
| "eval_loss": 23.021814346313477, | |
| "eval_map": 0.1801, | |
| "eval_map_50": 0.3415, | |
| "eval_map_75": 0.1687, | |
| "eval_map_car": 0.3475, | |
| "eval_map_large": 0.9111, | |
| "eval_map_medium": 0.3682, | |
| "eval_map_person": 0.0126, | |
| "eval_map_small": 0.0924, | |
| "eval_mar_1": 0.0854, | |
| "eval_mar_10": 0.2295, | |
| "eval_mar_100": 0.2735, | |
| "eval_mar_100_car": 0.4829, | |
| "eval_mar_100_person": 0.064, | |
| "eval_mar_large": 0.9356, | |
| "eval_mar_medium": 0.4619, | |
| "eval_mar_small": 0.2061, | |
| "eval_runtime": 2783.5554, | |
| "eval_samples_per_second": 1.071, | |
| "eval_steps_per_second": 0.134, | |
| "step": 2205 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "grad_norm": 57.127410888671875, | |
| "learning_rate": 1e-05, | |
| "loss": 23.1336, | |
| "step": 2520 | |
| }, | |
| { | |
| "epoch": 8.0, | |
| "eval_loss": 22.81333351135254, | |
| "eval_map": 0.1817, | |
| "eval_map_50": 0.3458, | |
| "eval_map_75": 0.1673, | |
| "eval_map_car": 0.3507, | |
| "eval_map_large": 0.9122, | |
| "eval_map_medium": 0.3723, | |
| "eval_map_person": 0.0127, | |
| "eval_map_small": 0.0959, | |
| "eval_mar_1": 0.0852, | |
| "eval_mar_10": 0.234, | |
| "eval_mar_100": 0.2782, | |
| "eval_mar_100_car": 0.4868, | |
| "eval_mar_100_person": 0.0697, | |
| "eval_mar_large": 0.9352, | |
| "eval_mar_medium": 0.4682, | |
| "eval_mar_small": 0.2108, | |
| "eval_runtime": 2098.1242, | |
| "eval_samples_per_second": 1.421, | |
| "eval_steps_per_second": 0.178, | |
| "step": 2520 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "grad_norm": 59.762691497802734, | |
| "learning_rate": 1e-05, | |
| "loss": 22.6498, | |
| "step": 2835 | |
| }, | |
| { | |
| "epoch": 9.0, | |
| "eval_loss": 22.81146240234375, | |
| "eval_map": 0.1823, | |
| "eval_map_50": 0.3478, | |
| "eval_map_75": 0.1683, | |
| "eval_map_car": 0.3508, | |
| "eval_map_large": 0.9137, | |
| "eval_map_medium": 0.3758, | |
| "eval_map_person": 0.0139, | |
| "eval_map_small": 0.0948, | |
| "eval_mar_1": 0.0856, | |
| "eval_mar_10": 0.2347, | |
| "eval_mar_100": 0.2818, | |
| "eval_mar_100_car": 0.4884, | |
| "eval_mar_100_person": 0.0751, | |
| "eval_mar_large": 0.9358, | |
| "eval_mar_medium": 0.4691, | |
| "eval_mar_small": 0.2148, | |
| "eval_runtime": 2084.2213, | |
| "eval_samples_per_second": 1.43, | |
| "eval_steps_per_second": 0.179, | |
| "step": 2835 | |
| }, | |
| { | |
| "epoch": 9.9697933227345, | |
| "grad_norm": 106.53839874267578, | |
| "learning_rate": 1e-05, | |
| "loss": 22.3868, | |
| "step": 3140 | |
| }, | |
| { | |
| "epoch": 9.9697933227345, | |
| "eval_loss": 22.58209991455078, | |
| "eval_map": 0.181, | |
| "eval_map_50": 0.35, | |
| "eval_map_75": 0.164, | |
| "eval_map_car": 0.3473, | |
| "eval_map_large": 0.9135, | |
| "eval_map_medium": 0.3758, | |
| "eval_map_person": 0.0147, | |
| "eval_map_small": 0.0954, | |
| "eval_mar_1": 0.0856, | |
| "eval_mar_10": 0.2359, | |
| "eval_mar_100": 0.2819, | |
| "eval_mar_100_car": 0.4911, | |
| "eval_mar_100_person": 0.0727, | |
| "eval_mar_large": 0.9371, | |
| "eval_mar_medium": 0.4688, | |
| "eval_mar_small": 0.2158, | |
| "eval_runtime": 2104.4987, | |
| "eval_samples_per_second": 1.416, | |
| "eval_steps_per_second": 0.177, | |
| "step": 3140 | |
| }, | |
| { | |
| "epoch": 9.9697933227345, | |
| "step": 3140, | |
| "total_flos": 5.249371936187105e+18, | |
| "train_loss": 25.740980325686703, | |
| "train_runtime": 34062.6711, | |
| "train_samples_per_second": 1.476, | |
| "train_steps_per_second": 0.092 | |
| } | |
| ], | |
| "logging_steps": 500, | |
| "max_steps": 3140, | |
| "num_input_tokens_seen": 0, | |
| "num_train_epochs": 10, | |
| "save_steps": 500, | |
| "stateful_callbacks": { | |
| "TrainerControl": { | |
| "args": { | |
| "should_epoch_stop": false, | |
| "should_evaluate": false, | |
| "should_log": false, | |
| "should_save": true, | |
| "should_training_stop": true | |
| }, | |
| "attributes": {} | |
| } | |
| }, | |
| "total_flos": 5.249371936187105e+18, | |
| "train_batch_size": 8, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |