oit002gemma3 / trainer_log.jsonl
gpetruzella's picture
Upload 18 files
21fa42a verified
{"current_steps": 5, "total_steps": 36, "loss": 5.4762, "lr": 4.849231551964771e-05, "epoch": 0.43956043956043955, "percentage": 13.89, "elapsed_time": "0:00:12", "remaining_time": "0:01:19", "throughput": 1034.76, "total_tokens": 13272}
{"current_steps": 10, "total_steps": 36, "loss": 3.9653, "lr": 4.267766952966369e-05, "epoch": 0.8791208791208791, "percentage": 27.78, "elapsed_time": "0:00:24", "remaining_time": "0:01:03", "throughput": 1031.28, "total_tokens": 25368}
{"current_steps": 15, "total_steps": 36, "loss": 3.2543, "lr": 3.355050358314172e-05, "epoch": 1.2637362637362637, "percentage": 41.67, "elapsed_time": "0:00:35", "remaining_time": "0:00:49", "throughput": 1027.32, "total_tokens": 36568}
{"current_steps": 20, "total_steps": 36, "loss": 2.9243, "lr": 2.2821106431308544e-05, "epoch": 1.7032967032967035, "percentage": 55.56, "elapsed_time": "0:00:49", "remaining_time": "0:00:39", "throughput": 1000.4, "total_tokens": 49360}
{"current_steps": 25, "total_steps": 36, "loss": 2.6278, "lr": 1.2500000000000006e-05, "epoch": 2.087912087912088, "percentage": 69.44, "elapsed_time": "0:01:00", "remaining_time": "0:00:26", "throughput": 1001.62, "total_tokens": 60992}
{"current_steps": 30, "total_steps": 36, "loss": 2.6988, "lr": 4.521198892775203e-06, "epoch": 2.5274725274725274, "percentage": 83.33, "elapsed_time": "0:01:14", "remaining_time": "0:00:14", "throughput": 981.11, "total_tokens": 72872}
{"current_steps": 35, "total_steps": 36, "loss": 2.7677, "lr": 3.7980617469479953e-07, "epoch": 2.967032967032967, "percentage": 97.22, "elapsed_time": "0:01:27", "remaining_time": "0:00:02", "throughput": 977.06, "total_tokens": 85304}
{"current_steps": 36, "total_steps": 36, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:01:28", "remaining_time": "0:00:00", "throughput": 968.13, "total_tokens": 85968}