autoprogrammer's picture
SDAR-4B mbc SFT on ESFT-law (final)
ca81fa7 verified
{"current_steps": 5, "total_steps": 45, "loss": 2.1775, "lr": 9.946716840375552e-06, "epoch": 0.3448275862068966, "percentage": 11.11, "elapsed_time": "0:00:30", "remaining_time": "0:04:00"}
{"current_steps": 10, "total_steps": 45, "loss": 1.6103, "lr": 9.36024704071904e-06, "epoch": 0.6896551724137931, "percentage": 22.22, "elapsed_time": "0:01:16", "remaining_time": "0:04:28"}
{"current_steps": 15, "total_steps": 45, "loss": 1.3979, "lr": 8.198365107794457e-06, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "0:01:38", "remaining_time": "0:03:16"}
{"current_steps": 20, "total_steps": 45, "loss": 1.1536, "lr": 6.614402023857231e-06, "epoch": 1.3448275862068966, "percentage": 44.44, "elapsed_time": "0:02:27", "remaining_time": "0:03:04"}
{"current_steps": 25, "total_steps": 45, "loss": 1.0346, "lr": 4.817389884711706e-06, "epoch": 1.6896551724137931, "percentage": 55.56, "elapsed_time": "0:02:51", "remaining_time": "0:02:17"}
{"current_steps": 30, "total_steps": 45, "loss": 0.8237, "lr": 3.044476397549221e-06, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "0:03:14", "remaining_time": "0:01:37"}
{"current_steps": 35, "total_steps": 45, "loss": 0.7871, "lr": 1.5296290238968303e-06, "epoch": 2.344827586206897, "percentage": 77.78, "elapsed_time": "0:03:55", "remaining_time": "0:01:07"}
{"current_steps": 40, "total_steps": 45, "loss": 0.7327, "lr": 4.727588125342669e-07, "epoch": 2.689655172413793, "percentage": 88.89, "elapsed_time": "0:04:19", "remaining_time": "0:00:32"}
{"current_steps": 45, "total_steps": 45, "loss": 0.6658, "lr": 1.333858168224178e-08, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:04:48", "remaining_time": "0:00:00"}
{"current_steps": 45, "total_steps": 45, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:05:05", "remaining_time": "0:00:00"}