Instructions to use TomPanda/LLM-Restate-Discllaw with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- PEFT
How to use TomPanda/LLM-Restate-Discllaw with PEFT:
```python
from peft import PeftModel
from transformers import AutoModelForCausalLM

base_model = AutoModelForCausalLM.from_pretrained("/data/oss_bucket_0/mushuang/disc/")
model = PeftModel.from_pretrained(base_model, "TomPanda/LLM-Restate-Discllaw")
```
- Notebooks
- Google Colab
- Kaggle
| {"current_steps": 10, "total_steps": 814, "loss": 0.1401, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.996276622795847e-06, "epoch": 0.02, "percentage": 1.23, "elapsed_time": "0:05:49", "remaining_time": "7:47:40"} | |
| {"current_steps": 10, "total_steps": 814, "loss": 0.1401, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.996276622795847e-06, "epoch": 0.02, "percentage": 1.23, "elapsed_time": "0:05:47", "remaining_time": "7:45:00"} | |
| {"current_steps": 20, "total_steps": 814, "loss": 0.0684, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.98511203659851e-06, "epoch": 0.05, "percentage": 2.46, "elapsed_time": "0:11:52", "remaining_time": "7:51:43"} | |
| {"current_steps": 20, "total_steps": 814, "loss": 0.0684, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.98511203659851e-06, "epoch": 0.05, "percentage": 2.46, "elapsed_time": "0:11:53", "remaining_time": "7:51:59"} | |
| {"current_steps": 20, "total_steps": 814, "loss": 0.0684, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.98511203659851e-06, "epoch": 0.05, "percentage": 2.46, "elapsed_time": "0:11:50", "remaining_time": "7:50:24"} | |
| {"current_steps": 30, "total_steps": 814, "loss": 0.051, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.966522869394282e-06, "epoch": 0.07, "percentage": 3.69, "elapsed_time": "0:17:54", "remaining_time": "7:47:57"} | |
| {"current_steps": 30, "total_steps": 814, "loss": 0.051, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.966522869394282e-06, "epoch": 0.07, "percentage": 3.69, "elapsed_time": "0:17:52", "remaining_time": "7:47:06"} | |
| {"current_steps": 40, "total_steps": 814, "loss": 0.0444, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.940536806975732e-06, "epoch": 0.1, "percentage": 4.91, "elapsed_time": "0:23:58", "remaining_time": "7:43:49"} | |
| {"current_steps": 40, "total_steps": 814, "loss": 0.0444, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.940536806975732e-06, "epoch": 0.1, "percentage": 4.91, "elapsed_time": "0:23:58", "remaining_time": "7:43:57"} | |
| {"current_steps": 40, "total_steps": 814, "loss": 0.0444, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.940536806975732e-06, "epoch": 0.1, "percentage": 4.91, "elapsed_time": "0:23:56", "remaining_time": "7:43:11"} | |
| {"current_steps": 50, "total_steps": 814, "loss": 0.0436, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.907192551707831e-06, "epoch": 0.12, "percentage": 6.14, "elapsed_time": "0:30:01", "remaining_time": "7:38:44"} | |
| {"current_steps": 50, "total_steps": 814, "loss": 0.0436, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.907192551707831e-06, "epoch": 0.12, "percentage": 6.14, "elapsed_time": "0:29:59", "remaining_time": "7:38:14"} | |
| {"current_steps": 60, "total_steps": 814, "loss": 0.038, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.866539764886562e-06, "epoch": 0.15, "percentage": 7.37, "elapsed_time": "0:36:04", "remaining_time": "7:33:21"} | |
| {"current_steps": 60, "total_steps": 814, "loss": 0.038, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.866539764886562e-06, "epoch": 0.15, "percentage": 7.37, "elapsed_time": "0:36:02", "remaining_time": "7:32:56"} | |
| {"current_steps": 70, "total_steps": 814, "loss": 0.0421, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.818638992775822e-06, "epoch": 0.17, "percentage": 8.6, "elapsed_time": "0:42:06", "remaining_time": "7:27:34"} | |
| {"current_steps": 70, "total_steps": 814, "loss": 0.0421, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.818638992775822e-06, "epoch": 0.17, "percentage": 8.6, "elapsed_time": "0:42:04", "remaining_time": "7:27:13"} | |
| {"current_steps": 80, "total_steps": 814, "loss": 0.0415, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.763561576432781e-06, "epoch": 0.2, "percentage": 9.83, "elapsed_time": "0:48:08", "remaining_time": "7:21:37"} | |
| {"current_steps": 80, "total_steps": 814, "loss": 0.0415, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.763561576432781e-06, "epoch": 0.2, "percentage": 9.83, "elapsed_time": "0:48:05", "remaining_time": "7:21:15"} | |
| {"current_steps": 90, "total_steps": 814, "loss": 0.0402, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.70138954545603e-06, "epoch": 0.22, "percentage": 11.06, "elapsed_time": "0:54:08", "remaining_time": "7:15:35"} | |
| {"current_steps": 90, "total_steps": 814, "loss": 0.0402, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.70138954545603e-06, "epoch": 0.22, "percentage": 11.06, "elapsed_time": "0:54:06", "remaining_time": "7:15:20"} | |
| {"current_steps": 100, "total_steps": 814, "loss": 0.0375, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.632215495814724e-06, "epoch": 0.25, "percentage": 12.29, "elapsed_time": "1:00:10", "remaining_time": "7:09:41"} | |
| {"current_steps": 100, "total_steps": 814, "loss": 0.0375, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.632215495814724e-06, "epoch": 0.25, "percentage": 12.29, "elapsed_time": "1:00:08", "remaining_time": "7:09:27"} | |
| {"current_steps": 110, "total_steps": 814, "loss": 0.0362, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.55614245194068e-06, "epoch": 0.27, "percentage": 13.51, "elapsed_time": "1:06:12", "remaining_time": "7:03:45"} | |
| {"current_steps": 110, "total_steps": 814, "loss": 0.0362, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.55614245194068e-06, "epoch": 0.27, "percentage": 13.51, "elapsed_time": "1:06:10", "remaining_time": "7:03:30"} | |
| {"current_steps": 120, "total_steps": 814, "loss": 0.0373, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.473283713288862e-06, "epoch": 0.29, "percentage": 14.74, "elapsed_time": "1:12:15", "remaining_time": "6:57:56"} | |
| {"current_steps": 120, "total_steps": 814, "loss": 0.0373, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.473283713288862e-06, "epoch": 0.29, "percentage": 14.74, "elapsed_time": "1:12:13", "remaining_time": "6:57:42"} | |
| {"current_steps": 130, "total_steps": 814, "loss": 0.0375, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.383762685594736e-06, "epoch": 0.32, "percentage": 15.97, "elapsed_time": "1:18:17", "remaining_time": "6:51:53"} | |
| {"current_steps": 130, "total_steps": 814, "loss": 0.0375, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.383762685594736e-06, "epoch": 0.32, "percentage": 15.97, "elapsed_time": "1:18:15", "remaining_time": "6:51:43"} | |
| {"current_steps": 140, "total_steps": 814, "loss": 0.0374, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.287712697079827e-06, "epoch": 0.34, "percentage": 17.2, "elapsed_time": "1:24:20", "remaining_time": "6:46:03"} | |
| {"current_steps": 140, "total_steps": 814, "loss": 0.0374, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.287712697079827e-06, "epoch": 0.34, "percentage": 17.2, "elapsed_time": "1:24:18", "remaining_time": "6:45:52"} | |
| {"current_steps": 150, "total_steps": 814, "loss": 0.0358, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.185276799879212e-06, "epoch": 0.37, "percentage": 18.43, "elapsed_time": "1:30:23", "remaining_time": "6:40:06"} | |
| {"current_steps": 150, "total_steps": 814, "loss": 0.0358, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.185276799879212e-06, "epoch": 0.37, "percentage": 18.43, "elapsed_time": "1:30:21", "remaining_time": "6:39:57"} | |
| {"current_steps": 160, "total_steps": 814, "loss": 0.0365, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.076607556986699e-06, "epoch": 0.39, "percentage": 19.66, "elapsed_time": "1:36:24", "remaining_time": "6:34:06"} | |
| {"current_steps": 160, "total_steps": 814, "loss": 0.0365, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.076607556986699e-06, "epoch": 0.39, "percentage": 19.66, "elapsed_time": "1:36:23", "remaining_time": "6:33:58"} | |
| {"current_steps": 170, "total_steps": 814, "loss": 0.0378, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.961866815035e-06, "epoch": 0.42, "percentage": 20.88, "elapsed_time": "1:42:27", "remaining_time": "6:28:08"} | |
| {"current_steps": 170, "total_steps": 814, "loss": 0.0378, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.961866815035e-06, "epoch": 0.42, "percentage": 20.88, "elapsed_time": "1:42:27", "remaining_time": "6:28:10"} | |
| {"current_steps": 170, "total_steps": 814, "loss": 0.0378, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.961866815035e-06, "epoch": 0.42, "percentage": 20.88, "elapsed_time": "1:42:25", "remaining_time": "6:28:01"} | |
| {"current_steps": 180, "total_steps": 814, "loss": 0.0367, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.841225463249305e-06, "epoch": 0.44, "percentage": 22.11, "elapsed_time": "1:48:31", "remaining_time": "6:22:15"} | |
| {"current_steps": 180, "total_steps": 814, "loss": 0.0367, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.841225463249305e-06, "epoch": 0.44, "percentage": 22.11, "elapsed_time": "1:48:29", "remaining_time": "6:22:07"} | |
| {"current_steps": 190, "total_steps": 814, "loss": 0.0359, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.714863178933258e-06, "epoch": 0.47, "percentage": 23.34, "elapsed_time": "1:54:34", "remaining_time": "6:16:15"} | |
| {"current_steps": 190, "total_steps": 814, "loss": 0.0359, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.714863178933258e-06, "epoch": 0.47, "percentage": 23.34, "elapsed_time": "1:54:31", "remaining_time": "6:16:08"} | |
| {"current_steps": 200, "total_steps": 814, "loss": 0.0346, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.582968159866416e-06, "epoch": 0.49, "percentage": 24.57, "elapsed_time": "2:00:36", "remaining_time": "6:10:16"} | |
| {"current_steps": 200, "total_steps": 814, "loss": 0.0346, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.582968159866416e-06, "epoch": 0.49, "percentage": 24.57, "elapsed_time": "2:00:34", "remaining_time": "6:10:10"} | |
| {"current_steps": 210, "total_steps": 814, "loss": 0.0361, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.445736844011712e-06, "epoch": 0.52, "percentage": 25.8, "elapsed_time": "2:12:23", "remaining_time": "6:20:45"} | |
| {"current_steps": 210, "total_steps": 814, "loss": 0.0361, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.445736844011712e-06, "epoch": 0.52, "percentage": 25.8, "elapsed_time": "2:12:21", "remaining_time": "6:20:40"} | |
| {"current_steps": 220, "total_steps": 814, "loss": 0.0352, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.303373616950408e-06, "epoch": 0.54, "percentage": 27.03, "elapsed_time": "2:18:25", "remaining_time": "6:13:45"} | |
| {"current_steps": 220, "total_steps": 814, "loss": 0.0352, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.303373616950408e-06, "epoch": 0.54, "percentage": 27.03, "elapsed_time": "2:18:23", "remaining_time": "6:13:39"} | |
| {"current_steps": 230, "total_steps": 814, "loss": 0.0351, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.156090507480242e-06, "epoch": 0.56, "percentage": 28.26, "elapsed_time": "2:24:28", "remaining_time": "6:06:51"} | |
| {"current_steps": 230, "total_steps": 814, "loss": 0.0351, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.156090507480242e-06, "epoch": 0.56, "percentage": 28.26, "elapsed_time": "2:24:26", "remaining_time": "6:06:46"} | |
| {"current_steps": 240, "total_steps": 814, "loss": 0.0345, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.004106871830155e-06, "epoch": 0.59, "percentage": 29.48, "elapsed_time": "2:30:32", "remaining_time": "6:00:01"} | |
| {"current_steps": 240, "total_steps": 814, "loss": 0.0345, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.004106871830155e-06, "epoch": 0.59, "percentage": 29.48, "elapsed_time": "2:30:29", "remaining_time": "5:59:56"} | |
| {"current_steps": 250, "total_steps": 814, "loss": 0.0364, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.847649066961905e-06, "epoch": 0.61, "percentage": 30.71, "elapsed_time": "2:36:36", "remaining_time": "5:53:19"} | |
| {"current_steps": 250, "total_steps": 814, "loss": 0.0364, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.847649066961905e-06, "epoch": 0.61, "percentage": 30.71, "elapsed_time": "2:36:34", "remaining_time": "5:53:15"} | |
| {"current_steps": 260, "total_steps": 814, "loss": 0.0313, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.68695011344511e-06, "epoch": 0.64, "percentage": 31.94, "elapsed_time": "2:42:40", "remaining_time": "5:46:38"} | |
| {"current_steps": 260, "total_steps": 814, "loss": 0.0313, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.68695011344511e-06, "epoch": 0.64, "percentage": 31.94, "elapsed_time": "2:42:38", "remaining_time": "5:46:34"} | |
| {"current_steps": 270, "total_steps": 814, "loss": 0.0322, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.52224934840788e-06, "epoch": 0.66, "percentage": 33.17, "elapsed_time": "2:48:43", "remaining_time": "5:39:57"} | |
| {"current_steps": 270, "total_steps": 814, "loss": 0.0322, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.52224934840788e-06, "epoch": 0.66, "percentage": 33.17, "elapsed_time": "2:48:41", "remaining_time": "5:39:53"} | |
| {"current_steps": 280, "total_steps": 814, "loss": 0.0348, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.353792069079826e-06, "epoch": 0.69, "percentage": 34.4, "elapsed_time": "2:54:48", "remaining_time": "5:33:22"} | |
| {"current_steps": 280, "total_steps": 814, "loss": 0.0348, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.353792069079826e-06, "epoch": 0.69, "percentage": 34.4, "elapsed_time": "2:54:45", "remaining_time": "5:33:17"} | |
| {"current_steps": 290, "total_steps": 814, "loss": 0.0374, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.181829167458441e-06, "epoch": 0.71, "percentage": 35.63, "elapsed_time": "3:00:51", "remaining_time": "5:26:47"} | |
| {"current_steps": 290, "total_steps": 814, "loss": 0.0374, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.181829167458441e-06, "epoch": 0.71, "percentage": 35.63, "elapsed_time": "3:00:49", "remaining_time": "5:26:43"} | |
| {"current_steps": 300, "total_steps": 814, "loss": 0.0348, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.006616756642867e-06, "epoch": 0.74, "percentage": 36.86, "elapsed_time": "3:06:55", "remaining_time": "5:20:15"} | |
| {"current_steps": 300, "total_steps": 814, "loss": 0.0348, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.006616756642867e-06, "epoch": 0.74, "percentage": 36.86, "elapsed_time": "3:06:52", "remaining_time": "5:20:11"} | |
| {"current_steps": 310, "total_steps": 814, "loss": 0.0318, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.828415789391632e-06, "epoch": 0.76, "percentage": 38.08, "elapsed_time": "3:12:58", "remaining_time": "5:13:43"} | |
| {"current_steps": 310, "total_steps": 814, "loss": 0.0318, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.828415789391632e-06, "epoch": 0.76, "percentage": 38.08, "elapsed_time": "3:12:55", "remaining_time": "5:13:40"} | |
| {"current_steps": 320, "total_steps": 814, "loss": 0.0345, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.647491669472421e-06, "epoch": 0.79, "percentage": 39.31, "elapsed_time": "3:19:02", "remaining_time": "5:07:16"} | |
| {"current_steps": 320, "total_steps": 814, "loss": 0.0345, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.647491669472421e-06, "epoch": 0.79, "percentage": 39.31, "elapsed_time": "3:19:00", "remaining_time": "5:07:13"} | |
| {"current_steps": 330, "total_steps": 814, "loss": 0.034, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.464113856382752e-06, "epoch": 0.81, "percentage": 40.54, "elapsed_time": "3:25:07", "remaining_time": "5:00:50"} | |
| {"current_steps": 330, "total_steps": 814, "loss": 0.034, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.464113856382752e-06, "epoch": 0.81, "percentage": 40.54, "elapsed_time": "3:25:05", "remaining_time": "5:00:47"} | |
| {"current_steps": 340, "total_steps": 814, "loss": 0.0305, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.278555464030228e-06, "epoch": 0.83, "percentage": 41.77, "elapsed_time": "3:31:11", "remaining_time": "4:54:25"} | |
| {"current_steps": 340, "total_steps": 814, "loss": 0.0305, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.278555464030228e-06, "epoch": 0.83, "percentage": 41.77, "elapsed_time": "3:31:09", "remaining_time": "4:54:22"} | |
| {"current_steps": 350, "total_steps": 814, "loss": 0.0337, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.091092853970098e-06, "epoch": 0.86, "percentage": 43.0, "elapsed_time": "3:37:16", "remaining_time": "4:48:02"} | |
| {"current_steps": 350, "total_steps": 814, "loss": 0.0337, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.091092853970098e-06, "epoch": 0.86, "percentage": 43.0, "elapsed_time": "3:37:13", "remaining_time": "4:47:58"} | |
| {"current_steps": 360, "total_steps": 814, "loss": 0.0326, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.902005223805931e-06, "epoch": 0.88, "percentage": 44.23, "elapsed_time": "3:43:18", "remaining_time": "4:41:37"} | |
| {"current_steps": 360, "total_steps": 814, "loss": 0.0326, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.902005223805931e-06, "epoch": 0.88, "percentage": 44.23, "elapsed_time": "3:43:16", "remaining_time": "4:41:34"} | |
| {"current_steps": 370, "total_steps": 814, "loss": 0.0344, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.711574191366427e-06, "epoch": 0.91, "percentage": 45.45, "elapsed_time": "3:49:20", "remaining_time": "4:35:12"} | |
| {"current_steps": 370, "total_steps": 814, "loss": 0.0344, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.711574191366427e-06, "epoch": 0.91, "percentage": 45.45, "elapsed_time": "3:49:18", "remaining_time": "4:35:10"} | |
| {"current_steps": 380, "total_steps": 814, "loss": 0.032, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.520083375277644e-06, "epoch": 0.93, "percentage": 46.68, "elapsed_time": "3:55:23", "remaining_time": "4:28:50"} | |
| {"current_steps": 380, "total_steps": 814, "loss": 0.032, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.520083375277644e-06, "epoch": 0.93, "percentage": 46.68, "elapsed_time": "3:55:21", "remaining_time": "4:28:48"} | |
| {"current_steps": 390, "total_steps": 814, "loss": 0.0329, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.3278179725553525e-06, "epoch": 0.96, "percentage": 47.91, "elapsed_time": "4:01:24", "remaining_time": "4:22:27"} | |
| {"current_steps": 390, "total_steps": 814, "loss": 0.0329, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.3278179725553525e-06, "epoch": 0.96, "percentage": 47.91, "elapsed_time": "4:01:22", "remaining_time": "4:22:25"} | |
| {"current_steps": 400, "total_steps": 814, "loss": 0.0337, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.135064333846612e-06, "epoch": 0.98, "percentage": 49.14, "elapsed_time": "4:07:27", "remaining_time": "4:16:07"} | |
| {"current_steps": 400, "total_steps": 814, "loss": 0.0337, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.135064333846612e-06, "epoch": 0.98, "percentage": 49.14, "elapsed_time": "4:07:25", "remaining_time": "4:16:05"} | |
| {"current_steps": 410, "total_steps": 814, "loss": 0.033, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.942109536953177e-06, "epoch": 1.01, "percentage": 50.37, "elapsed_time": "4:25:04", "remaining_time": "4:21:11"} | |
| {"current_steps": 410, "total_steps": 814, "loss": 0.033, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.942109536953177e-06, "epoch": 1.01, "percentage": 50.37, "elapsed_time": "4:25:04", "remaining_time": "4:21:11"} | |
| {"current_steps": 410, "total_steps": 814, "loss": 0.033, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.942109536953177e-06, "epoch": 1.01, "percentage": 50.37, "elapsed_time": "4:25:02", "remaining_time": "4:21:09"} | |
| {"current_steps": 420, "total_steps": 814, "loss": 0.0298, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.749240959271918e-06, "epoch": 1.03, "percentage": 51.6, "elapsed_time": "4:31:09", "remaining_time": "4:14:22"} | |
| {"current_steps": 420, "total_steps": 814, "loss": 0.0298, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.749240959271918e-06, "epoch": 1.03, "percentage": 51.6, "elapsed_time": "4:31:07", "remaining_time": "4:14:20"} | |
| {"current_steps": 430, "total_steps": 814, "loss": 0.0338, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.556745849789055e-06, "epoch": 1.06, "percentage": 52.83, "elapsed_time": "4:37:13", "remaining_time": "4:07:33"} | |
| {"current_steps": 430, "total_steps": 814, "loss": 0.0338, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.556745849789055e-06, "epoch": 1.06, "percentage": 52.83, "elapsed_time": "4:37:11", "remaining_time": "4:07:32"} | |
| {"current_steps": 440, "total_steps": 814, "loss": 0.0332, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.364910901265607e-06, "epoch": 1.08, "percentage": 54.05, "elapsed_time": "4:43:14", "remaining_time": "4:00:44"} | |
| {"current_steps": 440, "total_steps": 814, "loss": 0.0332, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.364910901265607e-06, "epoch": 1.08, "percentage": 54.05, "elapsed_time": "4:43:12", "remaining_time": "4:00:43"} | |
| {"current_steps": 450, "total_steps": 814, "loss": 0.0328, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.174021823251294e-06, "epoch": 1.1, "percentage": 55.28, "elapsed_time": "4:49:18", "remaining_time": "3:54:01"} | |
| {"current_steps": 450, "total_steps": 814, "loss": 0.0328, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.174021823251294e-06, "epoch": 1.1, "percentage": 55.28, "elapsed_time": "4:49:16", "remaining_time": "3:53:59"} | |
| {"current_steps": 460, "total_steps": 814, "loss": 0.0329, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.984362916562753e-06, "epoch": 1.13, "percentage": 56.51, "elapsed_time": "4:55:22", "remaining_time": "3:47:18"} | |
| {"current_steps": 460, "total_steps": 814, "loss": 0.0329, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.984362916562753e-06, "epoch": 1.13, "percentage": 56.51, "elapsed_time": "4:55:20", "remaining_time": "3:47:17"} | |
| {"current_steps": 470, "total_steps": 814, "loss": 0.0315, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.7962166498598785e-06, "epoch": 1.15, "percentage": 57.74, "elapsed_time": "5:01:24", "remaining_time": "3:40:36"} | |
| {"current_steps": 470, "total_steps": 814, "loss": 0.0315, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.7962166498598785e-06, "epoch": 1.15, "percentage": 57.74, "elapsed_time": "5:01:22", "remaining_time": "3:40:35"} | |
| {"current_steps": 480, "total_steps": 814, "loss": 0.0299, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.6098632389508637e-06, "epoch": 1.18, "percentage": 58.97, "elapsed_time": "5:07:27", "remaining_time": "3:33:56"} | |
| {"current_steps": 480, "total_steps": 814, "loss": 0.0299, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.6098632389508637e-06, "epoch": 1.18, "percentage": 58.97, "elapsed_time": "5:07:25", "remaining_time": "3:33:54"} | |
| {"current_steps": 490, "total_steps": 814, "loss": 0.0319, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.4255802294525464e-06, "epoch": 1.2, "percentage": 60.2, "elapsed_time": "5:13:29", "remaining_time": "3:27:17"} | |
| {"current_steps": 490, "total_steps": 814, "loss": 0.0319, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.4255802294525464e-06, "epoch": 1.2, "percentage": 60.2, "elapsed_time": "5:13:27", "remaining_time": "3:27:15"} | |
| {"current_steps": 500, "total_steps": 814, "loss": 0.0319, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.2436420834276013e-06, "epoch": 1.23, "percentage": 61.43, "elapsed_time": "5:19:33", "remaining_time": "3:20:40"} | |
| {"current_steps": 500, "total_steps": 814, "loss": 0.0319, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.2436420834276013e-06, "epoch": 1.23, "percentage": 61.43, "elapsed_time": "5:19:31", "remaining_time": "3:20:39"} | |
| {"current_steps": 510, "total_steps": 814, "loss": 0.0333, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.0643197706142136e-06, "epoch": 1.25, "percentage": 62.65, "elapsed_time": "5:25:35", "remaining_time": "3:14:04"} | |
| {"current_steps": 510, "total_steps": 814, "loss": 0.0333, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.0643197706142136e-06, "epoch": 1.25, "percentage": 62.65, "elapsed_time": "5:25:33", "remaining_time": "3:14:03"} | |
| {"current_steps": 520, "total_steps": 814, "loss": 0.0306, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.8878803648570773e-06, "epoch": 1.28, "percentage": 63.88, "elapsed_time": "5:31:40", "remaining_time": "3:07:31"} | |
| {"current_steps": 520, "total_steps": 814, "loss": 0.0306, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.8878803648570773e-06, "epoch": 1.28, "percentage": 63.88, "elapsed_time": "5:31:37", "remaining_time": "3:07:29"} | |
| {"current_steps": 530, "total_steps": 814, "loss": 0.0309, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.7145866463407163e-06, "epoch": 1.3, "percentage": 65.11, "elapsed_time": "5:37:42", "remaining_time": "3:00:57"} | |
| {"current_steps": 530, "total_steps": 814, "loss": 0.0309, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.7145866463407163e-06, "epoch": 1.3, "percentage": 65.11, "elapsed_time": "5:37:40", "remaining_time": "3:00:56"} | |
| {"current_steps": 540, "total_steps": 814, "loss": 0.0325, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.544696710217588e-06, "epoch": 1.32, "percentage": 66.34, "elapsed_time": "5:43:47", "remaining_time": "2:54:26"} | |
| {"current_steps": 540, "total_steps": 814, "loss": 0.0325, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.544696710217588e-06, "epoch": 1.32, "percentage": 66.34, "elapsed_time": "5:43:45", "remaining_time": "2:54:25"} | |
| {"current_steps": 550, "total_steps": 814, "loss": 0.032, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.3784635822138424e-06, "epoch": 1.35, "percentage": 67.57, "elapsed_time": "5:49:49", "remaining_time": "2:47:55"} | |
| {"current_steps": 550, "total_steps": 814, "loss": 0.032, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.3784635822138424e-06, "epoch": 1.35, "percentage": 67.57, "elapsed_time": "5:49:47", "remaining_time": "2:47:54"} | |
| {"current_steps": 560, "total_steps": 814, "loss": 0.034, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.2161348417852346e-06, "epoch": 1.37, "percentage": 68.8, "elapsed_time": "5:55:51", "remaining_time": "2:41:24"} | |
| {"current_steps": 560, "total_steps": 814, "loss": 0.034, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.2161348417852346e-06, "epoch": 1.37, "percentage": 68.8, "elapsed_time": "5:55:49", "remaining_time": "2:41:23"} | |
| {"current_steps": 570, "total_steps": 814, "loss": 0.0322, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.05795225338444e-06, "epoch": 1.4, "percentage": 70.02, "elapsed_time": "6:01:54", "remaining_time": "2:34:55"} | |
| {"current_steps": 570, "total_steps": 814, "loss": 0.0322, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.05795225338444e-06, "epoch": 1.4, "percentage": 70.02, "elapsed_time": "6:01:52", "remaining_time": "2:34:54"} | |
| {"current_steps": 580, "total_steps": 814, "loss": 0.0328, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.9041514063889571e-06, "epoch": 1.42, "percentage": 71.25, "elapsed_time": "6:07:56", "remaining_time": "2:28:26"} | |
| {"current_steps": 580, "total_steps": 814, "loss": 0.0328, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.9041514063889571e-06, "epoch": 1.42, "percentage": 71.25, "elapsed_time": "6:07:54", "remaining_time": "2:28:25"} | |
| {"current_steps": 590, "total_steps": 814, "loss": 0.0336, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.7549613642258573e-06, "epoch": 1.45, "percentage": 72.48, "elapsed_time": "6:13:59", "remaining_time": "2:21:59"} | |
| {"current_steps": 590, "total_steps": 814, "loss": 0.0336, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.7549613642258573e-06, "epoch": 1.45, "percentage": 72.48, "elapsed_time": "6:13:57", "remaining_time": "2:21:58"} | |
| {"current_steps": 600, "total_steps": 814, "loss": 0.0339, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.6106043232159745e-06, "epoch": 1.47, "percentage": 73.71, "elapsed_time": "6:20:05", "remaining_time": "2:15:33"} | |
| {"current_steps": 600, "total_steps": 814, "loss": 0.0339, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.6106043232159745e-06, "epoch": 1.47, "percentage": 73.71, "elapsed_time": "6:20:03", "remaining_time": "2:15:33"} | |
| {"current_steps": 610, "total_steps": 814, "loss": 0.0325, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.4712952816456095e-06, "epoch": 1.5, "percentage": 74.94, "elapsed_time": "6:31:43", "remaining_time": "2:11:00"} | |
| {"current_steps": 610, "total_steps": 814, "loss": 0.0325, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.4712952816456095e-06, "epoch": 1.5, "percentage": 74.94, "elapsed_time": "6:31:41", "remaining_time": "2:10:59"} | |
| {"current_steps": 620, "total_steps": 814, "loss": 0.0327, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.337241719558648e-06, "epoch": 1.52, "percentage": 76.17, "elapsed_time": "6:37:47", "remaining_time": "2:04:28"} | |
| {"current_steps": 620, "total_steps": 814, "loss": 0.0327, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.337241719558648e-06, "epoch": 1.52, "percentage": 76.17, "elapsed_time": "6:37:45", "remaining_time": "2:04:27"} | |
| {"current_steps": 630, "total_steps": 814, "loss": 0.0304, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.2086432897459738e-06, "epoch": 1.55, "percentage": 77.4, "elapsed_time": "6:43:51", "remaining_time": "1:57:56"} | |
| {"current_steps": 630, "total_steps": 814, "loss": 0.0304, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.2086432897459738e-06, "epoch": 1.55, "percentage": 77.4, "elapsed_time": "6:43:49", "remaining_time": "1:57:56"} | |
| {"current_steps": 640, "total_steps": 814, "loss": 0.0329, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.0856915203924096e-06, "epoch": 1.57, "percentage": 78.62, "elapsed_time": "6:49:53", "remaining_time": "1:51:26"} | |
| {"current_steps": 640, "total_steps": 814, "loss": 0.0329, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.0856915203924096e-06, "epoch": 1.57, "percentage": 78.62, "elapsed_time": "6:49:51", "remaining_time": "1:51:25"} | |
| {"current_steps": 650, "total_steps": 814, "loss": 0.0322, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.685695298240432e-07, "epoch": 1.59, "percentage": 79.85, "elapsed_time": "6:55:57", "remaining_time": "1:44:56"} | |
| {"current_steps": 650, "total_steps": 814, "loss": 0.0322, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 9.685695298240432e-07, "epoch": 1.59, "percentage": 79.85, "elapsed_time": "6:55:55", "remaining_time": "1:44:56"} | |
| {"current_steps": 660, "total_steps": 814, "loss": 0.0343, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.574517537807897e-07, "epoch": 1.62, "percentage": 81.08, "elapsed_time": "7:02:01", "remaining_time": "1:38:28"} | |
| {"current_steps": 660, "total_steps": 814, "loss": 0.0343, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.574517537807897e-07, "epoch": 1.62, "percentage": 81.08, "elapsed_time": "7:01:59", "remaining_time": "1:38:27"} | |
| {"current_steps": 670, "total_steps": 814, "loss": 0.0328, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.525036856203677e-07, "epoch": 1.64, "percentage": 82.31, "elapsed_time": "7:08:05", "remaining_time": "1:32:00"} | |
| {"current_steps": 670, "total_steps": 814, "loss": 0.0328, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.525036856203677e-07, "epoch": 1.64, "percentage": 82.31, "elapsed_time": "7:08:03", "remaining_time": "1:32:00"} | |
| {"current_steps": 680, "total_steps": 814, "loss": 0.0334, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.538816298406203e-07, "epoch": 1.67, "percentage": 83.54, "elapsed_time": "7:14:10", "remaining_time": "1:25:33"} | |
| {"current_steps": 680, "total_steps": 814, "loss": 0.0334, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.538816298406203e-07, "epoch": 1.67, "percentage": 83.54, "elapsed_time": "7:14:08", "remaining_time": "1:25:33"} | |
| {"current_steps": 690, "total_steps": 814, "loss": 0.0334, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.617324692872744e-07, "epoch": 1.69, "percentage": 84.77, "elapsed_time": "7:20:12", "remaining_time": "1:19:06"} | |
| {"current_steps": 690, "total_steps": 814, "loss": 0.0334, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.617324692872744e-07, "epoch": 1.69, "percentage": 84.77, "elapsed_time": "7:20:10", "remaining_time": "1:19:06"} | |
| {"current_steps": 700, "total_steps": 814, "loss": 0.0337, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.7619344639384447e-07, "epoch": 1.72, "percentage": 86.0, "elapsed_time": "7:26:15", "remaining_time": "1:12:40"} | |
| {"current_steps": 700, "total_steps": 814, "loss": 0.0337, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.7619344639384447e-07, "epoch": 1.72, "percentage": 86.0, "elapsed_time": "7:26:13", "remaining_time": "1:12:40"} | |
| {"current_steps": 710, "total_steps": 814, "loss": 0.0306, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.9739195877949223e-07, "epoch": 1.74, "percentage": 87.22, "elapsed_time": "7:32:19", "remaining_time": "1:06:15"} | |
| {"current_steps": 710, "total_steps": 814, "loss": 0.0306, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.9739195877949223e-07, "epoch": 1.74, "percentage": 87.22, "elapsed_time": "7:32:17", "remaining_time": "1:06:15"} | |
| {"current_steps": 720, "total_steps": 814, "loss": 0.032, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.254453695092752e-07, "epoch": 1.77, "percentage": 88.45, "elapsed_time": "7:38:21", "remaining_time": "0:59:50"} | |
| {"current_steps": 720, "total_steps": 814, "loss": 0.032, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 3.254453695092752e-07, "epoch": 1.77, "percentage": 88.45, "elapsed_time": "7:38:19", "remaining_time": "0:59:50"} | |
| {"current_steps": 730, "total_steps": 814, "loss": 0.0325, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.604608322993518e-07, "epoch": 1.79, "percentage": 89.68, "elapsed_time": "7:44:23", "remaining_time": "0:53:26"} | |
| {"current_steps": 730, "total_steps": 814, "loss": 0.0325, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.604608322993518e-07, "epoch": 1.79, "percentage": 89.68, "elapsed_time": "7:44:21", "remaining_time": "0:53:25"} | |
| {"current_steps": 740, "total_steps": 814, "loss": 0.0351, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.0253513192751374e-07, "epoch": 1.82, "percentage": 90.91, "elapsed_time": "7:50:26", "remaining_time": "0:47:02"} | |
| {"current_steps": 740, "total_steps": 814, "loss": 0.0351, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.0253513192751374e-07, "epoch": 1.82, "percentage": 90.91, "elapsed_time": "7:50:24", "remaining_time": "0:47:02"} | |
| {"current_steps": 750, "total_steps": 814, "loss": 0.0309, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.5175454008667712e-07, "epoch": 1.84, "percentage": 92.14, "elapsed_time": "7:56:28", "remaining_time": "0:40:39"} | |
| {"current_steps": 750, "total_steps": 814, "loss": 0.0309, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.5175454008667712e-07, "epoch": 1.84, "percentage": 92.14, "elapsed_time": "7:56:26", "remaining_time": "0:40:39"} | |
| {"current_steps": 760, "total_steps": 814, "loss": 0.0305, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.0819468689607426e-07, "epoch": 1.86, "percentage": 93.37, "elapsed_time": "8:02:32", "remaining_time": "0:34:17"} | |
| {"current_steps": 760, "total_steps": 814, "loss": 0.0305, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.0819468689607426e-07, "epoch": 1.86, "percentage": 93.37, "elapsed_time": "8:02:30", "remaining_time": "0:34:17"} | |
| {"current_steps": 770, "total_steps": 814, "loss": 0.0284, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.192044826145772e-08, "epoch": 1.89, "percentage": 94.59, "elapsed_time": "8:08:33", "remaining_time": "0:27:55"} | |
| {"current_steps": 770, "total_steps": 814, "loss": 0.0284, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.192044826145772e-08, "epoch": 1.89, "percentage": 94.59, "elapsed_time": "8:08:31", "remaining_time": "0:27:54"} | |
| {"current_steps": 780, "total_steps": 814, "loss": 0.0305, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.298584925212068e-08, "epoch": 1.91, "percentage": 95.82, "elapsed_time": "8:14:38", "remaining_time": "0:21:33"} | |
| {"current_steps": 780, "total_steps": 814, "loss": 0.0305, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.298584925212068e-08, "epoch": 1.91, "percentage": 95.82, "elapsed_time": "8:14:35", "remaining_time": "0:21:33"} | |
| {"current_steps": 790, "total_steps": 814, "loss": 0.0303, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.143398363860738e-08, "epoch": 1.94, "percentage": 97.05, "elapsed_time": "8:20:41", "remaining_time": "0:15:12"} | |
| {"current_steps": 790, "total_steps": 814, "loss": 0.0303, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.143398363860738e-08, "epoch": 1.94, "percentage": 97.05, "elapsed_time": "8:20:39", "remaining_time": "0:15:12"} | |
| {"current_steps": 800, "total_steps": 814, "loss": 0.0313, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.2969497109715016e-09, "epoch": 1.96, "percentage": 98.28, "elapsed_time": "8:26:43", "remaining_time": "0:08:52"} | |
| {"current_steps": 800, "total_steps": 814, "loss": 0.0313, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.2969497109715016e-09, "epoch": 1.96, "percentage": 98.28, "elapsed_time": "8:26:41", "remaining_time": "0:08:52"} | |
| {"current_steps": 810, "total_steps": 814, "loss": 0.0331, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.958024731567147e-10, "epoch": 1.99, "percentage": 99.51, "elapsed_time": "8:38:26", "remaining_time": "0:02:33"} | |
| {"current_steps": 810, "total_steps": 814, "loss": 0.0331, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.958024731567147e-10, "epoch": 1.99, "percentage": 99.51, "elapsed_time": "8:38:24", "remaining_time": "0:02:33"} | |
| {"current_steps": 814, "total_steps": 814, "loss": null, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "8:41:01", "remaining_time": "0:00:00"} | |
| {"current_steps": 814, "total_steps": 814, "loss": null, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "8:40:59", "remaining_time": "0:00:00"} | |
| {"current_steps": 66, "total_steps": 66, "loss": null, "eval_loss": 0.03739195317029953, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "8:47:50", "remaining_time": "0:00:00"} | |
| {"current_steps": 66, "total_steps": 66, "loss": null, "eval_loss": 0.03739195317029953, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "8:47:49", "remaining_time": "0:00:00"} | |