File size: 15,178 Bytes
40767ff
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6dbbdff
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3ac2d76
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
e384e5a
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
{"current_steps": 10, "total_steps": 822, "loss": 1.0419, "lr": 5e-06, "epoch": 0.0364963503649635, "percentage": 1.22, "elapsed_time": "0:05:27", "remaining_time": "7:23:12"}
{"current_steps": 20, "total_steps": 822, "loss": 0.9117, "lr": 5e-06, "epoch": 0.072992700729927, "percentage": 2.43, "elapsed_time": "0:10:49", "remaining_time": "7:14:13"}
{"current_steps": 30, "total_steps": 822, "loss": 0.8752, "lr": 5e-06, "epoch": 0.10948905109489052, "percentage": 3.65, "elapsed_time": "0:16:13", "remaining_time": "7:08:15"}
{"current_steps": 40, "total_steps": 822, "loss": 0.8479, "lr": 5e-06, "epoch": 0.145985401459854, "percentage": 4.87, "elapsed_time": "0:21:37", "remaining_time": "7:02:43"}
{"current_steps": 50, "total_steps": 822, "loss": 0.8276, "lr": 5e-06, "epoch": 0.18248175182481752, "percentage": 6.08, "elapsed_time": "0:27:01", "remaining_time": "6:57:09"}
{"current_steps": 60, "total_steps": 822, "loss": 0.8144, "lr": 5e-06, "epoch": 0.21897810218978103, "percentage": 7.3, "elapsed_time": "0:32:25", "remaining_time": "6:51:43"}
{"current_steps": 70, "total_steps": 822, "loss": 0.8029, "lr": 5e-06, "epoch": 0.25547445255474455, "percentage": 8.52, "elapsed_time": "0:37:47", "remaining_time": "6:45:56"}
{"current_steps": 80, "total_steps": 822, "loss": 0.7984, "lr": 5e-06, "epoch": 0.291970802919708, "percentage": 9.73, "elapsed_time": "0:43:07", "remaining_time": "6:40:03"}
{"current_steps": 90, "total_steps": 822, "loss": 0.7845, "lr": 5e-06, "epoch": 0.3284671532846715, "percentage": 10.95, "elapsed_time": "0:48:30", "remaining_time": "6:34:30"}
{"current_steps": 100, "total_steps": 822, "loss": 0.784, "lr": 5e-06, "epoch": 0.36496350364963503, "percentage": 12.17, "elapsed_time": "0:53:53", "remaining_time": "6:29:07"}
{"current_steps": 110, "total_steps": 822, "loss": 0.7786, "lr": 5e-06, "epoch": 0.40145985401459855, "percentage": 13.38, "elapsed_time": "0:59:16", "remaining_time": "6:23:41"}
{"current_steps": 120, "total_steps": 822, "loss": 0.7741, "lr": 5e-06, "epoch": 0.43795620437956206, "percentage": 14.6, "elapsed_time": "1:04:38", "remaining_time": "6:18:11"}
{"current_steps": 130, "total_steps": 822, "loss": 0.7706, "lr": 5e-06, "epoch": 0.4744525547445255, "percentage": 15.82, "elapsed_time": "1:10:00", "remaining_time": "6:12:38"}
{"current_steps": 140, "total_steps": 822, "loss": 0.7693, "lr": 5e-06, "epoch": 0.5109489051094891, "percentage": 17.03, "elapsed_time": "1:15:20", "remaining_time": "6:07:03"}
{"current_steps": 150, "total_steps": 822, "loss": 0.7698, "lr": 5e-06, "epoch": 0.5474452554744526, "percentage": 18.25, "elapsed_time": "1:20:41", "remaining_time": "6:01:30"}
{"current_steps": 160, "total_steps": 822, "loss": 0.7595, "lr": 5e-06, "epoch": 0.583941605839416, "percentage": 19.46, "elapsed_time": "1:26:02", "remaining_time": "5:56:00"}
{"current_steps": 170, "total_steps": 822, "loss": 0.7614, "lr": 5e-06, "epoch": 0.6204379562043796, "percentage": 20.68, "elapsed_time": "1:31:26", "remaining_time": "5:50:41"}
{"current_steps": 180, "total_steps": 822, "loss": 0.7541, "lr": 5e-06, "epoch": 0.656934306569343, "percentage": 21.9, "elapsed_time": "1:36:46", "remaining_time": "5:45:10"}
{"current_steps": 190, "total_steps": 822, "loss": 0.7573, "lr": 5e-06, "epoch": 0.6934306569343066, "percentage": 23.11, "elapsed_time": "1:42:07", "remaining_time": "5:39:43"}
{"current_steps": 200, "total_steps": 822, "loss": 0.7582, "lr": 5e-06, "epoch": 0.7299270072992701, "percentage": 24.33, "elapsed_time": "1:47:31", "remaining_time": "5:34:23"}
{"current_steps": 210, "total_steps": 822, "loss": 0.7582, "lr": 5e-06, "epoch": 0.7664233576642335, "percentage": 25.55, "elapsed_time": "1:52:55", "remaining_time": "5:29:06"}
{"current_steps": 220, "total_steps": 822, "loss": 0.7519, "lr": 5e-06, "epoch": 0.8029197080291971, "percentage": 26.76, "elapsed_time": "1:58:17", "remaining_time": "5:23:41"}
{"current_steps": 230, "total_steps": 822, "loss": 0.7551, "lr": 5e-06, "epoch": 0.8394160583941606, "percentage": 27.98, "elapsed_time": "2:03:39", "remaining_time": "5:18:16"}
{"current_steps": 240, "total_steps": 822, "loss": 0.7519, "lr": 5e-06, "epoch": 0.8759124087591241, "percentage": 29.2, "elapsed_time": "2:09:02", "remaining_time": "5:12:54"}
{"current_steps": 250, "total_steps": 822, "loss": 0.7471, "lr": 5e-06, "epoch": 0.9124087591240876, "percentage": 30.41, "elapsed_time": "2:14:25", "remaining_time": "5:07:34"}
{"current_steps": 260, "total_steps": 822, "loss": 0.7471, "lr": 5e-06, "epoch": 0.948905109489051, "percentage": 31.63, "elapsed_time": "2:19:49", "remaining_time": "5:02:13"}
{"current_steps": 270, "total_steps": 822, "loss": 0.7448, "lr": 5e-06, "epoch": 0.9854014598540146, "percentage": 32.85, "elapsed_time": "2:25:11", "remaining_time": "4:56:49"}
{"current_steps": 274, "total_steps": 822, "eval_loss": 0.7464940547943115, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "2:30:33", "remaining_time": "5:01:06"}
{"current_steps": 280, "total_steps": 822, "loss": 0.7201, "lr": 5e-06, "epoch": 1.0218978102189782, "percentage": 34.06, "elapsed_time": "2:34:56", "remaining_time": "4:59:54"}
{"current_steps": 290, "total_steps": 822, "loss": 0.6987, "lr": 5e-06, "epoch": 1.0583941605839415, "percentage": 35.28, "elapsed_time": "2:40:18", "remaining_time": "4:54:04"}
{"current_steps": 300, "total_steps": 822, "loss": 0.695, "lr": 5e-06, "epoch": 1.094890510948905, "percentage": 36.5, "elapsed_time": "2:45:39", "remaining_time": "4:48:14"}
{"current_steps": 310, "total_steps": 822, "loss": 0.6922, "lr": 5e-06, "epoch": 1.1313868613138687, "percentage": 37.71, "elapsed_time": "2:51:01", "remaining_time": "4:42:28"}
{"current_steps": 320, "total_steps": 822, "loss": 0.7005, "lr": 5e-06, "epoch": 1.167883211678832, "percentage": 38.93, "elapsed_time": "2:56:23", "remaining_time": "4:36:43"}
{"current_steps": 330, "total_steps": 822, "loss": 0.696, "lr": 5e-06, "epoch": 1.2043795620437956, "percentage": 40.15, "elapsed_time": "3:01:46", "remaining_time": "4:31:00"}
{"current_steps": 340, "total_steps": 822, "loss": 0.6961, "lr": 5e-06, "epoch": 1.2408759124087592, "percentage": 41.36, "elapsed_time": "3:07:10", "remaining_time": "4:25:20"}
{"current_steps": 350, "total_steps": 822, "loss": 0.6955, "lr": 5e-06, "epoch": 1.2773722627737225, "percentage": 42.58, "elapsed_time": "3:12:32", "remaining_time": "4:19:38"}
{"current_steps": 360, "total_steps": 822, "loss": 0.6967, "lr": 5e-06, "epoch": 1.313868613138686, "percentage": 43.8, "elapsed_time": "3:17:53", "remaining_time": "4:13:57"}
{"current_steps": 370, "total_steps": 822, "loss": 0.702, "lr": 5e-06, "epoch": 1.3503649635036497, "percentage": 45.01, "elapsed_time": "3:23:15", "remaining_time": "4:08:18"}
{"current_steps": 380, "total_steps": 822, "loss": 0.7, "lr": 5e-06, "epoch": 1.3868613138686132, "percentage": 46.23, "elapsed_time": "3:28:36", "remaining_time": "4:02:38"}
{"current_steps": 390, "total_steps": 822, "loss": 0.6935, "lr": 5e-06, "epoch": 1.4233576642335766, "percentage": 47.45, "elapsed_time": "3:33:57", "remaining_time": "3:56:59"}
{"current_steps": 400, "total_steps": 822, "loss": 0.6925, "lr": 5e-06, "epoch": 1.4598540145985401, "percentage": 48.66, "elapsed_time": "3:39:17", "remaining_time": "3:51:21"}
{"current_steps": 410, "total_steps": 822, "loss": 0.6987, "lr": 5e-06, "epoch": 1.4963503649635037, "percentage": 49.88, "elapsed_time": "3:44:40", "remaining_time": "3:45:46"}
{"current_steps": 420, "total_steps": 822, "loss": 0.6975, "lr": 5e-06, "epoch": 1.5328467153284673, "percentage": 51.09, "elapsed_time": "3:50:04", "remaining_time": "3:40:12"}
{"current_steps": 430, "total_steps": 822, "loss": 0.6955, "lr": 5e-06, "epoch": 1.5693430656934306, "percentage": 52.31, "elapsed_time": "3:55:26", "remaining_time": "3:34:38"}
{"current_steps": 440, "total_steps": 822, "loss": 0.6947, "lr": 5e-06, "epoch": 1.6058394160583942, "percentage": 53.53, "elapsed_time": "4:00:46", "remaining_time": "3:29:02"}
{"current_steps": 450, "total_steps": 822, "loss": 0.6979, "lr": 5e-06, "epoch": 1.6423357664233578, "percentage": 54.74, "elapsed_time": "4:06:07", "remaining_time": "3:23:27"}
{"current_steps": 460, "total_steps": 822, "loss": 0.6887, "lr": 5e-06, "epoch": 1.6788321167883211, "percentage": 55.96, "elapsed_time": "4:11:29", "remaining_time": "3:17:54"}
{"current_steps": 470, "total_steps": 822, "loss": 0.6925, "lr": 5e-06, "epoch": 1.7153284671532847, "percentage": 57.18, "elapsed_time": "4:16:48", "remaining_time": "3:12:20"}
{"current_steps": 480, "total_steps": 822, "loss": 0.6939, "lr": 5e-06, "epoch": 1.7518248175182483, "percentage": 58.39, "elapsed_time": "4:22:11", "remaining_time": "3:06:48"}
{"current_steps": 490, "total_steps": 822, "loss": 0.6968, "lr": 5e-06, "epoch": 1.7883211678832116, "percentage": 59.61, "elapsed_time": "4:27:34", "remaining_time": "3:01:17"}
{"current_steps": 500, "total_steps": 822, "loss": 0.6903, "lr": 5e-06, "epoch": 1.8248175182481752, "percentage": 60.83, "elapsed_time": "4:32:57", "remaining_time": "2:55:47"}
{"current_steps": 510, "total_steps": 822, "loss": 0.6919, "lr": 5e-06, "epoch": 1.8613138686131387, "percentage": 62.04, "elapsed_time": "4:38:19", "remaining_time": "2:50:16"}
{"current_steps": 520, "total_steps": 822, "loss": 0.6917, "lr": 5e-06, "epoch": 1.897810218978102, "percentage": 63.26, "elapsed_time": "4:43:40", "remaining_time": "2:44:44"}
{"current_steps": 530, "total_steps": 822, "loss": 0.6947, "lr": 5e-06, "epoch": 1.9343065693430657, "percentage": 64.48, "elapsed_time": "4:49:00", "remaining_time": "2:39:13"}
{"current_steps": 540, "total_steps": 822, "loss": 0.6909, "lr": 5e-06, "epoch": 1.9708029197080292, "percentage": 65.69, "elapsed_time": "4:54:22", "remaining_time": "2:33:43"}
{"current_steps": 548, "total_steps": 822, "eval_loss": 0.7327279448509216, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "5:01:42", "remaining_time": "2:30:51"}
{"current_steps": 550, "total_steps": 822, "loss": 0.6891, "lr": 5e-06, "epoch": 2.0072992700729926, "percentage": 66.91, "elapsed_time": "5:04:02", "remaining_time": "2:30:21"}
{"current_steps": 560, "total_steps": 822, "loss": 0.6428, "lr": 5e-06, "epoch": 2.0437956204379564, "percentage": 68.13, "elapsed_time": "5:09:21", "remaining_time": "2:24:44"}
{"current_steps": 570, "total_steps": 822, "loss": 0.6418, "lr": 5e-06, "epoch": 2.0802919708029197, "percentage": 69.34, "elapsed_time": "5:14:43", "remaining_time": "2:19:08"}
{"current_steps": 580, "total_steps": 822, "loss": 0.6411, "lr": 5e-06, "epoch": 2.116788321167883, "percentage": 70.56, "elapsed_time": "5:20:04", "remaining_time": "2:13:32"}
{"current_steps": 590, "total_steps": 822, "loss": 0.6429, "lr": 5e-06, "epoch": 2.153284671532847, "percentage": 71.78, "elapsed_time": "5:25:24", "remaining_time": "2:07:57"}
{"current_steps": 600, "total_steps": 822, "loss": 0.6418, "lr": 5e-06, "epoch": 2.18978102189781, "percentage": 72.99, "elapsed_time": "5:30:46", "remaining_time": "2:02:23"}
{"current_steps": 610, "total_steps": 822, "loss": 0.6455, "lr": 5e-06, "epoch": 2.2262773722627736, "percentage": 74.21, "elapsed_time": "5:36:09", "remaining_time": "1:56:49"}
{"current_steps": 620, "total_steps": 822, "loss": 0.64, "lr": 5e-06, "epoch": 2.2627737226277373, "percentage": 75.43, "elapsed_time": "5:41:31", "remaining_time": "1:51:16"}
{"current_steps": 630, "total_steps": 822, "loss": 0.6424, "lr": 5e-06, "epoch": 2.2992700729927007, "percentage": 76.64, "elapsed_time": "5:46:51", "remaining_time": "1:45:42"}
{"current_steps": 640, "total_steps": 822, "loss": 0.6422, "lr": 5e-06, "epoch": 2.335766423357664, "percentage": 77.86, "elapsed_time": "5:52:11", "remaining_time": "1:40:09"}
{"current_steps": 650, "total_steps": 822, "loss": 0.6437, "lr": 5e-06, "epoch": 2.372262773722628, "percentage": 79.08, "elapsed_time": "5:57:34", "remaining_time": "1:34:37"}
{"current_steps": 660, "total_steps": 822, "loss": 0.6458, "lr": 5e-06, "epoch": 2.408759124087591, "percentage": 80.29, "elapsed_time": "6:02:56", "remaining_time": "1:29:05"}
{"current_steps": 670, "total_steps": 822, "loss": 0.6452, "lr": 5e-06, "epoch": 2.445255474452555, "percentage": 81.51, "elapsed_time": "6:08:18", "remaining_time": "1:23:33"}
{"current_steps": 680, "total_steps": 822, "loss": 0.644, "lr": 5e-06, "epoch": 2.4817518248175183, "percentage": 82.73, "elapsed_time": "6:13:37", "remaining_time": "1:18:01"}
{"current_steps": 690, "total_steps": 822, "loss": 0.6491, "lr": 5e-06, "epoch": 2.5182481751824817, "percentage": 83.94, "elapsed_time": "6:18:58", "remaining_time": "1:12:29"}
{"current_steps": 700, "total_steps": 822, "loss": 0.6431, "lr": 5e-06, "epoch": 2.554744525547445, "percentage": 85.16, "elapsed_time": "6:24:21", "remaining_time": "1:06:59"}
{"current_steps": 710, "total_steps": 822, "loss": 0.6473, "lr": 5e-06, "epoch": 2.591240875912409, "percentage": 86.37, "elapsed_time": "6:29:45", "remaining_time": "1:01:28"}
{"current_steps": 720, "total_steps": 822, "loss": 0.6465, "lr": 5e-06, "epoch": 2.627737226277372, "percentage": 87.59, "elapsed_time": "6:35:09", "remaining_time": "0:55:58"}
{"current_steps": 730, "total_steps": 822, "loss": 0.6456, "lr": 5e-06, "epoch": 2.664233576642336, "percentage": 88.81, "elapsed_time": "6:40:31", "remaining_time": "0:50:28"}
{"current_steps": 740, "total_steps": 822, "loss": 0.6442, "lr": 5e-06, "epoch": 2.7007299270072993, "percentage": 90.02, "elapsed_time": "6:45:54", "remaining_time": "0:44:58"}
{"current_steps": 750, "total_steps": 822, "loss": 0.6459, "lr": 5e-06, "epoch": 2.7372262773722627, "percentage": 91.24, "elapsed_time": "6:51:16", "remaining_time": "0:39:28"}
{"current_steps": 760, "total_steps": 822, "loss": 0.6503, "lr": 5e-06, "epoch": 2.7737226277372264, "percentage": 92.46, "elapsed_time": "6:56:38", "remaining_time": "0:33:59"}
{"current_steps": 770, "total_steps": 822, "loss": 0.6473, "lr": 5e-06, "epoch": 2.81021897810219, "percentage": 93.67, "elapsed_time": "7:02:00", "remaining_time": "0:28:29"}
{"current_steps": 780, "total_steps": 822, "loss": 0.6426, "lr": 5e-06, "epoch": 2.846715328467153, "percentage": 94.89, "elapsed_time": "7:07:21", "remaining_time": "0:23:00"}
{"current_steps": 790, "total_steps": 822, "loss": 0.6473, "lr": 5e-06, "epoch": 2.883211678832117, "percentage": 96.11, "elapsed_time": "7:12:41", "remaining_time": "0:17:31"}
{"current_steps": 800, "total_steps": 822, "loss": 0.651, "lr": 5e-06, "epoch": 2.9197080291970803, "percentage": 97.32, "elapsed_time": "7:18:03", "remaining_time": "0:12:02"}
{"current_steps": 810, "total_steps": 822, "loss": 0.6448, "lr": 5e-06, "epoch": 2.9562043795620436, "percentage": 98.54, "elapsed_time": "7:23:25", "remaining_time": "0:06:34"}
{"current_steps": 820, "total_steps": 822, "loss": 0.6423, "lr": 5e-06, "epoch": 2.9927007299270074, "percentage": 99.76, "elapsed_time": "7:28:47", "remaining_time": "0:01:05"}
{"current_steps": 822, "total_steps": 822, "eval_loss": 0.7341417074203491, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "7:34:13", "remaining_time": "0:00:00"}
{"current_steps": 822, "total_steps": 822, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "7:35:48", "remaining_time": "0:00:00"}