File size: 17,626 Bytes
b2ab87d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
322487a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
f92f79c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
a639aad
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
{"current_steps": 10, "total_steps": 957, "loss": 0.9785, "lr": 5e-06, "epoch": 0.031323414252153486, "percentage": 1.04, "elapsed_time": "0:09:44", "remaining_time": "15:21:50"}
{"current_steps": 20, "total_steps": 957, "loss": 0.8565, "lr": 5e-06, "epoch": 0.06264682850430697, "percentage": 2.09, "elapsed_time": "0:19:23", "remaining_time": "15:08:24"}
{"current_steps": 30, "total_steps": 957, "loss": 0.8274, "lr": 5e-06, "epoch": 0.09397024275646046, "percentage": 3.13, "elapsed_time": "0:29:02", "remaining_time": "14:57:29"}
{"current_steps": 40, "total_steps": 957, "loss": 0.799, "lr": 5e-06, "epoch": 0.12529365700861395, "percentage": 4.18, "elapsed_time": "0:38:42", "remaining_time": "14:47:32"}
{"current_steps": 50, "total_steps": 957, "loss": 0.7847, "lr": 5e-06, "epoch": 0.15661707126076743, "percentage": 5.22, "elapsed_time": "0:48:22", "remaining_time": "14:37:26"}
{"current_steps": 60, "total_steps": 957, "loss": 0.7733, "lr": 5e-06, "epoch": 0.18794048551292092, "percentage": 6.27, "elapsed_time": "0:58:01", "remaining_time": "14:27:35"}
{"current_steps": 70, "total_steps": 957, "loss": 0.7543, "lr": 5e-06, "epoch": 0.2192638997650744, "percentage": 7.31, "elapsed_time": "1:07:41", "remaining_time": "14:17:49"}
{"current_steps": 80, "total_steps": 957, "loss": 0.7505, "lr": 5e-06, "epoch": 0.2505873140172279, "percentage": 8.36, "elapsed_time": "1:17:21", "remaining_time": "14:07:59"}
{"current_steps": 90, "total_steps": 957, "loss": 0.7414, "lr": 5e-06, "epoch": 0.28191072826938135, "percentage": 9.4, "elapsed_time": "1:27:00", "remaining_time": "13:58:13"}
{"current_steps": 100, "total_steps": 957, "loss": 0.741, "lr": 5e-06, "epoch": 0.31323414252153486, "percentage": 10.45, "elapsed_time": "1:36:39", "remaining_time": "13:48:23"}
{"current_steps": 110, "total_steps": 957, "loss": 0.7386, "lr": 5e-06, "epoch": 0.3445575567736883, "percentage": 11.49, "elapsed_time": "1:46:19", "remaining_time": "13:38:39"}
{"current_steps": 120, "total_steps": 957, "loss": 0.7283, "lr": 5e-06, "epoch": 0.37588097102584184, "percentage": 12.54, "elapsed_time": "1:55:57", "remaining_time": "13:28:50"}
{"current_steps": 130, "total_steps": 957, "loss": 0.7326, "lr": 5e-06, "epoch": 0.4072043852779953, "percentage": 13.58, "elapsed_time": "2:05:37", "remaining_time": "13:19:08"}
{"current_steps": 140, "total_steps": 957, "loss": 0.7239, "lr": 5e-06, "epoch": 0.4385277995301488, "percentage": 14.63, "elapsed_time": "2:15:16", "remaining_time": "13:09:23"}
{"current_steps": 150, "total_steps": 957, "loss": 0.7294, "lr": 5e-06, "epoch": 0.46985121378230227, "percentage": 15.67, "elapsed_time": "2:24:55", "remaining_time": "12:59:43"}
{"current_steps": 160, "total_steps": 957, "loss": 0.7287, "lr": 5e-06, "epoch": 0.5011746280344558, "percentage": 16.72, "elapsed_time": "2:34:34", "remaining_time": "12:50:00"}
{"current_steps": 170, "total_steps": 957, "loss": 0.7208, "lr": 5e-06, "epoch": 0.5324980422866092, "percentage": 17.76, "elapsed_time": "2:44:12", "remaining_time": "12:40:11"}
{"current_steps": 180, "total_steps": 957, "loss": 0.7194, "lr": 5e-06, "epoch": 0.5638214565387627, "percentage": 18.81, "elapsed_time": "2:53:52", "remaining_time": "12:30:32"}
{"current_steps": 190, "total_steps": 957, "loss": 0.7209, "lr": 5e-06, "epoch": 0.5951448707909162, "percentage": 19.85, "elapsed_time": "3:03:30", "remaining_time": "12:20:48"}
{"current_steps": 200, "total_steps": 957, "loss": 0.719, "lr": 5e-06, "epoch": 0.6264682850430697, "percentage": 20.9, "elapsed_time": "3:13:08", "remaining_time": "12:11:02"}
{"current_steps": 210, "total_steps": 957, "loss": 0.7155, "lr": 5e-06, "epoch": 0.6577916992952232, "percentage": 21.94, "elapsed_time": "3:22:46", "remaining_time": "12:01:19"}
{"current_steps": 220, "total_steps": 957, "loss": 0.7137, "lr": 5e-06, "epoch": 0.6891151135473766, "percentage": 22.99, "elapsed_time": "3:32:25", "remaining_time": "11:51:35"}
{"current_steps": 230, "total_steps": 957, "loss": 0.7145, "lr": 5e-06, "epoch": 0.7204385277995301, "percentage": 24.03, "elapsed_time": "3:42:03", "remaining_time": "11:41:54"}
{"current_steps": 240, "total_steps": 957, "loss": 0.7151, "lr": 5e-06, "epoch": 0.7517619420516837, "percentage": 25.08, "elapsed_time": "3:51:42", "remaining_time": "11:32:14"}
{"current_steps": 250, "total_steps": 957, "loss": 0.7145, "lr": 5e-06, "epoch": 0.7830853563038371, "percentage": 26.12, "elapsed_time": "4:01:22", "remaining_time": "11:22:36"}
{"current_steps": 260, "total_steps": 957, "loss": 0.7174, "lr": 5e-06, "epoch": 0.8144087705559906, "percentage": 27.17, "elapsed_time": "4:11:02", "remaining_time": "11:12:58"}
{"current_steps": 270, "total_steps": 957, "loss": 0.7089, "lr": 5e-06, "epoch": 0.845732184808144, "percentage": 28.21, "elapsed_time": "4:20:42", "remaining_time": "11:03:20"}
{"current_steps": 280, "total_steps": 957, "loss": 0.7113, "lr": 5e-06, "epoch": 0.8770555990602976, "percentage": 29.26, "elapsed_time": "4:30:21", "remaining_time": "10:53:41"}
{"current_steps": 290, "total_steps": 957, "loss": 0.7087, "lr": 5e-06, "epoch": 0.9083790133124511, "percentage": 30.3, "elapsed_time": "4:40:00", "remaining_time": "10:44:00"}
{"current_steps": 300, "total_steps": 957, "loss": 0.7035, "lr": 5e-06, "epoch": 0.9397024275646045, "percentage": 31.35, "elapsed_time": "4:49:39", "remaining_time": "10:34:20"}
{"current_steps": 310, "total_steps": 957, "loss": 0.7101, "lr": 5e-06, "epoch": 0.971025841816758, "percentage": 32.39, "elapsed_time": "4:59:18", "remaining_time": "10:24:40"}
{"current_steps": 319, "total_steps": 957, "eval_loss": 0.7040486931800842, "epoch": 0.9992169146436961, "percentage": 33.33, "elapsed_time": "5:13:53", "remaining_time": "10:27:46"}
{"current_steps": 320, "total_steps": 957, "loss": 0.7543, "lr": 5e-06, "epoch": 1.0023492560689116, "percentage": 33.44, "elapsed_time": "5:15:48", "remaining_time": "10:28:38"}
{"current_steps": 330, "total_steps": 957, "loss": 0.6574, "lr": 5e-06, "epoch": 1.033672670321065, "percentage": 34.48, "elapsed_time": "5:25:28", "remaining_time": "10:18:23"}
{"current_steps": 340, "total_steps": 957, "loss": 0.6596, "lr": 5e-06, "epoch": 1.0649960845732185, "percentage": 35.53, "elapsed_time": "5:35:08", "remaining_time": "10:08:10"}
{"current_steps": 350, "total_steps": 957, "loss": 0.6634, "lr": 5e-06, "epoch": 1.096319498825372, "percentage": 36.57, "elapsed_time": "5:44:47", "remaining_time": "9:57:58"}
{"current_steps": 360, "total_steps": 957, "loss": 0.6588, "lr": 5e-06, "epoch": 1.1276429130775254, "percentage": 37.62, "elapsed_time": "5:54:27", "remaining_time": "9:47:48"}
{"current_steps": 370, "total_steps": 957, "loss": 0.6627, "lr": 5e-06, "epoch": 1.1589663273296789, "percentage": 38.66, "elapsed_time": "6:04:07", "remaining_time": "9:37:41"}
{"current_steps": 380, "total_steps": 957, "loss": 0.6623, "lr": 5e-06, "epoch": 1.1902897415818323, "percentage": 39.71, "elapsed_time": "6:13:47", "remaining_time": "9:27:34"}
{"current_steps": 390, "total_steps": 957, "loss": 0.6595, "lr": 5e-06, "epoch": 1.221613155833986, "percentage": 40.75, "elapsed_time": "6:23:28", "remaining_time": "9:17:30"}
{"current_steps": 400, "total_steps": 957, "loss": 0.6602, "lr": 5e-06, "epoch": 1.2529365700861395, "percentage": 41.8, "elapsed_time": "6:33:08", "remaining_time": "9:07:27"}
{"current_steps": 410, "total_steps": 957, "loss": 0.6623, "lr": 5e-06, "epoch": 1.284259984338293, "percentage": 42.84, "elapsed_time": "6:42:49", "remaining_time": "8:57:25"}
{"current_steps": 420, "total_steps": 957, "loss": 0.6623, "lr": 5e-06, "epoch": 1.3155833985904464, "percentage": 43.89, "elapsed_time": "6:52:30", "remaining_time": "8:47:25"}
{"current_steps": 430, "total_steps": 957, "loss": 0.6624, "lr": 5e-06, "epoch": 1.3469068128425998, "percentage": 44.93, "elapsed_time": "7:02:11", "remaining_time": "8:37:25"}
{"current_steps": 440, "total_steps": 957, "loss": 0.6597, "lr": 5e-06, "epoch": 1.3782302270947533, "percentage": 45.98, "elapsed_time": "7:11:52", "remaining_time": "8:27:26"}
{"current_steps": 450, "total_steps": 957, "loss": 0.6601, "lr": 5e-06, "epoch": 1.4095536413469067, "percentage": 47.02, "elapsed_time": "7:21:32", "remaining_time": "8:17:28"}
{"current_steps": 460, "total_steps": 957, "loss": 0.6579, "lr": 5e-06, "epoch": 1.4408770555990604, "percentage": 48.07, "elapsed_time": "7:31:13", "remaining_time": "8:07:30"}
{"current_steps": 470, "total_steps": 957, "loss": 0.6617, "lr": 5e-06, "epoch": 1.4722004698512139, "percentage": 49.11, "elapsed_time": "7:40:53", "remaining_time": "7:57:33"}
{"current_steps": 480, "total_steps": 957, "loss": 0.6575, "lr": 5e-06, "epoch": 1.5035238841033673, "percentage": 50.16, "elapsed_time": "7:50:33", "remaining_time": "7:47:37"}
{"current_steps": 490, "total_steps": 957, "loss": 0.6619, "lr": 5e-06, "epoch": 1.5348472983555208, "percentage": 51.2, "elapsed_time": "8:00:13", "remaining_time": "7:37:41"}
{"current_steps": 500, "total_steps": 957, "loss": 0.6582, "lr": 5e-06, "epoch": 1.5661707126076743, "percentage": 52.25, "elapsed_time": "8:09:52", "remaining_time": "7:27:44"}
{"current_steps": 510, "total_steps": 957, "loss": 0.6606, "lr": 5e-06, "epoch": 1.5974941268598277, "percentage": 53.29, "elapsed_time": "8:19:33", "remaining_time": "7:17:50"}
{"current_steps": 520, "total_steps": 957, "loss": 0.6591, "lr": 5e-06, "epoch": 1.6288175411119812, "percentage": 54.34, "elapsed_time": "8:29:13", "remaining_time": "7:07:56"}
{"current_steps": 530, "total_steps": 957, "loss": 0.6567, "lr": 5e-06, "epoch": 1.6601409553641346, "percentage": 55.38, "elapsed_time": "8:38:54", "remaining_time": "6:58:03"}
{"current_steps": 540, "total_steps": 957, "loss": 0.6558, "lr": 5e-06, "epoch": 1.691464369616288, "percentage": 56.43, "elapsed_time": "8:48:34", "remaining_time": "6:48:10"}
{"current_steps": 550, "total_steps": 957, "loss": 0.6552, "lr": 5e-06, "epoch": 1.7227877838684416, "percentage": 57.47, "elapsed_time": "8:58:14", "remaining_time": "6:38:17"}
{"current_steps": 560, "total_steps": 957, "loss": 0.6569, "lr": 5e-06, "epoch": 1.754111198120595, "percentage": 58.52, "elapsed_time": "9:07:55", "remaining_time": "6:28:26"}
{"current_steps": 570, "total_steps": 957, "loss": 0.6579, "lr": 5e-06, "epoch": 1.7854346123727485, "percentage": 59.56, "elapsed_time": "9:17:36", "remaining_time": "6:18:35"}
{"current_steps": 580, "total_steps": 957, "loss": 0.6586, "lr": 5e-06, "epoch": 1.8167580266249022, "percentage": 60.61, "elapsed_time": "9:27:16", "remaining_time": "6:08:43"}
{"current_steps": 590, "total_steps": 957, "loss": 0.6602, "lr": 5e-06, "epoch": 1.8480814408770556, "percentage": 61.65, "elapsed_time": "9:36:57", "remaining_time": "5:58:53"}
{"current_steps": 600, "total_steps": 957, "loss": 0.6562, "lr": 5e-06, "epoch": 1.879404855129209, "percentage": 62.7, "elapsed_time": "9:46:38", "remaining_time": "5:49:02"}
{"current_steps": 610, "total_steps": 957, "loss": 0.6598, "lr": 5e-06, "epoch": 1.9107282693813625, "percentage": 63.74, "elapsed_time": "9:56:19", "remaining_time": "5:39:13"}
{"current_steps": 620, "total_steps": 957, "loss": 0.6577, "lr": 5e-06, "epoch": 1.9420516836335162, "percentage": 64.79, "elapsed_time": "10:05:59", "remaining_time": "5:29:23"}
{"current_steps": 630, "total_steps": 957, "loss": 0.6588, "lr": 5e-06, "epoch": 1.9733750978856697, "percentage": 65.83, "elapsed_time": "10:15:39", "remaining_time": "5:19:33"}
{"current_steps": 638, "total_steps": 957, "eval_loss": 0.6915597319602966, "epoch": 1.9984338292873924, "percentage": 66.67, "elapsed_time": "10:29:32", "remaining_time": "5:14:46"}
{"current_steps": 640, "total_steps": 957, "loss": 0.7005, "lr": 5e-06, "epoch": 2.004698512137823, "percentage": 66.88, "elapsed_time": "10:32:10", "remaining_time": "5:13:07"}
{"current_steps": 650, "total_steps": 957, "loss": 0.61, "lr": 5e-06, "epoch": 2.0360219263899766, "percentage": 67.92, "elapsed_time": "10:41:48", "remaining_time": "5:03:08"}
{"current_steps": 660, "total_steps": 957, "loss": 0.6129, "lr": 5e-06, "epoch": 2.06734534064213, "percentage": 68.97, "elapsed_time": "10:51:28", "remaining_time": "4:53:09"}
{"current_steps": 670, "total_steps": 957, "loss": 0.6073, "lr": 5e-06, "epoch": 2.0986687548942835, "percentage": 70.01, "elapsed_time": "11:01:08", "remaining_time": "4:43:12"}
{"current_steps": 680, "total_steps": 957, "loss": 0.6069, "lr": 5e-06, "epoch": 2.129992169146437, "percentage": 71.06, "elapsed_time": "11:10:47", "remaining_time": "4:33:15"}
{"current_steps": 690, "total_steps": 957, "loss": 0.6115, "lr": 5e-06, "epoch": 2.1613155833985904, "percentage": 72.1, "elapsed_time": "11:20:26", "remaining_time": "4:23:18"}
{"current_steps": 700, "total_steps": 957, "loss": 0.6083, "lr": 5e-06, "epoch": 2.192638997650744, "percentage": 73.15, "elapsed_time": "11:30:05", "remaining_time": "4:13:21"}
{"current_steps": 710, "total_steps": 957, "loss": 0.6055, "lr": 5e-06, "epoch": 2.2239624119028973, "percentage": 74.19, "elapsed_time": "11:39:44", "remaining_time": "4:03:25"}
{"current_steps": 720, "total_steps": 957, "loss": 0.612, "lr": 5e-06, "epoch": 2.255285826155051, "percentage": 75.24, "elapsed_time": "11:49:23", "remaining_time": "3:53:30"}
{"current_steps": 730, "total_steps": 957, "loss": 0.6119, "lr": 5e-06, "epoch": 2.2866092404072043, "percentage": 76.28, "elapsed_time": "11:59:03", "remaining_time": "3:43:35"}
{"current_steps": 740, "total_steps": 957, "loss": 0.6113, "lr": 5e-06, "epoch": 2.3179326546593577, "percentage": 77.32, "elapsed_time": "12:08:42", "remaining_time": "3:33:41"}
{"current_steps": 750, "total_steps": 957, "loss": 0.6111, "lr": 5e-06, "epoch": 2.349256068911511, "percentage": 78.37, "elapsed_time": "12:18:20", "remaining_time": "3:23:46"}
{"current_steps": 760, "total_steps": 957, "loss": 0.6121, "lr": 5e-06, "epoch": 2.3805794831636646, "percentage": 79.41, "elapsed_time": "12:27:59", "remaining_time": "3:13:53"}
{"current_steps": 770, "total_steps": 957, "loss": 0.6159, "lr": 5e-06, "epoch": 2.4119028974158185, "percentage": 80.46, "elapsed_time": "12:37:38", "remaining_time": "3:03:59"}
{"current_steps": 780, "total_steps": 957, "loss": 0.6142, "lr": 5e-06, "epoch": 2.443226311667972, "percentage": 81.5, "elapsed_time": "12:47:17", "remaining_time": "2:54:06"}
{"current_steps": 790, "total_steps": 957, "loss": 0.6181, "lr": 5e-06, "epoch": 2.4745497259201255, "percentage": 82.55, "elapsed_time": "12:56:56", "remaining_time": "2:44:14"}
{"current_steps": 800, "total_steps": 957, "loss": 0.6127, "lr": 5e-06, "epoch": 2.505873140172279, "percentage": 83.59, "elapsed_time": "13:06:34", "remaining_time": "2:34:21"}
{"current_steps": 810, "total_steps": 957, "loss": 0.6192, "lr": 5e-06, "epoch": 2.5371965544244324, "percentage": 84.64, "elapsed_time": "13:16:13", "remaining_time": "2:24:29"}
{"current_steps": 820, "total_steps": 957, "loss": 0.6098, "lr": 5e-06, "epoch": 2.568519968676586, "percentage": 85.68, "elapsed_time": "13:25:51", "remaining_time": "2:14:38"}
{"current_steps": 830, "total_steps": 957, "loss": 0.6126, "lr": 5e-06, "epoch": 2.5998433829287393, "percentage": 86.73, "elapsed_time": "13:35:28", "remaining_time": "2:04:46"}
{"current_steps": 840, "total_steps": 957, "loss": 0.618, "lr": 5e-06, "epoch": 2.6311667971808927, "percentage": 87.77, "elapsed_time": "13:45:06", "remaining_time": "1:54:55"}
{"current_steps": 850, "total_steps": 957, "loss": 0.6132, "lr": 5e-06, "epoch": 2.662490211433046, "percentage": 88.82, "elapsed_time": "13:54:45", "remaining_time": "1:45:04"}
{"current_steps": 860, "total_steps": 957, "loss": 0.6211, "lr": 5e-06, "epoch": 2.6938136256851997, "percentage": 89.86, "elapsed_time": "14:04:24", "remaining_time": "1:35:14"}
{"current_steps": 870, "total_steps": 957, "loss": 0.6072, "lr": 5e-06, "epoch": 2.725137039937353, "percentage": 90.91, "elapsed_time": "14:14:04", "remaining_time": "1:25:24"}
{"current_steps": 880, "total_steps": 957, "loss": 0.6181, "lr": 5e-06, "epoch": 2.7564604541895066, "percentage": 91.95, "elapsed_time": "14:23:43", "remaining_time": "1:15:34"}
{"current_steps": 890, "total_steps": 957, "loss": 0.6183, "lr": 5e-06, "epoch": 2.78778386844166, "percentage": 93.0, "elapsed_time": "14:33:23", "remaining_time": "1:05:44"}
{"current_steps": 900, "total_steps": 957, "loss": 0.6185, "lr": 5e-06, "epoch": 2.8191072826938135, "percentage": 94.04, "elapsed_time": "14:43:02", "remaining_time": "0:55:55"}
{"current_steps": 910, "total_steps": 957, "loss": 0.6113, "lr": 5e-06, "epoch": 2.850430696945967, "percentage": 95.09, "elapsed_time": "14:52:41", "remaining_time": "0:46:06"}
{"current_steps": 920, "total_steps": 957, "loss": 0.613, "lr": 5e-06, "epoch": 2.881754111198121, "percentage": 96.13, "elapsed_time": "15:02:20", "remaining_time": "0:36:17"}
{"current_steps": 930, "total_steps": 957, "loss": 0.6178, "lr": 5e-06, "epoch": 2.913077525450274, "percentage": 97.18, "elapsed_time": "15:12:00", "remaining_time": "0:26:28"}
{"current_steps": 940, "total_steps": 957, "loss": 0.6157, "lr": 5e-06, "epoch": 2.9444009397024278, "percentage": 98.22, "elapsed_time": "15:21:40", "remaining_time": "0:16:40"}
{"current_steps": 950, "total_steps": 957, "loss": 0.6176, "lr": 5e-06, "epoch": 2.975724353954581, "percentage": 99.27, "elapsed_time": "15:31:18", "remaining_time": "0:06:51"}
{"current_steps": 957, "total_steps": 957, "eval_loss": 0.6914501786231995, "epoch": 2.9976507439310884, "percentage": 100.0, "elapsed_time": "15:44:59", "remaining_time": "0:00:00"}
{"current_steps": 957, "total_steps": 957, "epoch": 2.9976507439310884, "percentage": 100.0, "elapsed_time": "15:46:26", "remaining_time": "0:00:00"}