mau-cr commited on
Commit
a141e13
·
verified ·
1 Parent(s): 45a5425

Add training log history

Browse files
Files changed (1) hide show
  1. log_history.json +173 -0
log_history.json ADDED
@@ -0,0 +1,173 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "loss": 3.9173959350585936,
4
+ "grad_norm": 1.2155354022979736,
5
+ "learning_rate": 0.00099,
6
+ "epoch": 4.3478260869565215,
7
+ "step": 100
8
+ },
9
+ {
10
+ "eval_loss": 0.5551369786262512,
11
+ "eval_wer": 0.533585619678335,
12
+ "eval_runtime": 4.1258,
13
+ "eval_samples_per_second": 36.842,
14
+ "eval_steps_per_second": 4.605,
15
+ "epoch": 4.3478260869565215,
16
+ "step": 100
17
+ },
18
+ {
19
+ "loss": 0.6211311721801758,
20
+ "grad_norm": 0.5991238355636597,
21
+ "learning_rate": 0.0008792682926829268,
22
+ "epoch": 8.695652173913043,
23
+ "step": 200
24
+ },
25
+ {
26
+ "eval_loss": 0.5127682089805603,
27
+ "eval_wer": 0.49479659413434246,
28
+ "eval_runtime": 4.1435,
29
+ "eval_samples_per_second": 36.684,
30
+ "eval_steps_per_second": 4.586,
31
+ "epoch": 8.695652173913043,
32
+ "step": 200
33
+ },
34
+ {
35
+ "loss": 0.48980007171630857,
36
+ "grad_norm": 0.5660077333450317,
37
+ "learning_rate": 0.0007573170731707317,
38
+ "epoch": 13.043478260869565,
39
+ "step": 300
40
+ },
41
+ {
42
+ "eval_loss": 0.5000773072242737,
43
+ "eval_wer": 0.47776726584673607,
44
+ "eval_runtime": 4.1244,
45
+ "eval_samples_per_second": 36.854,
46
+ "eval_steps_per_second": 4.607,
47
+ "epoch": 13.043478260869565,
48
+ "step": 300
49
+ },
50
+ {
51
+ "loss": 0.41821846008300784,
52
+ "grad_norm": 0.641327440738678,
53
+ "learning_rate": 0.0006353658536585366,
54
+ "epoch": 17.391304347826086,
55
+ "step": 400
56
+ },
57
+ {
58
+ "eval_loss": 0.4955653250217438,
59
+ "eval_wer": 0.4725638599810785,
60
+ "eval_runtime": 4.1284,
61
+ "eval_samples_per_second": 36.818,
62
+ "eval_steps_per_second": 4.602,
63
+ "epoch": 17.391304347826086,
64
+ "step": 400
65
+ },
66
+ {
67
+ "loss": 0.3750358200073242,
68
+ "grad_norm": 1.793125867843628,
69
+ "learning_rate": 0.0005134146341463415,
70
+ "epoch": 21.73913043478261,
71
+ "step": 500
72
+ },
73
+ {
74
+ "eval_loss": 0.516922116279602,
75
+ "eval_wer": 0.47540208136234624,
76
+ "eval_runtime": 4.1272,
77
+ "eval_samples_per_second": 36.829,
78
+ "eval_steps_per_second": 4.604,
79
+ "epoch": 21.73913043478261,
80
+ "step": 500
81
+ },
82
+ {
83
+ "loss": 0.3346158218383789,
84
+ "grad_norm": 0.6309618949890137,
85
+ "learning_rate": 0.00039146341463414634,
86
+ "epoch": 26.08695652173913,
87
+ "step": 600
88
+ },
89
+ {
90
+ "eval_loss": 0.507932186126709,
91
+ "eval_wer": 0.45931882686849573,
92
+ "eval_runtime": 4.1444,
93
+ "eval_samples_per_second": 36.676,
94
+ "eval_steps_per_second": 4.585,
95
+ "epoch": 26.08695652173913,
96
+ "step": 600
97
+ },
98
+ {
99
+ "loss": 0.30129409790039063,
100
+ "grad_norm": 0.8467895984649658,
101
+ "learning_rate": 0.0002695121951219512,
102
+ "epoch": 30.434782608695652,
103
+ "step": 700
104
+ },
105
+ {
106
+ "eval_loss": 0.5416971445083618,
107
+ "eval_wer": 0.4649952696310312,
108
+ "eval_runtime": 4.1267,
109
+ "eval_samples_per_second": 36.833,
110
+ "eval_steps_per_second": 4.604,
111
+ "epoch": 30.434782608695652,
112
+ "step": 700
113
+ },
114
+ {
115
+ "loss": 0.27793073654174805,
116
+ "grad_norm": 0.9243687391281128,
117
+ "learning_rate": 0.0001475609756097561,
118
+ "epoch": 34.78260869565217,
119
+ "step": 800
120
+ },
121
+ {
122
+ "eval_loss": 0.528235673904419,
123
+ "eval_wer": 0.45695364238410596,
124
+ "eval_runtime": 4.148,
125
+ "eval_samples_per_second": 36.644,
126
+ "eval_steps_per_second": 4.581,
127
+ "epoch": 34.78260869565217,
128
+ "step": 800
129
+ },
130
+ {
131
+ "loss": 0.25999046325683595,
132
+ "grad_norm": 1.9254482984542847,
133
+ "learning_rate": 2.5609756097560973e-05,
134
+ "epoch": 39.130434782608695,
135
+ "step": 900
136
+ },
137
+ {
138
+ "eval_loss": 0.5384841561317444,
139
+ "eval_wer": 0.4631031220435194,
140
+ "eval_runtime": 4.1312,
141
+ "eval_samples_per_second": 36.793,
142
+ "eval_steps_per_second": 4.599,
143
+ "epoch": 39.130434782608695,
144
+ "step": 900
145
+ },
146
+ {
147
+ "eval_loss": 0.5373823046684265,
148
+ "eval_wer": 0.4621570482497635,
149
+ "eval_runtime": 4.1433,
150
+ "eval_samples_per_second": 36.685,
151
+ "eval_steps_per_second": 4.586,
152
+ "epoch": 40.0,
153
+ "step": 920
154
+ },
155
+ {
156
+ "train_runtime": 14796.7383,
157
+ "train_samples_per_second": 1.987,
158
+ "train_steps_per_second": 0.062,
159
+ "total_flos": 3.925662755756644e+19,
160
+ "train_loss": 0.7654728495556375,
161
+ "epoch": 40.0,
162
+ "step": 920
163
+ },
164
+ {
165
+ "test_loss": 0.5563547015190125,
166
+ "test_wer": 0.46591276252019387,
167
+ "test_runtime": 6.8586,
168
+ "test_samples_per_second": 38.929,
169
+ "test_steps_per_second": 4.957,
170
+ "epoch": 40.0,
171
+ "step": 920
172
+ }
173
+ ]