ShihTing committed on
Commit
a065358
·
1 Parent(s): 0796d8f

Upload trainer_state.json

Browse files
Files changed (1) hide show
  1. trainer_state.json +96 -96
trainer_state.json CHANGED
@@ -9,188 +9,188 @@
9
  "log_history": [
10
  {
11
  "epoch": 1.07,
12
- "eval_accuracy": 0.8663101604278075,
13
- "eval_loss": 0.5277199149131775,
14
- "eval_recall": 0.6122448979591837,
15
- "eval_runtime": 10.117,
16
- "eval_samples_per_second": 18.484,
17
- "eval_steps_per_second": 4.646,
18
  "step": 200
19
  },
20
  {
21
  "epoch": 2.14,
22
- "eval_accuracy": 0.7647058823529411,
23
- "eval_loss": 0.9699290990829468,
24
- "eval_recall": 0.8979591836734694,
25
- "eval_runtime": 10.119,
26
- "eval_samples_per_second": 18.48,
27
- "eval_steps_per_second": 4.645,
28
  "step": 400
29
  },
30
  {
31
  "epoch": 2.67,
32
  "learning_rate": 4.554367201426025e-05,
33
- "loss": 0.4246,
34
  "step": 500
35
  },
36
  {
37
  "epoch": 3.21,
38
- "eval_accuracy": 0.8663101604278075,
39
- "eval_loss": 0.7973827719688416,
40
- "eval_recall": 0.5510204081632653,
41
- "eval_runtime": 10.148,
42
- "eval_samples_per_second": 18.427,
43
- "eval_steps_per_second": 4.631,
44
  "step": 600
45
  },
46
  {
47
  "epoch": 4.28,
48
- "eval_accuracy": 0.8716577540106952,
49
- "eval_loss": 0.9027533531188965,
50
- "eval_recall": 0.5714285714285714,
51
- "eval_runtime": 10.102,
52
- "eval_samples_per_second": 18.511,
53
- "eval_steps_per_second": 4.653,
54
  "step": 800
55
  },
56
  {
57
  "epoch": 5.35,
58
  "learning_rate": 4.10873440285205e-05,
59
- "loss": 0.1059,
60
  "step": 1000
61
  },
62
  {
63
  "epoch": 5.35,
64
- "eval_accuracy": 0.8609625668449198,
65
- "eval_loss": 0.8567710518836975,
66
- "eval_recall": 0.7346938775510204,
67
- "eval_runtime": 10.117,
68
- "eval_samples_per_second": 18.484,
69
- "eval_steps_per_second": 4.646,
70
  "step": 1000
71
  },
72
  {
73
  "epoch": 6.42,
74
- "eval_accuracy": 0.9037433155080213,
75
- "eval_loss": 0.8681638240814209,
76
- "eval_recall": 0.7755102040816326,
77
- "eval_runtime": 10.157,
78
- "eval_samples_per_second": 18.411,
79
- "eval_steps_per_second": 4.627,
80
  "step": 1200
81
  },
82
  {
83
  "epoch": 7.49,
84
- "eval_accuracy": 0.8823529411764706,
85
- "eval_loss": 0.9168533682823181,
86
- "eval_recall": 0.6938775510204082,
87
- "eval_runtime": 10.271,
88
- "eval_samples_per_second": 18.207,
89
- "eval_steps_per_second": 4.576,
90
  "step": 1400
91
  },
92
  {
93
  "epoch": 8.02,
94
  "learning_rate": 3.6631016042780753e-05,
95
- "loss": 0.0555,
96
  "step": 1500
97
  },
98
  {
99
  "epoch": 8.56,
100
- "eval_accuracy": 0.8556149732620321,
101
- "eval_loss": 0.9982467293739319,
102
- "eval_recall": 0.7346938775510204,
103
- "eval_runtime": 10.134,
104
- "eval_samples_per_second": 18.453,
105
- "eval_steps_per_second": 4.638,
106
  "step": 1600
107
  },
108
  {
109
  "epoch": 9.63,
110
- "eval_accuracy": 0.8663101604278075,
111
- "eval_loss": 1.04860258102417,
112
- "eval_recall": 0.7142857142857143,
113
- "eval_runtime": 10.225,
114
- "eval_samples_per_second": 18.289,
115
- "eval_steps_per_second": 4.597,
116
  "step": 1800
117
  },
118
  {
119
  "epoch": 10.7,
120
  "learning_rate": 3.2174688057041004e-05,
121
- "loss": 0.0224,
122
  "step": 2000
123
  },
124
  {
125
  "epoch": 10.7,
126
- "eval_accuracy": 0.8770053475935828,
127
- "eval_loss": 1.0292185544967651,
128
- "eval_recall": 0.673469387755102,
129
- "eval_runtime": 10.362,
130
- "eval_samples_per_second": 18.047,
131
- "eval_steps_per_second": 4.536,
132
  "step": 2000
133
  },
134
  {
135
  "epoch": 11.76,
136
- "eval_accuracy": 0.8663101604278075,
137
- "eval_loss": 1.1402537822723389,
138
- "eval_recall": 0.673469387755102,
139
- "eval_runtime": 10.233,
140
- "eval_samples_per_second": 18.274,
141
- "eval_steps_per_second": 4.593,
142
  "step": 2200
143
  },
144
  {
145
  "epoch": 12.83,
146
- "eval_accuracy": 0.8716577540106952,
147
- "eval_loss": 1.1431100368499756,
148
- "eval_recall": 0.673469387755102,
149
- "eval_runtime": 10.226,
150
- "eval_samples_per_second": 18.287,
151
- "eval_steps_per_second": 4.596,
152
  "step": 2400
153
  },
154
  {
155
  "epoch": 13.37,
156
  "learning_rate": 2.7718360071301247e-05,
157
- "loss": 0.0001,
158
  "step": 2500
159
  },
160
  {
161
  "epoch": 13.9,
162
- "eval_accuracy": 0.8770053475935828,
163
- "eval_loss": 1.1465816497802734,
164
- "eval_recall": 0.6530612244897959,
165
- "eval_runtime": 10.254,
166
- "eval_samples_per_second": 18.237,
167
- "eval_steps_per_second": 4.584,
168
  "step": 2600
169
  },
170
  {
171
  "epoch": 14.97,
172
- "eval_accuracy": 0.8716577540106952,
173
- "eval_loss": 1.1757899522781372,
174
- "eval_recall": 0.6530612244897959,
175
- "eval_runtime": 10.346,
176
- "eval_samples_per_second": 18.075,
177
- "eval_steps_per_second": 4.543,
178
  "step": 2800
179
  },
180
  {
181
  "epoch": 16.04,
182
  "learning_rate": 2.32620320855615e-05,
183
- "loss": 0.0,
184
  "step": 3000
185
  },
186
  {
187
  "epoch": 16.04,
188
- "eval_accuracy": 0.8823529411764706,
189
- "eval_loss": 1.1856350898742676,
190
- "eval_recall": 0.6530612244897959,
191
- "eval_runtime": 10.397,
192
- "eval_samples_per_second": 17.986,
193
- "eval_steps_per_second": 4.521,
194
  "step": 3000
195
  }
196
  ],
 
9
  "log_history": [
10
  {
11
  "epoch": 1.07,
12
+ "eval_accuracy": 0.5401069518716578,
13
+ "eval_loss": 1.1939018964767456,
14
+ "eval_recall": 0.5401069518716578,
15
+ "eval_runtime": 10.154,
16
+ "eval_samples_per_second": 18.416,
17
+ "eval_steps_per_second": 4.629,
18
  "step": 200
19
  },
20
  {
21
  "epoch": 2.14,
22
+ "eval_accuracy": 0.6951871657754011,
23
+ "eval_loss": 0.8892518877983093,
24
+ "eval_recall": 0.6951871657754011,
25
+ "eval_runtime": 10.177,
26
+ "eval_samples_per_second": 18.375,
27
+ "eval_steps_per_second": 4.618,
28
  "step": 400
29
  },
30
  {
31
  "epoch": 2.67,
32
  "learning_rate": 4.554367201426025e-05,
33
+ "loss": 1.2205,
34
  "step": 500
35
  },
36
  {
37
  "epoch": 3.21,
38
+ "eval_accuracy": 0.6149732620320856,
39
+ "eval_loss": 1.2934410572052002,
40
+ "eval_recall": 0.6149732620320856,
41
+ "eval_runtime": 10.164,
42
+ "eval_samples_per_second": 18.398,
43
+ "eval_steps_per_second": 4.624,
44
  "step": 600
45
  },
46
  {
47
  "epoch": 4.28,
48
+ "eval_accuracy": 0.6470588235294118,
49
+ "eval_loss": 1.179315447807312,
50
+ "eval_recall": 0.6470588235294118,
51
+ "eval_runtime": 10.156,
52
+ "eval_samples_per_second": 18.413,
53
+ "eval_steps_per_second": 4.628,
54
  "step": 800
55
  },
56
  {
57
  "epoch": 5.35,
58
  "learning_rate": 4.10873440285205e-05,
59
+ "loss": 0.8231,
60
  "step": 1000
61
  },
62
  {
63
  "epoch": 5.35,
64
+ "eval_accuracy": 0.6310160427807486,
65
+ "eval_loss": 1.7959877252578735,
66
+ "eval_recall": 0.6310160427807486,
67
+ "eval_runtime": 10.15,
68
+ "eval_samples_per_second": 18.424,
69
+ "eval_steps_per_second": 4.631,
70
  "step": 1000
71
  },
72
  {
73
  "epoch": 6.42,
74
+ "eval_accuracy": 0.7005347593582888,
75
+ "eval_loss": 1.6884827613830566,
76
+ "eval_recall": 0.7005347593582888,
77
+ "eval_runtime": 10.222,
78
+ "eval_samples_per_second": 18.294,
79
+ "eval_steps_per_second": 4.598,
80
  "step": 1200
81
  },
82
  {
83
  "epoch": 7.49,
84
+ "eval_accuracy": 0.6203208556149733,
85
+ "eval_loss": 1.8338332176208496,
86
+ "eval_recall": 0.6203208556149733,
87
+ "eval_runtime": 10.15,
88
+ "eval_samples_per_second": 18.424,
89
+ "eval_steps_per_second": 4.631,
90
  "step": 1400
91
  },
92
  {
93
  "epoch": 8.02,
94
  "learning_rate": 3.6631016042780753e-05,
95
+ "loss": 0.5043,
96
  "step": 1500
97
  },
98
  {
99
  "epoch": 8.56,
100
+ "eval_accuracy": 0.6524064171122995,
101
+ "eval_loss": 1.8866851329803467,
102
+ "eval_recall": 0.6524064171122995,
103
+ "eval_runtime": 10.282,
104
+ "eval_samples_per_second": 18.187,
105
+ "eval_steps_per_second": 4.571,
106
  "step": 1600
107
  },
108
  {
109
  "epoch": 9.63,
110
+ "eval_accuracy": 0.6951871657754011,
111
+ "eval_loss": 1.6332286596298218,
112
+ "eval_recall": 0.6951871657754011,
113
+ "eval_runtime": 10.094,
114
+ "eval_samples_per_second": 18.526,
115
+ "eval_steps_per_second": 4.656,
116
  "step": 1800
117
  },
118
  {
119
  "epoch": 10.7,
120
  "learning_rate": 3.2174688057041004e-05,
121
+ "loss": 0.2426,
122
  "step": 2000
123
  },
124
  {
125
  "epoch": 10.7,
126
+ "eval_accuracy": 0.6631016042780749,
127
+ "eval_loss": 2.0470945835113525,
128
+ "eval_recall": 0.6631016042780749,
129
+ "eval_runtime": 10.46,
130
+ "eval_samples_per_second": 17.878,
131
+ "eval_steps_per_second": 4.493,
132
  "step": 2000
133
  },
134
  {
135
  "epoch": 11.76,
136
+ "eval_accuracy": 0.6684491978609626,
137
+ "eval_loss": 2.127241373062134,
138
+ "eval_recall": 0.6684491978609626,
139
+ "eval_runtime": 10.207,
140
+ "eval_samples_per_second": 18.321,
141
+ "eval_steps_per_second": 4.605,
142
  "step": 2200
143
  },
144
  {
145
  "epoch": 12.83,
146
+ "eval_accuracy": 0.7112299465240641,
147
+ "eval_loss": 2.163196563720703,
148
+ "eval_recall": 0.7112299465240641,
149
+ "eval_runtime": 10.211,
150
+ "eval_samples_per_second": 18.314,
151
+ "eval_steps_per_second": 4.603,
152
  "step": 2400
153
  },
154
  {
155
  "epoch": 13.37,
156
  "learning_rate": 2.7718360071301247e-05,
157
+ "loss": 0.1709,
158
  "step": 2500
159
  },
160
  {
161
  "epoch": 13.9,
162
+ "eval_accuracy": 0.679144385026738,
163
+ "eval_loss": 2.2403364181518555,
164
+ "eval_recall": 0.679144385026738,
165
+ "eval_runtime": 10.385,
166
+ "eval_samples_per_second": 18.007,
167
+ "eval_steps_per_second": 4.526,
168
  "step": 2600
169
  },
170
  {
171
  "epoch": 14.97,
172
+ "eval_accuracy": 0.6844919786096256,
173
+ "eval_loss": 2.3301198482513428,
174
+ "eval_recall": 0.6844919786096256,
175
+ "eval_runtime": 10.223,
176
+ "eval_samples_per_second": 18.292,
177
+ "eval_steps_per_second": 4.597,
178
  "step": 2800
179
  },
180
  {
181
  "epoch": 16.04,
182
  "learning_rate": 2.32620320855615e-05,
183
+ "loss": 0.1114,
184
  "step": 3000
185
  },
186
  {
187
  "epoch": 16.04,
188
+ "eval_accuracy": 0.6898395721925134,
189
+ "eval_loss": 2.3098907470703125,
190
+ "eval_recall": 0.6898395721925134,
191
+ "eval_runtime": 10.233,
192
+ "eval_samples_per_second": 18.274,
193
+ "eval_steps_per_second": 4.593,
194
  "step": 3000
195
  }
196
  ],