Ethan Sim committed on
Commit
63006ec
·
1 Parent(s): f2fe26d

update model with 1.0 safeguard

Browse files
checkpoint-48000/trainer_state.json CHANGED
@@ -18,7 +18,7 @@
18
  "eval_bleu": 35.1474,
19
  "eval_gen_len": 40.395,
20
  "eval_loss": 0.10896337777376175,
21
- "eval_runtime": 179.3655,
22
  "eval_samples_per_second": 5.815,
23
  "eval_steps_per_second": 0.184,
24
  "step": 4000
@@ -34,9 +34,9 @@
34
  "eval_bleu": 41.0648,
35
  "eval_gen_len": 34.5983,
36
  "eval_loss": 0.10649073868989944,
37
- "eval_runtime": 166.3848,
38
- "eval_samples_per_second": 6.269,
39
- "eval_steps_per_second": 0.198,
40
  "step": 8000
41
  },
42
  {
@@ -50,8 +50,8 @@
50
  "eval_bleu": 41.4064,
51
  "eval_gen_len": 34.4353,
52
  "eval_loss": 0.10525061935186386,
53
- "eval_runtime": 157.1928,
54
- "eval_samples_per_second": 6.635,
55
  "eval_steps_per_second": 0.21,
56
  "step": 12000
57
  },
@@ -66,9 +66,9 @@
66
  "eval_bleu": 40.6981,
67
  "eval_gen_len": 36.0038,
68
  "eval_loss": 0.10416892915964127,
69
- "eval_runtime": 135.6043,
70
- "eval_samples_per_second": 7.691,
71
- "eval_steps_per_second": 0.243,
72
  "step": 16000
73
  },
74
  {
@@ -82,9 +82,9 @@
82
  "eval_bleu": 41.7673,
83
  "eval_gen_len": 35.4631,
84
  "eval_loss": 0.10361550748348236,
85
- "eval_runtime": 156.992,
86
- "eval_samples_per_second": 6.644,
87
- "eval_steps_per_second": 0.21,
88
  "step": 20000
89
  },
90
  {
@@ -98,9 +98,9 @@
98
  "eval_bleu": 41.5766,
99
  "eval_gen_len": 35.7536,
100
  "eval_loss": 0.10351266711950302,
101
- "eval_runtime": 148.1282,
102
- "eval_samples_per_second": 7.041,
103
- "eval_steps_per_second": 0.223,
104
  "step": 24000
105
  },
106
  {
@@ -114,9 +114,9 @@
114
  "eval_bleu": 41.2765,
115
  "eval_gen_len": 35.535,
116
  "eval_loss": 0.10269948095083237,
117
- "eval_runtime": 139.1706,
118
- "eval_samples_per_second": 7.494,
119
- "eval_steps_per_second": 0.237,
120
  "step": 28000
121
  },
122
  {
@@ -130,9 +130,9 @@
130
  "eval_bleu": 42.0634,
131
  "eval_gen_len": 34.8495,
132
  "eval_loss": 0.10216742753982544,
133
- "eval_runtime": 138.1687,
134
- "eval_samples_per_second": 7.549,
135
- "eval_steps_per_second": 0.239,
136
  "step": 32000
137
  },
138
  {
@@ -146,9 +146,9 @@
146
  "eval_bleu": 41.2763,
147
  "eval_gen_len": 36.139,
148
  "eval_loss": 0.10178232192993164,
149
- "eval_runtime": 118.4305,
150
- "eval_samples_per_second": 8.807,
151
- "eval_steps_per_second": 0.279,
152
  "step": 36000
153
  },
154
  {
@@ -162,9 +162,9 @@
162
  "eval_bleu": 42.3991,
163
  "eval_gen_len": 34.4545,
164
  "eval_loss": 0.10192298889160156,
165
- "eval_runtime": 120.2656,
166
- "eval_samples_per_second": 8.672,
167
- "eval_steps_per_second": 0.274,
168
  "step": 40000
169
  },
170
  {
@@ -178,9 +178,9 @@
178
  "eval_bleu": 42.1688,
179
  "eval_gen_len": 35.3145,
180
  "eval_loss": 0.1022704690694809,
181
- "eval_runtime": 137.0088,
182
- "eval_samples_per_second": 7.613,
183
- "eval_steps_per_second": 0.241,
184
  "step": 44000
185
  },
186
  {
@@ -194,9 +194,9 @@
194
  "eval_bleu": 42.5638,
195
  "eval_gen_len": 35.0738,
196
  "eval_loss": 0.10206188261508942,
197
- "eval_runtime": 129.6219,
198
- "eval_samples_per_second": 8.046,
199
- "eval_steps_per_second": 0.255,
200
  "step": 48000
201
  }
202
  ],
 
18
  "eval_bleu": 35.1474,
19
  "eval_gen_len": 40.395,
20
  "eval_loss": 0.10896337777376175,
21
+ "eval_runtime": 179.3484,
22
  "eval_samples_per_second": 5.815,
23
  "eval_steps_per_second": 0.184,
24
  "step": 4000
 
34
  "eval_bleu": 41.0648,
35
  "eval_gen_len": 34.5983,
36
  "eval_loss": 0.10649073868989944,
37
+ "eval_runtime": 171.3066,
38
+ "eval_samples_per_second": 6.088,
39
+ "eval_steps_per_second": 0.193,
40
  "step": 8000
41
  },
42
  {
 
50
  "eval_bleu": 41.4064,
51
  "eval_gen_len": 34.4353,
52
  "eval_loss": 0.10525061935186386,
53
+ "eval_runtime": 156.772,
54
+ "eval_samples_per_second": 6.653,
55
  "eval_steps_per_second": 0.21,
56
  "step": 12000
57
  },
 
66
  "eval_bleu": 40.6981,
67
  "eval_gen_len": 36.0038,
68
  "eval_loss": 0.10416892915964127,
69
+ "eval_runtime": 133.8567,
70
+ "eval_samples_per_second": 7.792,
71
+ "eval_steps_per_second": 0.247,
72
  "step": 16000
73
  },
74
  {
 
82
  "eval_bleu": 41.7673,
83
  "eval_gen_len": 35.4631,
84
  "eval_loss": 0.10361550748348236,
85
+ "eval_runtime": 154.8814,
86
+ "eval_samples_per_second": 6.734,
87
+ "eval_steps_per_second": 0.213,
88
  "step": 20000
89
  },
90
  {
 
98
  "eval_bleu": 41.5766,
99
  "eval_gen_len": 35.7536,
100
  "eval_loss": 0.10351266711950302,
101
+ "eval_runtime": 152.4909,
102
+ "eval_samples_per_second": 6.84,
103
+ "eval_steps_per_second": 0.216,
104
  "step": 24000
105
  },
106
  {
 
114
  "eval_bleu": 41.2765,
115
  "eval_gen_len": 35.535,
116
  "eval_loss": 0.10269948095083237,
117
+ "eval_runtime": 132.6943,
118
+ "eval_samples_per_second": 7.86,
119
+ "eval_steps_per_second": 0.249,
120
  "step": 28000
121
  },
122
  {
 
130
  "eval_bleu": 42.0634,
131
  "eval_gen_len": 34.8495,
132
  "eval_loss": 0.10216742753982544,
133
+ "eval_runtime": 141.3815,
134
+ "eval_samples_per_second": 7.377,
135
+ "eval_steps_per_second": 0.233,
136
  "step": 32000
137
  },
138
  {
 
146
  "eval_bleu": 41.2763,
147
  "eval_gen_len": 36.139,
148
  "eval_loss": 0.10178232192993164,
149
+ "eval_runtime": 121.485,
150
+ "eval_samples_per_second": 8.585,
151
+ "eval_steps_per_second": 0.272,
152
  "step": 36000
153
  },
154
  {
 
162
  "eval_bleu": 42.3991,
163
  "eval_gen_len": 34.4545,
164
  "eval_loss": 0.10192298889160156,
165
+ "eval_runtime": 118.8523,
166
+ "eval_samples_per_second": 8.776,
167
+ "eval_steps_per_second": 0.278,
168
  "step": 40000
169
  },
170
  {
 
178
  "eval_bleu": 42.1688,
179
  "eval_gen_len": 35.3145,
180
  "eval_loss": 0.1022704690694809,
181
+ "eval_runtime": 139.2542,
182
+ "eval_samples_per_second": 7.49,
183
+ "eval_steps_per_second": 0.237,
184
  "step": 44000
185
  },
186
  {
 
194
  "eval_bleu": 42.5638,
195
  "eval_gen_len": 35.0738,
196
  "eval_loss": 0.10206188261508942,
197
+ "eval_runtime": 135.8728,
198
+ "eval_samples_per_second": 7.676,
199
+ "eval_steps_per_second": 0.243,
200
  "step": 48000
201
  }
202
  ],
checkpoint-48000/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ceb79d8b854e02ccc5795cd91b8ba49e36367cb01aa95d1a05db465648548b6b
3
  size 3771
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06045bfca8d45b2ad5c21bc2afdbfa7788b5223a9722cafa595fbbe472e272c9
3
  size 3771
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ceb79d8b854e02ccc5795cd91b8ba49e36367cb01aa95d1a05db465648548b6b
3
  size 3771
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06045bfca8d45b2ad5c21bc2afdbfa7788b5223a9722cafa595fbbe472e272c9
3
  size 3771