Ethan Sim committed on
Commit
d573def
·
1 Parent(s): 9bf9920

update model with 1.0 safeguard

Browse files
checkpoint-80000/trainer_state.json CHANGED
@@ -18,9 +18,9 @@
18
  "eval_bleu": 42.2846,
19
  "eval_gen_len": 33.9099,
20
  "eval_loss": 0.09808671474456787,
21
- "eval_runtime": 101.3103,
22
- "eval_samples_per_second": 10.295,
23
- "eval_steps_per_second": 0.651,
24
  "step": 8000
25
  },
26
  {
@@ -34,9 +34,9 @@
34
  "eval_bleu": 42.5263,
35
  "eval_gen_len": 33.9847,
36
  "eval_loss": 0.09837382286787033,
37
- "eval_runtime": 88.4642,
38
- "eval_samples_per_second": 11.79,
39
- "eval_steps_per_second": 0.746,
40
  "step": 16000
41
  },
42
  {
@@ -50,9 +50,9 @@
50
  "eval_bleu": 42.8007,
51
  "eval_gen_len": 34.2359,
52
  "eval_loss": 0.09744028747081757,
53
- "eval_runtime": 94.3167,
54
- "eval_samples_per_second": 11.058,
55
- "eval_steps_per_second": 0.7,
56
  "step": 24000
57
  },
58
  {
@@ -66,9 +66,9 @@
66
  "eval_bleu": 42.7644,
67
  "eval_gen_len": 34.2148,
68
  "eval_loss": 0.09636388719081879,
69
- "eval_runtime": 100.6778,
70
- "eval_samples_per_second": 10.36,
71
- "eval_steps_per_second": 0.656,
72
  "step": 32000
73
  },
74
  {
@@ -82,9 +82,9 @@
82
  "eval_bleu": 42.9411,
83
  "eval_gen_len": 34.6865,
84
  "eval_loss": 0.09594809263944626,
85
- "eval_runtime": 99.5677,
86
- "eval_samples_per_second": 10.475,
87
- "eval_steps_per_second": 0.663,
88
  "step": 40000
89
  },
90
  {
@@ -98,9 +98,9 @@
98
  "eval_bleu": 42.8809,
99
  "eval_gen_len": 34.4324,
100
  "eval_loss": 0.0971299335360527,
101
- "eval_runtime": 179.2147,
102
- "eval_samples_per_second": 5.82,
103
- "eval_steps_per_second": 0.368,
104
  "step": 48000
105
  },
106
  {
@@ -114,9 +114,9 @@
114
  "eval_bleu": 42.9581,
115
  "eval_gen_len": 33.6337,
116
  "eval_loss": 0.09666970372200012,
117
- "eval_runtime": 81.2036,
118
- "eval_samples_per_second": 12.844,
119
- "eval_steps_per_second": 0.813,
120
  "step": 56000
121
  },
122
  {
@@ -130,9 +130,9 @@
130
  "eval_bleu": 42.1891,
131
  "eval_gen_len": 35.0201,
132
  "eval_loss": 0.09686268866062164,
133
- "eval_runtime": 100.7692,
134
- "eval_samples_per_second": 10.35,
135
- "eval_steps_per_second": 0.655,
136
  "step": 64000
137
  },
138
  {
@@ -146,9 +146,9 @@
146
  "eval_bleu": 42.9143,
147
  "eval_gen_len": 34.2848,
148
  "eval_loss": 0.09685871005058289,
149
- "eval_runtime": 87.4036,
150
- "eval_samples_per_second": 11.933,
151
- "eval_steps_per_second": 0.755,
152
  "step": 72000
153
  },
154
  {
@@ -162,9 +162,9 @@
162
  "eval_bleu": 43.1757,
163
  "eval_gen_len": 34.069,
164
  "eval_loss": 0.09636421501636505,
165
- "eval_runtime": 99.9416,
166
- "eval_samples_per_second": 10.436,
167
- "eval_steps_per_second": 0.66,
168
  "step": 80000
169
  }
170
  ],
 
18
  "eval_bleu": 42.2846,
19
  "eval_gen_len": 33.9099,
20
  "eval_loss": 0.09808671474456787,
21
+ "eval_runtime": 123.0699,
22
+ "eval_samples_per_second": 8.475,
23
+ "eval_steps_per_second": 0.536,
24
  "step": 8000
25
  },
26
  {
 
34
  "eval_bleu": 42.5263,
35
  "eval_gen_len": 33.9847,
36
  "eval_loss": 0.09837382286787033,
37
+ "eval_runtime": 110.1526,
38
+ "eval_samples_per_second": 9.469,
39
+ "eval_steps_per_second": 0.599,
40
  "step": 16000
41
  },
42
  {
 
50
  "eval_bleu": 42.8007,
51
  "eval_gen_len": 34.2359,
52
  "eval_loss": 0.09744028747081757,
53
+ "eval_runtime": 120.3105,
54
+ "eval_samples_per_second": 8.669,
55
+ "eval_steps_per_second": 0.549,
56
  "step": 24000
57
  },
58
  {
 
66
  "eval_bleu": 42.7644,
67
  "eval_gen_len": 34.2148,
68
  "eval_loss": 0.09636388719081879,
69
+ "eval_runtime": 124.8267,
70
+ "eval_samples_per_second": 8.356,
71
+ "eval_steps_per_second": 0.529,
72
  "step": 32000
73
  },
74
  {
 
82
  "eval_bleu": 42.9411,
83
  "eval_gen_len": 34.6865,
84
  "eval_loss": 0.09594809263944626,
85
+ "eval_runtime": 124.3057,
86
+ "eval_samples_per_second": 8.391,
87
+ "eval_steps_per_second": 0.531,
88
  "step": 40000
89
  },
90
  {
 
98
  "eval_bleu": 42.8809,
99
  "eval_gen_len": 34.4324,
100
  "eval_loss": 0.0971299335360527,
101
+ "eval_runtime": 209.1935,
102
+ "eval_samples_per_second": 4.986,
103
+ "eval_steps_per_second": 0.315,
104
  "step": 48000
105
  },
106
  {
 
114
  "eval_bleu": 42.9581,
115
  "eval_gen_len": 33.6337,
116
  "eval_loss": 0.09666970372200012,
117
+ "eval_runtime": 110.1198,
118
+ "eval_samples_per_second": 9.472,
119
+ "eval_steps_per_second": 0.599,
120
  "step": 56000
121
  },
122
  {
 
130
  "eval_bleu": 42.1891,
131
  "eval_gen_len": 35.0201,
132
  "eval_loss": 0.09686268866062164,
133
+ "eval_runtime": 132.6946,
134
+ "eval_samples_per_second": 7.86,
135
+ "eval_steps_per_second": 0.497,
136
  "step": 64000
137
  },
138
  {
 
146
  "eval_bleu": 42.9143,
147
  "eval_gen_len": 34.2848,
148
  "eval_loss": 0.09685871005058289,
149
+ "eval_runtime": 122.6555,
150
+ "eval_samples_per_second": 8.503,
151
+ "eval_steps_per_second": 0.538,
152
  "step": 72000
153
  },
154
  {
 
162
  "eval_bleu": 43.1757,
163
  "eval_gen_len": 34.069,
164
  "eval_loss": 0.09636421501636505,
165
+ "eval_runtime": 134.8008,
166
+ "eval_samples_per_second": 7.737,
167
+ "eval_steps_per_second": 0.49,
168
  "step": 80000
169
  }
170
  ],
checkpoint-80000/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:43072ea1f24ed9e4a40c898646c5b77ad1d5b8b7d2837ca1fab5fc4630684483
3
  size 3771
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10a31b74ed572f8ade9b00d1da9ed683d8a211c467ee888717946580b2cae4f3
3
  size 3771
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:43072ea1f24ed9e4a40c898646c5b77ad1d5b8b7d2837ca1fab5fc4630684483
3
  size 3771
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10a31b74ed572f8ade9b00d1da9ed683d8a211c467ee888717946580b2cae4f3
3
  size 3771