Ethan Sim committed on
Commit
68779bb
·
1 Parent(s): 7f220eb

update model with 1.0 safeguard

Browse files
checkpoint-72000/trainer_state.json CHANGED
@@ -18,9 +18,9 @@
18
  "eval_bleu": 42.2846,
19
  "eval_gen_len": 33.5896,
20
  "eval_loss": 0.0983600914478302,
21
- "eval_runtime": 122.9468,
22
- "eval_samples_per_second": 8.483,
23
- "eval_steps_per_second": 0.537,
24
  "step": 8000
25
  },
26
  {
@@ -34,9 +34,9 @@
34
  "eval_bleu": 42.1887,
35
  "eval_gen_len": 34.0508,
36
  "eval_loss": 0.097293421626091,
37
- "eval_runtime": 162.7475,
38
- "eval_samples_per_second": 6.409,
39
- "eval_steps_per_second": 0.406,
40
  "step": 16000
41
  },
42
  {
@@ -50,9 +50,9 @@
50
  "eval_bleu": 42.7367,
51
  "eval_gen_len": 33.7747,
52
  "eval_loss": 0.09722033143043518,
53
- "eval_runtime": 127.375,
54
- "eval_samples_per_second": 8.188,
55
- "eval_steps_per_second": 0.518,
56
  "step": 24000
57
  },
58
  {
@@ -66,9 +66,9 @@
66
  "eval_bleu": 42.9551,
67
  "eval_gen_len": 34.4238,
68
  "eval_loss": 0.0965743437409401,
69
- "eval_runtime": 120.0033,
70
- "eval_samples_per_second": 8.691,
71
- "eval_steps_per_second": 0.55,
72
  "step": 32000
73
  },
74
  {
@@ -82,9 +82,9 @@
82
  "eval_bleu": 42.7141,
83
  "eval_gen_len": 34.0872,
84
  "eval_loss": 0.09599015861749649,
85
- "eval_runtime": 144.0409,
86
- "eval_samples_per_second": 7.241,
87
- "eval_steps_per_second": 0.458,
88
  "step": 40000
89
  },
90
  {
@@ -98,9 +98,9 @@
98
  "eval_bleu": 42.4802,
99
  "eval_gen_len": 34.1266,
100
  "eval_loss": 0.09718813002109528,
101
- "eval_runtime": 121.2752,
102
- "eval_samples_per_second": 8.6,
103
- "eval_steps_per_second": 0.544,
104
  "step": 48000
105
  },
106
  {
@@ -114,9 +114,9 @@
114
  "eval_bleu": 42.6361,
115
  "eval_gen_len": 34.1045,
116
  "eval_loss": 0.0969875305891037,
117
- "eval_runtime": 137.2112,
118
- "eval_samples_per_second": 7.601,
119
- "eval_steps_per_second": 0.481,
120
  "step": 56000
121
  },
122
  {
@@ -130,9 +130,9 @@
130
  "eval_bleu": 42.8271,
131
  "eval_gen_len": 34.4851,
132
  "eval_loss": 0.09680665284395218,
133
- "eval_runtime": 134.8615,
134
- "eval_samples_per_second": 7.734,
135
- "eval_steps_per_second": 0.489,
136
  "step": 64000
137
  },
138
  {
@@ -146,9 +146,9 @@
146
  "eval_bleu": 42.9999,
147
  "eval_gen_len": 34.0671,
148
  "eval_loss": 0.09675087034702301,
149
- "eval_runtime": 110.3226,
150
- "eval_samples_per_second": 9.454,
151
- "eval_steps_per_second": 0.598,
152
  "step": 72000
153
  }
154
  ],
 
18
  "eval_bleu": 42.2846,
19
  "eval_gen_len": 33.5896,
20
  "eval_loss": 0.0983600914478302,
21
+ "eval_runtime": 125.1063,
22
+ "eval_samples_per_second": 8.337,
23
+ "eval_steps_per_second": 0.528,
24
  "step": 8000
25
  },
26
  {
 
34
  "eval_bleu": 42.1887,
35
  "eval_gen_len": 34.0508,
36
  "eval_loss": 0.097293421626091,
37
+ "eval_runtime": 165.8917,
38
+ "eval_samples_per_second": 6.287,
39
+ "eval_steps_per_second": 0.398,
40
  "step": 16000
41
  },
42
  {
 
50
  "eval_bleu": 42.7367,
51
  "eval_gen_len": 33.7747,
52
  "eval_loss": 0.09722033143043518,
53
+ "eval_runtime": 119.8443,
54
+ "eval_samples_per_second": 8.703,
55
+ "eval_steps_per_second": 0.551,
56
  "step": 24000
57
  },
58
  {
 
66
  "eval_bleu": 42.9551,
67
  "eval_gen_len": 34.4238,
68
  "eval_loss": 0.0965743437409401,
69
+ "eval_runtime": 122.2105,
70
+ "eval_samples_per_second": 8.534,
71
+ "eval_steps_per_second": 0.54,
72
  "step": 32000
73
  },
74
  {
 
82
  "eval_bleu": 42.7141,
83
  "eval_gen_len": 34.0872,
84
  "eval_loss": 0.09599015861749649,
85
+ "eval_runtime": 147.1092,
86
+ "eval_samples_per_second": 7.09,
87
+ "eval_steps_per_second": 0.449,
88
  "step": 40000
89
  },
90
  {
 
98
  "eval_bleu": 42.4802,
99
  "eval_gen_len": 34.1266,
100
  "eval_loss": 0.09718813002109528,
101
+ "eval_runtime": 126.9046,
102
+ "eval_samples_per_second": 8.219,
103
+ "eval_steps_per_second": 0.52,
104
  "step": 48000
105
  },
106
  {
 
114
  "eval_bleu": 42.6361,
115
  "eval_gen_len": 34.1045,
116
  "eval_loss": 0.0969875305891037,
117
+ "eval_runtime": 144.8881,
118
+ "eval_samples_per_second": 7.199,
119
+ "eval_steps_per_second": 0.456,
120
  "step": 56000
121
  },
122
  {
 
130
  "eval_bleu": 42.8271,
131
  "eval_gen_len": 34.4851,
132
  "eval_loss": 0.09680665284395218,
133
+ "eval_runtime": 136.6783,
134
+ "eval_samples_per_second": 7.631,
135
+ "eval_steps_per_second": 0.483,
136
  "step": 64000
137
  },
138
  {
 
146
  "eval_bleu": 42.9999,
147
  "eval_gen_len": 34.0671,
148
  "eval_loss": 0.09675087034702301,
149
+ "eval_runtime": 115.9998,
150
+ "eval_samples_per_second": 8.991,
151
+ "eval_steps_per_second": 0.569,
152
  "step": 72000
153
  }
154
  ],
checkpoint-72000/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6cf5ee38f2194704c244e5c80610b2c3775d2eb9a6a936f61d49a9795e266a86
3
  size 3771
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edf2021650916951d996ad74978de6ba9cbe3e25bd074e8ad6124d4670a0477b
3
  size 3771
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6cf5ee38f2194704c244e5c80610b2c3775d2eb9a6a936f61d49a9795e266a86
3
  size 3771
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edf2021650916951d996ad74978de6ba9cbe3e25bd074e8ad6124d4670a0477b
3
  size 3771