Ethan Sim committed on
Commit
4895dae
·
1 Parent(s): 7d0ac24

update model with 1.0 safeguard

Browse files
checkpoint-80000/trainer_state.json CHANGED
@@ -18,9 +18,9 @@
18
  "eval_bleu": 42.1115,
19
  "eval_gen_len": 33.8782,
20
  "eval_loss": 0.09834092110395432,
21
- "eval_runtime": 133.0059,
22
- "eval_samples_per_second": 7.842,
23
- "eval_steps_per_second": 0.496,
24
  "step": 8000
25
  },
26
  {
@@ -34,9 +34,9 @@
34
  "eval_bleu": 42.5044,
35
  "eval_gen_len": 34.0422,
36
  "eval_loss": 0.09755747765302658,
37
- "eval_runtime": 123.2199,
38
- "eval_samples_per_second": 8.465,
39
- "eval_steps_per_second": 0.536,
40
  "step": 16000
41
  },
42
  {
@@ -50,9 +50,9 @@
50
  "eval_bleu": 42.1738,
51
  "eval_gen_len": 33.3921,
52
  "eval_loss": 0.09764789789915085,
53
- "eval_runtime": 135.8363,
54
- "eval_samples_per_second": 7.678,
55
- "eval_steps_per_second": 0.486,
56
  "step": 24000
57
  },
58
  {
@@ -66,9 +66,9 @@
66
  "eval_bleu": 42.6761,
67
  "eval_gen_len": 33.8092,
68
  "eval_loss": 0.09669991582632065,
69
- "eval_runtime": 112.788,
70
- "eval_samples_per_second": 9.247,
71
- "eval_steps_per_second": 0.585,
72
  "step": 32000
73
  },
74
  {
@@ -82,9 +82,9 @@
82
  "eval_bleu": 42.5089,
83
  "eval_gen_len": 33.814,
84
  "eval_loss": 0.09582150727510452,
85
- "eval_runtime": 113.7375,
86
- "eval_samples_per_second": 9.17,
87
- "eval_steps_per_second": 0.58,
88
  "step": 40000
89
  },
90
  {
@@ -98,9 +98,9 @@
98
  "eval_bleu": 42.6428,
99
  "eval_gen_len": 33.954,
100
  "eval_loss": 0.09729909896850586,
101
- "eval_runtime": 111.2244,
102
- "eval_samples_per_second": 9.377,
103
- "eval_steps_per_second": 0.593,
104
  "step": 48000
105
  },
106
  {
@@ -114,9 +114,9 @@
114
  "eval_bleu": 42.5021,
115
  "eval_gen_len": 33.7661,
116
  "eval_loss": 0.09766314178705215,
117
- "eval_runtime": 149.7488,
118
- "eval_samples_per_second": 6.965,
119
- "eval_steps_per_second": 0.441,
120
  "step": 56000
121
  },
122
  {
@@ -130,9 +130,9 @@
130
  "eval_bleu": 42.8416,
131
  "eval_gen_len": 33.999,
132
  "eval_loss": 0.09677453339099884,
133
- "eval_runtime": 156.1922,
134
- "eval_samples_per_second": 6.678,
135
- "eval_steps_per_second": 0.423,
136
  "step": 64000
137
  },
138
  {
@@ -146,9 +146,9 @@
146
  "eval_bleu": 42.797,
147
  "eval_gen_len": 34.5053,
148
  "eval_loss": 0.09712178260087967,
149
- "eval_runtime": 127.7296,
150
- "eval_samples_per_second": 8.166,
151
- "eval_steps_per_second": 0.517,
152
  "step": 72000
153
  },
154
  {
@@ -162,9 +162,9 @@
162
  "eval_bleu": 43.3155,
163
  "eval_gen_len": 34.0355,
164
  "eval_loss": 0.09631923586130142,
165
- "eval_runtime": 125.7048,
166
- "eval_samples_per_second": 8.297,
167
- "eval_steps_per_second": 0.525,
168
  "step": 80000
169
  }
170
  ],
 
18
  "eval_bleu": 42.1115,
19
  "eval_gen_len": 33.8782,
20
  "eval_loss": 0.09834092110395432,
21
+ "eval_runtime": 120.1201,
22
+ "eval_samples_per_second": 8.683,
23
+ "eval_steps_per_second": 0.549,
24
  "step": 8000
25
  },
26
  {
 
34
  "eval_bleu": 42.5044,
35
  "eval_gen_len": 34.0422,
36
  "eval_loss": 0.09755747765302658,
37
+ "eval_runtime": 108.595,
38
+ "eval_samples_per_second": 9.604,
39
+ "eval_steps_per_second": 0.608,
40
  "step": 16000
41
  },
42
  {
 
50
  "eval_bleu": 42.1738,
51
  "eval_gen_len": 33.3921,
52
  "eval_loss": 0.09764789789915085,
53
+ "eval_runtime": 129.8931,
54
+ "eval_samples_per_second": 8.03,
55
+ "eval_steps_per_second": 0.508,
56
  "step": 24000
57
  },
58
  {
 
66
  "eval_bleu": 42.6761,
67
  "eval_gen_len": 33.8092,
68
  "eval_loss": 0.09669991582632065,
69
+ "eval_runtime": 115.0248,
70
+ "eval_samples_per_second": 9.068,
71
+ "eval_steps_per_second": 0.574,
72
  "step": 32000
73
  },
74
  {
 
82
  "eval_bleu": 42.5089,
83
  "eval_gen_len": 33.814,
84
  "eval_loss": 0.09582150727510452,
85
+ "eval_runtime": 115.0911,
86
+ "eval_samples_per_second": 9.062,
87
+ "eval_steps_per_second": 0.573,
88
  "step": 40000
89
  },
90
  {
 
98
  "eval_bleu": 42.6428,
99
  "eval_gen_len": 33.954,
100
  "eval_loss": 0.09729909896850586,
101
+ "eval_runtime": 116.307,
102
+ "eval_samples_per_second": 8.968,
103
+ "eval_steps_per_second": 0.567,
104
  "step": 48000
105
  },
106
  {
 
114
  "eval_bleu": 42.5021,
115
  "eval_gen_len": 33.7661,
116
  "eval_loss": 0.09766314178705215,
117
+ "eval_runtime": 141.066,
118
+ "eval_samples_per_second": 7.394,
119
+ "eval_steps_per_second": 0.468,
120
  "step": 56000
121
  },
122
  {
 
130
  "eval_bleu": 42.8416,
131
  "eval_gen_len": 33.999,
132
  "eval_loss": 0.09677453339099884,
133
+ "eval_runtime": 152.4751,
134
+ "eval_samples_per_second": 6.84,
135
+ "eval_steps_per_second": 0.433,
136
  "step": 64000
137
  },
138
  {
 
146
  "eval_bleu": 42.797,
147
  "eval_gen_len": 34.5053,
148
  "eval_loss": 0.09712178260087967,
149
+ "eval_runtime": 129.5634,
150
+ "eval_samples_per_second": 8.05,
151
+ "eval_steps_per_second": 0.509,
152
  "step": 72000
153
  },
154
  {
 
162
  "eval_bleu": 43.3155,
163
  "eval_gen_len": 34.0355,
164
  "eval_loss": 0.09631923586130142,
165
+ "eval_runtime": 129.8003,
166
+ "eval_samples_per_second": 8.035,
167
+ "eval_steps_per_second": 0.508,
168
  "step": 80000
169
  }
170
  ],
checkpoint-80000/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d7754c0c1d221803f1ec03c42c8ec824faf828e5ad475618050f1176fed7e195
3
  size 3771
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0525360cd05bfbdd2df5f26e0857e71611200a70f3433da967d91c1e94623987
3
  size 3771
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d7754c0c1d221803f1ec03c42c8ec824faf828e5ad475618050f1176fed7e195
3
  size 3771
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0525360cd05bfbdd2df5f26e0857e71611200a70f3433da967d91c1e94623987
3
  size 3771