fpadovani committed on
Commit
06c4c19
·
verified ·
1 Parent(s): 7d341d8

Training in progress, step 4000, checkpoint

Browse files
checkpoint-4000/trainer_state.json CHANGED
@@ -26,9 +26,9 @@
26
  {
27
  "epoch": 1.0,
28
  "eval_loss": 6.317445755004883,
29
- "eval_runtime": 19.2809,
30
- "eval_samples_per_second": 1306.732,
31
- "eval_steps_per_second": 5.135,
32
  "step": 392
33
  },
34
  {
@@ -41,9 +41,9 @@
41
  {
42
  "epoch": 2.0,
43
  "eval_loss": 6.024065017700195,
44
- "eval_runtime": 19.3681,
45
- "eval_samples_per_second": 1300.85,
46
- "eval_steps_per_second": 5.111,
47
  "step": 784
48
  },
49
  {
@@ -56,9 +56,9 @@
56
  {
57
  "epoch": 3.0,
58
  "eval_loss": 5.884053707122803,
59
- "eval_runtime": 19.3497,
60
- "eval_samples_per_second": 1302.088,
61
- "eval_steps_per_second": 5.116,
62
  "step": 1176
63
  },
64
  {
@@ -71,9 +71,9 @@
71
  {
72
  "epoch": 4.0,
73
  "eval_loss": 5.788422584533691,
74
- "eval_runtime": 19.3355,
75
- "eval_samples_per_second": 1303.047,
76
- "eval_steps_per_second": 5.12,
77
  "step": 1568
78
  },
79
  {
@@ -86,9 +86,9 @@
86
  {
87
  "epoch": 5.0,
88
  "eval_loss": 5.718640327453613,
89
- "eval_runtime": 19.1626,
90
- "eval_samples_per_second": 1314.803,
91
- "eval_steps_per_second": 5.166,
92
  "step": 1960
93
  },
94
  {
@@ -101,9 +101,9 @@
101
  {
102
  "epoch": 6.0,
103
  "eval_loss": 5.6633148193359375,
104
- "eval_runtime": 19.4816,
105
- "eval_samples_per_second": 1293.269,
106
- "eval_steps_per_second": 5.082,
107
  "step": 2352
108
  },
109
  {
@@ -116,9 +116,9 @@
116
  {
117
  "epoch": 7.0,
118
  "eval_loss": 5.620563507080078,
119
- "eval_runtime": 19.2806,
120
- "eval_samples_per_second": 1306.752,
121
- "eval_steps_per_second": 5.135,
122
  "step": 2744
123
  },
124
  {
@@ -131,9 +131,9 @@
131
  {
132
  "epoch": 8.0,
133
  "eval_loss": 5.586855888366699,
134
- "eval_runtime": 19.2672,
135
- "eval_samples_per_second": 1307.661,
136
- "eval_steps_per_second": 5.138,
137
  "step": 3136
138
  },
139
  {
@@ -146,9 +146,9 @@
146
  {
147
  "epoch": 9.0,
148
  "eval_loss": 5.562436580657959,
149
- "eval_runtime": 19.4007,
150
- "eval_samples_per_second": 1298.665,
151
- "eval_steps_per_second": 5.103,
152
  "step": 3528
153
  },
154
  {
@@ -161,9 +161,9 @@
161
  {
162
  "epoch": 10.0,
163
  "eval_loss": 5.544801235198975,
164
- "eval_runtime": 19.3033,
165
- "eval_samples_per_second": 1305.215,
166
- "eval_steps_per_second": 5.129,
167
  "step": 3920
168
  }
169
  ],
 
26
  {
27
  "epoch": 1.0,
28
  "eval_loss": 6.317445755004883,
29
+ "eval_runtime": 15.5824,
30
+ "eval_samples_per_second": 1616.887,
31
+ "eval_steps_per_second": 6.353,
32
  "step": 392
33
  },
34
  {
 
41
  {
42
  "epoch": 2.0,
43
  "eval_loss": 6.024065017700195,
44
+ "eval_runtime": 15.5591,
45
+ "eval_samples_per_second": 1619.314,
46
+ "eval_steps_per_second": 6.363,
47
  "step": 784
48
  },
49
  {
 
56
  {
57
  "epoch": 3.0,
58
  "eval_loss": 5.884053707122803,
59
+ "eval_runtime": 15.6179,
60
+ "eval_samples_per_second": 1613.212,
61
+ "eval_steps_per_second": 6.339,
62
  "step": 1176
63
  },
64
  {
 
71
  {
72
  "epoch": 4.0,
73
  "eval_loss": 5.788422584533691,
74
+ "eval_runtime": 15.5176,
75
+ "eval_samples_per_second": 1623.64,
76
+ "eval_steps_per_second": 6.38,
77
  "step": 1568
78
  },
79
  {
 
86
  {
87
  "epoch": 5.0,
88
  "eval_loss": 5.718640327453613,
89
+ "eval_runtime": 15.5828,
90
+ "eval_samples_per_second": 1616.851,
91
+ "eval_steps_per_second": 6.353,
92
  "step": 1960
93
  },
94
  {
 
101
  {
102
  "epoch": 6.0,
103
  "eval_loss": 5.6633148193359375,
104
+ "eval_runtime": 15.6437,
105
+ "eval_samples_per_second": 1610.551,
106
+ "eval_steps_per_second": 6.328,
107
  "step": 2352
108
  },
109
  {
 
116
  {
117
  "epoch": 7.0,
118
  "eval_loss": 5.620563507080078,
119
+ "eval_runtime": 15.5999,
120
+ "eval_samples_per_second": 1615.079,
121
+ "eval_steps_per_second": 6.346,
122
  "step": 2744
123
  },
124
  {
 
131
  {
132
  "epoch": 8.0,
133
  "eval_loss": 5.586855888366699,
134
+ "eval_runtime": 15.6428,
135
+ "eval_samples_per_second": 1610.644,
136
+ "eval_steps_per_second": 6.329,
137
  "step": 3136
138
  },
139
  {
 
146
  {
147
  "epoch": 9.0,
148
  "eval_loss": 5.562436580657959,
149
+ "eval_runtime": 15.5065,
150
+ "eval_samples_per_second": 1624.806,
151
+ "eval_steps_per_second": 6.384,
152
  "step": 3528
153
  },
154
  {
 
161
  {
162
  "epoch": 10.0,
163
  "eval_loss": 5.544801235198975,
164
+ "eval_runtime": 15.5961,
165
+ "eval_samples_per_second": 1615.463,
166
+ "eval_steps_per_second": 6.348,
167
  "step": 3920
168
  }
169
  ],
checkpoint-4000/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3aa067acc804b79ea56c8830addc6a7dc795994309c286a45aeb17ddcc8ec159
3
  size 5905
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52cf954a78a3d6fc682ff0c3b6ee4cda69040297e62c644ea0256038484a747a
3
  size 5905