k4black commited on
Commit
e292caa
·
1 Parent(s): 36a62b7

Training in progress, step 6000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:988ee46c408a07b7a0fad4b1c0ff670aad8799b9b267896a4244fcdba18e552b
3
  size 484047087
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51b192a7b70db1934dba0f9d9a34e18e69ec65f39168a14efeb68bab0d415c94
3
  size 484047087
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:25580c636627541ce14bdc779eade94125dc6177b2aa83645d2ef2395daaa273
3
  size 242012923
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5491c1eb83ad0255fa2195ad3d2057886c2ddfe459b2d0d86d130dd460f2c126
3
  size 242012923
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0b5119b201c0c8ce8aa50d2ab24369c5098c578a46726686f668686b71cefedc
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da5f59398b256310b16e5b8660f3abc262dd46e94f7c4ef1ca2deb4421e45807
3
  size 14503
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1adf8adfe4057346d099df92e326b1ad5fa2d44a51313442fb1c361bdd9899b0
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40cdf027dfcd88dd0425eb5ed9a78e9f857bde345f0e7a339091c24672288322
3
  size 559
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ec642b785cc0a9d07d3c78d3a67e22851ce9b6c0ecba48c9d62722bf933255a
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48a2bf23ad9a52f893b5c83c2acdf47455196bb0c79c1006037401a5216124d5
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 0.7792329788208008,
3
- "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-adamw/checkpoint-5500",
4
- "epoch": 1.76,
5
- "global_step": 5500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -226,11 +226,31 @@
226
  "eval_samples_per_second": 75.808,
227
  "eval_steps_per_second": 2.388,
228
  "step": 5500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
229
  }
230
  ],
231
  "max_steps": 31250,
232
  "num_train_epochs": 10,
233
- "total_flos": 2.340678090306355e+16,
234
  "trial_name": null,
235
  "trial_params": null
236
  }
 
1
  {
2
+ "best_metric": 0.7785006165504456,
3
+ "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-adamw/checkpoint-6000",
4
+ "epoch": 1.92,
5
+ "global_step": 6000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
226
  "eval_samples_per_second": 75.808,
227
  "eval_steps_per_second": 2.388,
228
  "step": 5500
229
+ },
230
+ {
231
+ "epoch": 1.92,
232
+ "learning_rate": 8.507090645737192e-05,
233
+ "loss": 0.5956,
234
+ "step": 6000
235
+ },
236
+ {
237
+ "epoch": 1.92,
238
+ "eval_bleu": 0.129401969984806,
239
+ "eval_exact_match": 0.1605,
240
+ "eval_loss": 0.7785006165504456,
241
+ "eval_rouge1": 0.5640650180352025,
242
+ "eval_rouge2": 0.39806305672301234,
243
+ "eval_rougeL": 0.5469935550994057,
244
+ "eval_rougeLsum": 0.554556710156975,
245
+ "eval_runtime": 27.3051,
246
+ "eval_samples_per_second": 73.246,
247
+ "eval_steps_per_second": 2.307,
248
+ "step": 6000
249
  }
250
  ],
251
  "max_steps": 31250,
252
  "num_train_epochs": 10,
253
+ "total_flos": 2.5532806050349056e+16,
254
  "trial_name": null,
255
  "trial_params": null
256
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:25580c636627541ce14bdc779eade94125dc6177b2aa83645d2ef2395daaa273
3
  size 242012923
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5491c1eb83ad0255fa2195ad3d2057886c2ddfe459b2d0d86d130dd460f2c126
3
  size 242012923