k4black committed on
Commit
55472a1
·
1 Parent(s): 8ae67a0

Training in progress, step 9000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3a85eb263deb4c62619accbaf79f0b4b520c964ea72ccb01a610c00d14c2e6c1
3
  size 484047087
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e19bdea073f1b17bc8e8a0f657c67dd3b1bb4f8bde89ffa43ed9e47456e2e259
3
  size 484047087
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4b276e716795aaff1cff242b0a235b4a334c0f04be0f4527656426fdc25e0374
3
  size 242012923
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:236ac2a99de8898e9adfad014e34dc559fd10b5c876168a4128b74cab112d650
3
  size 242012923
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a6fe5e55a28bec87da43da634edefd5e9737d0fb7942ab5d1595a5149b1148b6
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3c0c745fe5ced5b2666478002f55dcf70f1ca84a5de6a6cc312fc12ef289e28
3
  size 14503
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:97aa4284d30c55c9de6eb4425ce0d2728af80a248d437264944c01a2e6a6265c
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ebe8ae26c1a46b0bbc6250f4e37af6612f7d39b838b9550c3718a26037884e0
3
  size 559
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f97dba5218102cb7a6dbc477aa202196bb52ab595fab0e37adc58120c6e0a955
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:adfb3f10942eacbb4de0657261ea2ad84389656c6efb6798e4e115025b1e7001
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 0.7641937732696533,
3
- "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-adamw/checkpoint-8500",
4
- "epoch": 2.7199999999999998,
5
- "global_step": 8500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -346,11 +346,31 @@
346
  "eval_samples_per_second": 75.505,
347
  "eval_steps_per_second": 2.378,
348
  "step": 8500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
349
  }
350
  ],
351
  "max_steps": 31250,
352
  "num_train_epochs": 10,
353
- "total_flos": 3.614193688982323e+16,
354
  "trial_name": null,
355
  "trial_params": null
356
  }
 
1
  {
2
+ "best_metric": 0.7621653079986572,
3
+ "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-adamw/checkpoint-9000",
4
+ "epoch": 2.88,
5
+ "global_step": 9000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
346
  "eval_samples_per_second": 75.505,
347
  "eval_steps_per_second": 2.378,
348
  "step": 8500
349
+ },
350
+ {
351
+ "epoch": 2.88,
352
+ "learning_rate": 7.496547310270489e-05,
353
+ "loss": 0.5387,
354
+ "step": 9000
355
+ },
356
+ {
357
+ "epoch": 2.88,
358
+ "eval_bleu": 0.13416837075728422,
359
+ "eval_exact_match": 0.159,
360
+ "eval_loss": 0.7621653079986572,
361
+ "eval_rouge1": 0.5671758743776842,
362
+ "eval_rouge2": 0.3987572074969532,
363
+ "eval_rougeL": 0.5499787838213916,
364
+ "eval_rougeLsum": 0.55728689293535,
365
+ "eval_runtime": 26.7851,
366
+ "eval_samples_per_second": 74.668,
367
+ "eval_steps_per_second": 2.352,
368
+ "step": 9000
369
  }
370
  ],
371
  "max_steps": 31250,
372
  "num_train_epochs": 10,
373
+ "total_flos": 3.826357188742349e+16,
374
  "trial_name": null,
375
  "trial_params": null
376
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4b276e716795aaff1cff242b0a235b4a334c0f04be0f4527656426fdc25e0374
3
  size 242012923
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:236ac2a99de8898e9adfad014e34dc559fd10b5c876168a4128b74cab112d650
3
  size 242012923