k4black committed on
Commit
8ae67a0
·
1 Parent(s): 92afe32

Training in progress, step 8500

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1873b7c859425f0e26f2347fb91e6a776cba2e48839820c2dcea4e22bc7fbc67
3
  size 484047087
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a85eb263deb4c62619accbaf79f0b4b520c964ea72ccb01a610c00d14c2e6c1
3
  size 484047087
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f23299a7aeba471b07c347aceb29e5198305d8414f4dd4b21f79fc14a4592d39
3
  size 242012923
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b276e716795aaff1cff242b0a235b4a334c0f04be0f4527656426fdc25e0374
3
  size 242012923
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0f9038bd13cee7be809b870072293469c3cd227459e6b82a61f4cf6abfd04c52
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6fe5e55a28bec87da43da634edefd5e9737d0fb7942ab5d1595a5149b1148b6
3
  size 14503
last-checkpoint/scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0316325edea77248486ca0e79ad8e8ee0b7725685c3d831ab06f04629fb1ef89
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97aa4284d30c55c9de6eb4425ce0d2728af80a248d437264944c01a2e6a6265c
3
  size 559
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:34db57be1d8dc6c076b5589b33fe55a93138c1738acd1cce1da407f6d1d9bb29
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f97dba5218102cb7a6dbc477aa202196bb52ab595fab0e37adc58120c6e0a955
3
  size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 0.767312228679657,
3
- "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-adamw/checkpoint-8000",
4
- "epoch": 2.56,
5
- "global_step": 8000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -326,11 +326,31 @@
326
  "eval_samples_per_second": 74.896,
327
  "eval_steps_per_second": 2.359,
328
  "step": 8000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
329
  }
330
  ],
331
  "max_steps": 31250,
332
  "num_train_epochs": 10,
333
- "total_flos": 3.4018432483590144e+16,
334
  "trial_name": null,
335
  "trial_params": null
336
  }
 
1
  {
2
+ "best_metric": 0.7641937732696533,
3
+ "best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-adamw/checkpoint-8500",
4
+ "epoch": 2.7199999999999998,
5
+ "global_step": 8500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
326
  "eval_samples_per_second": 74.896,
327
  "eval_steps_per_second": 2.359,
328
  "step": 8000
329
+ },
330
+ {
331
+ "epoch": 2.72,
332
+ "learning_rate": 7.664971199514939e-05,
333
+ "loss": 0.5322,
334
+ "step": 8500
335
+ },
336
+ {
337
+ "epoch": 2.72,
338
+ "eval_bleu": 0.13498312180179964,
339
+ "eval_exact_match": 0.1665,
340
+ "eval_loss": 0.7641937732696533,
341
+ "eval_rouge1": 0.5707696930577069,
342
+ "eval_rouge2": 0.403346138073659,
343
+ "eval_rougeL": 0.5527280072901636,
344
+ "eval_rougeLsum": 0.5605579795104842,
345
+ "eval_runtime": 26.4882,
346
+ "eval_samples_per_second": 75.505,
347
+ "eval_steps_per_second": 2.378,
348
+ "step": 8500
349
  }
350
  ],
351
  "max_steps": 31250,
352
  "num_train_epochs": 10,
353
+ "total_flos": 3.614193688982323e+16,
354
  "trial_name": null,
355
  "trial_params": null
356
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f23299a7aeba471b07c347aceb29e5198305d8414f4dd4b21f79fc14a4592d39
3
  size 242012923
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4b276e716795aaff1cff242b0a235b4a334c0f04be0f4527656426fdc25e0374
3
  size 242012923