devvanshhh committed on
Commit
b9d1c16
·
1 Parent(s): e23cf5a

Training in progress, epoch 4, checkpoint

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6b14ca092add6f83afa8592d7cc107f9a67c8e22970174dcecb8c088b5de4169
3
  size 615849402
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61252a82dcc7cc460a7ca8e49e81f8a6269636bd56c3c3d0d458eebf8b37ff44
3
  size 615849402
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:53b82483abfbf4ffd8c243b766dabbb4812428d1894516eada10c5a9bfc6fd48
3
  size 307910594
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:abe65158947a614ad80011b29d3a4888efbbc0963b7a74c0d1f8afaa60390425
3
  size 307910594
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ede5b6194a7298561178c49b95e0507051d3deed7c4f79c181647c4a85f692c
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1e65b606b54db60587912fdc573f5f38a59d25ab0eb278c25736d481395cdf2
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f47fdf6b0fbbab3a9ea4d27bd0147fa6ed4e838983e0cf3922c7879c115ad6f0
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3bb0b6e8dad866c1a4d1aed7e44eadc70d3ea1328d713add8793b99298fb68f
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 0.7071468234062195,
3
- "best_model_checkpoint": "flanT5-description-generation/checkpoint-297",
4
- "epoch": 3.0,
5
  "eval_steps": 500,
6
- "global_step": 297,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -46,13 +46,26 @@
46
  "eval_samples_per_second": 16.011,
47
  "eval_steps_per_second": 2.032,
48
  "step": 297
 
 
 
 
 
 
 
 
 
 
 
 
 
49
  }
50
  ],
51
  "logging_steps": 500,
52
  "max_steps": 495,
53
  "num_train_epochs": 5,
54
  "save_steps": 500,
55
- "total_flos": 438887481606144.0,
56
  "trial_name": null,
57
  "trial_params": null
58
  }
 
1
  {
2
+ "best_metric": 0.42786499857902527,
3
+ "best_model_checkpoint": "flanT5-description-generation/checkpoint-396",
4
+ "epoch": 4.0,
5
  "eval_steps": 500,
6
+ "global_step": 396,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
46
  "eval_samples_per_second": 16.011,
47
  "eval_steps_per_second": 2.032,
48
  "step": 297
49
+ },
50
+ {
51
+ "epoch": 4.0,
52
+ "eval_gen_len": 5.5786802030456855,
53
+ "eval_loss": 0.42786499857902527,
54
+ "eval_rouge1": 6.0645,
55
+ "eval_rouge2": 5.1995,
56
+ "eval_rougeL": 5.6723,
57
+ "eval_rougeLsum": 5.6926,
58
+ "eval_runtime": 16.8779,
59
+ "eval_samples_per_second": 11.672,
60
+ "eval_steps_per_second": 1.481,
61
+ "step": 396
62
  }
63
  ],
64
  "logging_steps": 500,
65
  "max_steps": 495,
66
  "num_train_epochs": 5,
67
  "save_steps": 500,
68
+ "total_flos": 585183308808192.0,
69
  "trial_name": null,
70
  "trial_params": null
71
  }