dq158 committed on
Commit
73665eb
·
1 Parent(s): e1efcea

Training in progress, epoch 2, checkpoint

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2ab5328b63a8ec3b53c2f26a99111049d2792ac322fccebc0739829ebfab0879
3
  size 1980860410
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6393b8f0ca5e88756c2083d1f2a1907a0f9a6dbb6883be0a4876e58b8454d9e5
3
  size 1980860410
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a0afe6c8cd50d6bcf5ad6cb45258efb15f89d523168c877fac499ab3891b636e
3
  size 990409330
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c614a827b995ce3eaf6b4ca43b101bd027894d4a25801ccc43d2a50633f617fc
3
  size 990409330
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:52a28bc3541f02e8de86363b8d2f634108f83fb8b7a33f774c760cce0869599d
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:86155979fa4274be782ec567e9a698db195e65592845142c9f3ce5d5d0bead1a
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5afd8d09736ea35ab4f783803d2aca249bf98e9d0591be216198fe2ebe96a3c3
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d9908d10066d14a0312f52aee3b01a644d08d03fb490399a3d67eceed366c84
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
- "best_metric": 1.4803038835525513,
3
- "best_model_checkpoint": "dq158/morbius/checkpoint-1475",
4
- "epoch": 1.0,
5
  "eval_steps": 500,
6
- "global_step": 1475,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -38,13 +38,50 @@
38
  "eval_steps_per_second": 0.555,
39
  "eval_translation_length": 35996,
40
  "step": 1475
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
41
  }
42
  ],
43
  "logging_steps": 500,
44
  "max_steps": 7375,
45
  "num_train_epochs": 5,
46
  "save_steps": 500,
47
- "total_flos": 1.2116096594214912e+16,
48
  "trial_name": null,
49
  "trial_params": null
50
  }
 
1
  {
2
+ "best_metric": 1.4565129280090332,
3
+ "best_model_checkpoint": "dq158/morbius/checkpoint-2950",
4
+ "epoch": 2.0,
5
  "eval_steps": 500,
6
+ "global_step": 2950,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
38
  "eval_steps_per_second": 0.555,
39
  "eval_translation_length": 35996,
40
  "step": 1475
41
+ },
42
+ {
43
+ "epoch": 1.02,
44
+ "learning_rate": 3.983050847457627e-05,
45
+ "loss": 1.7275,
46
+ "step": 1500
47
+ },
48
+ {
49
+ "epoch": 1.36,
50
+ "learning_rate": 3.644067796610169e-05,
51
+ "loss": 1.6924,
52
+ "step": 2000
53
+ },
54
+ {
55
+ "epoch": 1.69,
56
+ "learning_rate": 3.305084745762712e-05,
57
+ "loss": 1.6815,
58
+ "step": 2500
59
+ },
60
+ {
61
+ "epoch": 2.0,
62
+ "eval_bleu": 1.0,
63
+ "eval_brevity_penalty": 1.0,
64
+ "eval_length_ratio": 1.0,
65
+ "eval_loss": 1.4565129280090332,
66
+ "eval_precisions": [
67
+ 1.0,
68
+ 1.0,
69
+ 1.0,
70
+ 1.0
71
+ ],
72
+ "eval_reference_length": 35935,
73
+ "eval_runtime": 291.4973,
74
+ "eval_samples_per_second": 6.744,
75
+ "eval_steps_per_second": 0.563,
76
+ "eval_translation_length": 35935,
77
+ "step": 2950
78
  }
79
  ],
80
  "logging_steps": 500,
81
  "max_steps": 7375,
82
  "num_train_epochs": 5,
83
  "save_steps": 500,
84
+ "total_flos": 2.4232193188429824e+16,
85
  "trial_name": null,
86
  "trial_params": null
87
  }