Johannes Garstenauer committed on
Commit
8be369e
·
1 Parent(s): 094f87f

Training in progress, step 6468

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2001a2a8d146bbc3210e2ba74909a6c54a34bc0f57ecb371f3a4fdf527c02b9d
3
  size 133863493
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3cd9ed599b2622be6183702891ab47ac5b9f5406d312cb802b16ed7f3098d9cf
3
  size 133863493
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1faeff0083195d9b234e601d177b81e0e8b95814a0bfb980ed3d9c20fa193536
3
  size 266276525
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f92d3d52cf47be1987752bc89ccb1ec1c6e0dc8b68b55de2fed88e49ded0e92
3
  size 266276525
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fa0b772b5dd21989336ffb42562e16185bc2e1d10a7ccdcb65ed21eb3e033e8e
3
  size 14511
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:edec1b2f1f61c07d3b95c625533890e74aa6568913f1c7d51a65585f79b1d35e
3
  size 14511
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:874b5d38d8e13a97c857fe192fe23456e3dd1f5254d9ee7767049f04c81795a2
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c3ed672465d4250f40b2ef2e23b0eb90ec6136a6bc9ed10c02bf3f9c750c79e
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.4500835034329189,
5
- "global_step": 4851,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -60,11 +60,29 @@
60
  "learning_rate": 2.195833505288551e-05,
61
  "loss": 0.1404,
62
  "step": 4500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
63
  }
64
  ],
65
  "max_steps": 32334,
66
  "num_train_epochs": 3,
67
- "total_flos": 8.225711749398528e+16,
68
  "trial_name": null,
69
  "trial_params": null
70
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.6001113379105586,
5
+ "global_step": 6468,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
60
  "learning_rate": 2.195833505288551e-05,
61
  "loss": 0.1404,
62
  "step": 4500
63
+ },
64
+ {
65
+ "epoch": 0.46,
66
+ "learning_rate": 2.156388339209501e-05,
67
+ "loss": 0.1381,
68
+ "step": 5000
69
+ },
70
+ {
71
+ "epoch": 0.51,
72
+ "learning_rate": 2.116943173130451e-05,
73
+ "loss": 0.136,
74
+ "step": 5500
75
+ },
76
+ {
77
+ "epoch": 0.56,
78
+ "learning_rate": 2.077498007051401e-05,
79
+ "loss": 0.135,
80
+ "step": 6000
81
  }
82
  ],
83
  "max_steps": 32334,
84
  "num_train_epochs": 3,
85
+ "total_flos": 1.0967615665864704e+17,
86
  "trial_name": null,
87
  "trial_params": null
88
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1faeff0083195d9b234e601d177b81e0e8b95814a0bfb980ed3d9c20fa193536
3
  size 266276525
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f92d3d52cf47be1987752bc89ccb1ec1c6e0dc8b68b55de2fed88e49ded0e92
3
  size 266276525