SystemAdmin123 committed on
Commit
ddecad5
·
verified ·
1 Parent(s): cac4296

Training in progress, step 80, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f0661a72ba3b66e4cc9219a425dc921ded7fb63db1b28e737a02a8ac7fdf59c
3
  size 723674912
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca5ae10db168677b2a3c9eebebb9f8c7f9b9d67457d37ffa9c3acda730924ede
3
  size 723674912
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:14923cfad5b25d998979f61b48520b8b8f6c1c8529883dfdb62b3f6c200c9927
3
  size 735625370
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1fce942f56022b1c968835cb5703df1ddb7bb2d9c6269c456723dbdb59672d7c
3
  size 735625370
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:19fc90eda86010024a75dd32530431e4c24bd0a1f6eff78d85286abbab03fba0
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8e86174b3eb32925060e9953680fbcda12f487778e2fa23373bff16bb360a64
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:566f4865681bbc83459877b33ce491582588f147022ba0534caf3300e631e63c
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96e7dd869a6e1b32bc9520ed4dad315337bd74e7bba1905b1527b70f353d1ff6
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3338107951da02a423c8f8ac5237de9e0061e6b3d0456c6fc2efa3002cc8846d
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cdef07c8fb03613426123802d3ee28840d50c7dc4d30cb68fc9cabc31660adb
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fffd547e430c47ced000ae5492f6d5e18bd88a88193ec1ee24bfe6f6a4d8e35f
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24cc5299af352f51d11766db1f1a250378308cfbc684430ac64ca9d7b85e55c6
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ceb70d09862bb859050a14662883ecf389a0e55aec23642f4305d8f0de2bee43
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7c81ebb017017feee3c6c3f2477294c6f8e1ba38c8568a1c58d53f7e2c4e60d
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 7.5,
5
  "eval_steps": 20,
6
- "global_step": 60,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -81,6 +81,28 @@
81
  "eval_samples_per_second": 279.177,
82
  "eval_steps_per_second": 3.162,
83
  "step": 60
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
84
  }
85
  ],
86
  "logging_steps": 10,
@@ -100,7 +122,7 @@
100
  "attributes": {}
101
  }
102
  },
103
- "total_flos": 2.134163021679821e+16,
104
  "train_batch_size": 23,
105
  "trial_name": null,
106
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 10.0,
5
  "eval_steps": 20,
6
+ "global_step": 80,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
81
  "eval_samples_per_second": 279.177,
82
  "eval_steps_per_second": 3.162,
83
  "step": 60
84
+ },
85
+ {
86
+ "epoch": 8.75,
87
+ "grad_norm": 0.138671875,
88
+ "learning_rate": 0.00015469481581224272,
89
+ "loss": 2.0638,
90
+ "step": 70
91
+ },
92
+ {
93
+ "epoch": 10.0,
94
+ "grad_norm": 0.140625,
95
+ "learning_rate": 0.00014016954246529696,
96
+ "loss": 2.0632,
97
+ "step": 80
98
+ },
99
+ {
100
+ "epoch": 10.0,
101
+ "eval_loss": 2.067866325378418,
102
+ "eval_runtime": 4.9082,
103
+ "eval_samples_per_second": 305.813,
104
+ "eval_steps_per_second": 3.464,
105
+ "step": 80
106
  }
107
  ],
108
  "logging_steps": 10,
 
122
  "attributes": {}
123
  }
124
  },
125
+ "total_flos": 2.8455506955730944e+16,
126
  "train_batch_size": 23,
127
  "trial_name": null,
128
  "trial_params": null