SystemAdmin123 commited on
Commit
5d9163a
·
verified ·
1 Parent(s): 22b094d

Training in progress, step 100, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca5ae10db168677b2a3c9eebebb9f8c7f9b9d67457d37ffa9c3acda730924ede
3
  size 723674912
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3d4c86dbc3a809d6bdc35e80da94e44289853f47f3c4e8bc28bb197206757d0
3
  size 723674912
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1fce942f56022b1c968835cb5703df1ddb7bb2d9c6269c456723dbdb59672d7c
3
  size 735625370
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:152992c22320b5355e945dfb4a4cba99cfb4bf09b642dbac9c3009149011352d
3
  size 735625370
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e8e86174b3eb32925060e9953680fbcda12f487778e2fa23373bff16bb360a64
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65fc5493cd95cc4a525582d7144fab8c2fb7ccb5f192423671fe2e1c71f9588c
3
  size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:96e7dd869a6e1b32bc9520ed4dad315337bd74e7bba1905b1527b70f353d1ff6
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1e7cda19f7cb3579408e9f405862a0136ef9f921b9602ef040b683708565b31e
3
  size 15024
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9cdef07c8fb03613426123802d3ee28840d50c7dc4d30cb68fc9cabc31660adb
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35761c9ae1453a385e31327d4717208e814e94ccb377326730a4c7b214baa671
3
  size 15024
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24cc5299af352f51d11766db1f1a250378308cfbc684430ac64ca9d7b85e55c6
3
  size 15024
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a35cbf7b65c1a64e50166e0bb259917c6b81f8e9db674c5beb450f633f0b85b
3
  size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a7c81ebb017017feee3c6c3f2477294c6f8e1ba38c8568a1c58d53f7e2c4e60d
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fc7800513a1b4dd006c457152c700dd768bb49ee4ed8e4d9665a4e42095b054
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 10.0,
5
  "eval_steps": 20,
6
- "global_step": 80,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -103,6 +103,28 @@
103
  "eval_samples_per_second": 305.813,
104
  "eval_steps_per_second": 3.464,
105
  "step": 80
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
106
  }
107
  ],
108
  "logging_steps": 10,
@@ -122,7 +144,7 @@
122
  "attributes": {}
123
  }
124
  },
125
- "total_flos": 2.8455506955730944e+16,
126
  "train_batch_size": 23,
127
  "trial_name": null,
128
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 12.5,
5
  "eval_steps": 20,
6
+ "global_step": 100,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
103
  "eval_samples_per_second": 305.813,
104
  "eval_steps_per_second": 3.464,
105
  "step": 80
106
+ },
107
+ {
108
+ "epoch": 11.25,
109
+ "grad_norm": 0.1337890625,
110
+ "learning_rate": 0.00012454854871407994,
111
+ "loss": 2.0551,
112
+ "step": 90
113
+ },
114
+ {
115
+ "epoch": 12.5,
116
+ "grad_norm": 0.14453125,
117
+ "learning_rate": 0.00010825793454723325,
118
+ "loss": 2.0298,
119
+ "step": 100
120
+ },
121
+ {
122
+ "epoch": 12.5,
123
+ "eval_loss": 2.0621085166931152,
124
+ "eval_runtime": 5.0999,
125
+ "eval_samples_per_second": 294.32,
126
+ "eval_steps_per_second": 3.333,
127
+ "step": 100
128
  }
129
  ],
130
  "logging_steps": 10,
 
144
  "attributes": {}
145
  }
146
  },
147
+ "total_flos": 3.556938369466368e+16,
148
  "train_batch_size": 23,
149
  "trial_name": null,
150
  "trial_params": null