mgh6 committed on
Commit
ec37c38
·
verified ·
1 Parent(s): 21d1839

Training in progress, step 14700, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8cac6a6f7a31e5da389a45bb3c9f082ba3080e29ab9fc8d8efbfd63df38debee
3
  size 8137792
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f0570fbe1cfb2cc0429421c072380990511e34a42c049d209bffe41383ce964
3
  size 8137792
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0ac03cb4783a47c0a95be9f4a129f0f52588882668ede0ca0972e32f6e8d7fa2
3
  size 16386426
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16d8c736d6f95c350e9377664a0da87f05e71a8a7c9d7421b0cdb2eb7d7c320e
3
  size 16386426
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fa6c6ef1a13072691bc9776f605bb9e006b751f451537eba6fdf8f832f1aa17f
3
  size 15006
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67a554a2b1dfd0fb5fde5dac2e3a00d7c706f9f81bb1fac139c3340134e19778
3
  size 15006
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f44328417ddaab62e319c451bb3d9fe74cb7a3ed5a7dc379d94953a6ec72b89f
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39a8fd283686b2b43f94f51c5406bd8c5a6961c6a78793c52b8339d3ac0fec03
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 29.195438212779255,
5
  "eval_steps": 500,
6
- "global_step": 14600,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -1261,6 +1261,13 @@
1261
  "learning_rate": 2.666666666666667e-06,
1262
  "loss": 1.2162,
1263
  "step": 14600
 
 
 
 
 
 
 
1264
  }
1265
  ],
1266
  "logging_steps": 100,
@@ -1280,7 +1287,7 @@
1280
  "attributes": {}
1281
  }
1282
  },
1283
- "total_flos": 2.2786680244234355e+19,
1284
  "train_batch_size": 8,
1285
  "trial_name": null,
1286
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 29.3954069676613,
5
  "eval_steps": 500,
6
+ "global_step": 14700,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
1261
  "learning_rate": 2.666666666666667e-06,
1262
  "loss": 1.2162,
1263
  "step": 14600
1264
+ },
1265
+ {
1266
+ "epoch": 29.3954069676613,
1267
+ "grad_norm": 0.2399660050868988,
1268
+ "learning_rate": 2.0000000000000003e-06,
1269
+ "loss": 1.2179,
1270
+ "step": 14700
1271
  }
1272
  ],
1273
  "logging_steps": 100,
 
1287
  "attributes": {}
1288
  }
1289
  },
1290
+ "total_flos": 2.294275521542252e+19,
1291
  "train_batch_size": 8,
1292
  "trial_name": null,
1293
  "trial_params": null