mgh6 committed on
Commit
59b27a1
·
verified ·
1 Parent(s): a1e1b7c

Training in progress, step 100, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d5caa6b92b6430b5541b79e0b58f7ca5bb7d35f38bba2d968f71df2dc83838d5
3
  size 2611614300
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:507d55726514d36d57a7fdead1e533238594fb1d956a903a49ce02157b571e17
3
  size 2611614300
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a616e5e2709e474c9e362c0f8f56e247d8aba32eca2de467636730b28c4d4ef
3
  size 5213028466
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fb309794c77ba81c5d999193c64bdbf97c4b11eecd10e3754dddae31d948844
3
  size 5213028466
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7e3307365943bdb97704420d03c23d6d5be63a26f2aeac779ce1f4ea6ad16d9e
3
  size 14942
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:874b9aec013ad321d4edc1c021ca42f8014c7ff34d53714ff8059015e8ee9794
3
  size 14942
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:68efe461a0b35c4aec0914c8e4be32a81c4a4261603765c475d2e90661d821c9
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c39af0f6970331c0f430d145f5514421d9baa7e90f9cf02971fb62606bf1ff3d
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,26 +1,26 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.24843756065370134,
5
- "eval_steps": 5000,
6
- "global_step": 1000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.24843756065370134,
13
- "grad_norm": 0.6212329864501953,
14
- "learning_rate": 0.0009751552795031056,
15
- "loss": 5.552229361614273e+25,
16
- "step": 1000
17
  }
18
  ],
19
- "logging_steps": 1000,
20
  "max_steps": 40250,
21
  "num_input_tokens_seen": 0,
22
  "num_train_epochs": 10,
23
- "save_steps": 1000,
24
  "stateful_callbacks": {
25
  "TrainerControl": {
26
  "args": {
@@ -33,7 +33,7 @@
33
  "attributes": {}
34
  }
35
  },
36
- "total_flos": 1.9448797327261696e+17,
37
  "train_batch_size": 1,
38
  "trial_name": null,
39
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.024843756065370134,
5
+ "eval_steps": 500,
6
+ "global_step": 100,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.024843756065370134,
13
+ "grad_norm": 0.9147792458534241,
14
+ "learning_rate": 0.0009975155279503105,
15
+ "loss": 1.0811305421386547e+17,
16
+ "step": 100
17
  }
18
  ],
19
+ "logging_steps": 100,
20
  "max_steps": 40250,
21
  "num_input_tokens_seen": 0,
22
  "num_train_epochs": 10,
23
+ "save_steps": 100,
24
  "stateful_callbacks": {
25
  "TrainerControl": {
26
  "args": {
 
33
  "attributes": {}
34
  }
35
  },
36
+ "total_flos": 1.9448797327261696e+16,
37
  "train_batch_size": 1,
38
  "trial_name": null,
39
  "trial_params": null
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b7148c30a014b8855d44fa1707c1d7591fba5860cd9f37063b980d6b66e148b9
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0aae1b036793cf546f080bfdd66ff5e43f2ec5b41ab240614331a01cb7e0e4a5
3
  size 5176