SystemAdmin123 commited on
Commit
cc08fbb
·
verified ·
1 Parent(s): b89fce4

Training in progress, step 50, checkpoint

Browse files
last-checkpoint/model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3b5c20dc59c769d88fe81b2b0843f23d2dd86b47b4591ef40bad9115cd2b4385
3
  size 4874664552
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72fe86bc02adec23b28b68c15b10a96fd293a20ee6a1cdaafd0cf18e1685dc20
3
  size 4874664552
last-checkpoint/model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d8ef29282721049bf0104c9d2701bfa26a60707403dbad153e661e9df28751f
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0db6c3053a7deda030e77cbf9dc2889c468ba509b50f75ffb580a36cf57e0ef
3
  size 4932751008
last-checkpoint/model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a175e2a7592da2781889f8d417906512e54b2c4cf1831f1316e119d4722001f4
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d92a224e994fa1a22383ebe54bf00bb1077af44379b3bf42e7679b3dbab9987
3
  size 4330865200
last-checkpoint/model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d149d0190b4a1e8c630935731679b382222057f720f060d7786d7b42e66238bd
3
  size 1086998656
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdd5806b5d6ec7a64af996081c0f79be909a2e91f7faf708ef85bc77a39e2f04
3
  size 1086998656
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fbd3cf7e9f20636c638ad5a407323f188cfb4d34ff7182f544b0b533f9bad084
3
  size 15465450874
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:264d9f5983d4e9539188419005a2b5a0ae23bbe058e7cb34ad670a166a35860a
3
  size 15465450874
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:73d7e7515bf9366d4128b5be03fea719bb7ed473249f57b8c5a1f2a51581ebf8
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c620e9c1e58182d1e495bef166b392358f6580ca0b286508365d4c14b06ac944
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.2094240837696335,
5
- "eval_steps": 40,
6
- "global_step": 40,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -11,53 +11,60 @@
11
  {
12
  "epoch": 0.005235602094240838,
13
  "eval_loss": 2.384796619415283,
14
- "eval_runtime": 61.2033,
15
- "eval_samples_per_second": 24.525,
16
- "eval_steps_per_second": 6.143,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 0.05235602094240838,
21
  "grad_norm": 5.15625,
22
  "learning_rate": 3.6363636363636364e-05,
23
- "loss": 1.9243,
24
  "step": 10
25
  },
26
  {
27
  "epoch": 0.10471204188481675,
28
- "grad_norm": 4.5625,
29
  "learning_rate": 7.272727272727273e-05,
30
- "loss": 1.8451,
31
  "step": 20
32
  },
33
  {
34
  "epoch": 0.15706806282722513,
35
  "grad_norm": 3.484375,
36
  "learning_rate": 0.00010909090909090909,
37
- "loss": 1.8315,
38
  "step": 30
39
  },
40
  {
41
  "epoch": 0.2094240837696335,
42
  "grad_norm": 3.390625,
43
  "learning_rate": 0.00014545454545454546,
44
- "loss": 2.0039,
45
  "step": 40
46
  },
47
  {
48
- "epoch": 0.2094240837696335,
49
- "eval_loss": 1.9543291330337524,
50
- "eval_runtime": 73.5405,
51
- "eval_samples_per_second": 20.411,
52
- "eval_steps_per_second": 5.113,
53
- "step": 40
 
 
 
 
 
 
 
54
  }
55
  ],
56
  "logging_steps": 10,
57
  "max_steps": 1100,
58
  "num_input_tokens_seen": 0,
59
  "num_train_epochs": 6,
60
- "save_steps": 20,
61
  "stateful_callbacks": {
62
  "TrainerControl": {
63
  "args": {
@@ -70,7 +77,7 @@
70
  "attributes": {}
71
  }
72
  },
73
- "total_flos": 1.3898457261539328e+16,
74
  "train_batch_size": 2,
75
  "trial_name": null,
76
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.2617801047120419,
5
+ "eval_steps": 50,
6
+ "global_step": 50,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
11
  {
12
  "epoch": 0.005235602094240838,
13
  "eval_loss": 2.384796619415283,
14
+ "eval_runtime": 62.0394,
15
+ "eval_samples_per_second": 24.194,
16
+ "eval_steps_per_second": 6.061,
17
  "step": 1
18
  },
19
  {
20
  "epoch": 0.05235602094240838,
21
  "grad_norm": 5.15625,
22
  "learning_rate": 3.6363636363636364e-05,
23
+ "loss": 1.9242,
24
  "step": 10
25
  },
26
  {
27
  "epoch": 0.10471204188481675,
28
+ "grad_norm": 4.59375,
29
  "learning_rate": 7.272727272727273e-05,
30
+ "loss": 1.845,
31
  "step": 20
32
  },
33
  {
34
  "epoch": 0.15706806282722513,
35
  "grad_norm": 3.484375,
36
  "learning_rate": 0.00010909090909090909,
37
+ "loss": 1.8311,
38
  "step": 30
39
  },
40
  {
41
  "epoch": 0.2094240837696335,
42
  "grad_norm": 3.390625,
43
  "learning_rate": 0.00014545454545454546,
44
+ "loss": 2.0034,
45
  "step": 40
46
  },
47
  {
48
+ "epoch": 0.2617801047120419,
49
+ "grad_norm": 3.59375,
50
+ "learning_rate": 0.00018181818181818183,
51
+ "loss": 2.2024,
52
+ "step": 50
53
+ },
54
+ {
55
+ "epoch": 0.2617801047120419,
56
+ "eval_loss": 2.1606948375701904,
57
+ "eval_runtime": 60.3553,
58
+ "eval_samples_per_second": 24.869,
59
+ "eval_steps_per_second": 6.23,
60
+ "step": 50
61
  }
62
  ],
63
  "logging_steps": 10,
64
  "max_steps": 1100,
65
  "num_input_tokens_seen": 0,
66
  "num_train_epochs": 6,
67
+ "save_steps": 50,
68
  "stateful_callbacks": {
69
  "TrainerControl": {
70
  "args": {
 
77
  "attributes": {}
78
  }
79
  },
80
+ "total_flos": 1.737307157692416e+16,
81
  "train_batch_size": 2,
82
  "trial_name": null,
83
  "trial_params": null
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2dccb17e5942fb2737bb1fdd5b88f91e0f16655a5f1ad194d5593b47e06f8592
3
  size 6968
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32a7a8613e5fa3317cdc198f56f6d0577b15eb3e0cf0efd4aa72ac710a8260e0
3
  size 6968