mgh6 committed on
Commit
9a4adc2
·
verified ·
1 Parent(s): 567d35b

Training in progress, step 10, checkpoint

Browse files
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c06f7160f22fbde4b0edd532ca852a26d78a7b89e74befb3ee87df81ead89bef
3
  size 136989964
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cea0765bd8f0b9a1e12ea0a8b17600537a8a8aa9b31d6b035239ebbbf9f671b
3
  size 136989964
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:457b61c538c6fd492b78ddcd5ec0971d7e5783c294246d6ffc856b88b8f6597f
3
  size 274102522
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:09d211561c9300b084ee1c67ccc50eb7ccc587eb35c5a98716831bd475c56b01
3
  size 274102522
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:39faad36473fe7ccd1d8b3cc1d38b7677f89aa6a9fa89752e8cf76ccfeb6b6fa
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15d1dcbcac9056d8a037e6e4a22324a07fd3a0a6e510aab60137760c5db6e4b6
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f0835ee1c22f84165c30215666e7b398add56dfc6181de2afa3282c5c633579
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c977fb38c051b92c0da24652d501a434592fa15ac6055c06154f25847bf8d87
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,49 +1,34 @@
1
  {
2
- "best_metric": 0.09355609118938446,
3
- "best_model_checkpoint": "mgh6/TCS_Pair_base/checkpoint-50",
4
- "epoch": 0.6514657980456026,
5
- "eval_steps": 50,
6
- "global_step": 100,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.3257328990228013,
13
- "grad_norm": 0.0015510329976677895,
14
- "learning_rate": 0.0009673202614379086,
15
- "loss": 1.4376,
16
- "step": 50
17
  },
18
  {
19
- "epoch": 0.3257328990228013,
20
- "eval_loss": 0.09355609118938446,
21
- "eval_runtime": 0.1701,
22
- "eval_samples_per_second": 235.183,
23
- "eval_steps_per_second": 5.88,
24
- "step": 50
25
- },
26
- {
27
- "epoch": 0.6514657980456026,
28
- "grad_norm": 0.005515442695468664,
29
- "learning_rate": 0.000934640522875817,
30
- "loss": 0.0635,
31
- "step": 100
32
- },
33
- {
34
- "epoch": 0.6514657980456026,
35
- "eval_loss": 0.10034115612506866,
36
- "eval_runtime": 0.1666,
37
- "eval_samples_per_second": 240.085,
38
- "eval_steps_per_second": 6.002,
39
- "step": 100
40
  }
41
  ],
42
- "logging_steps": 50,
43
  "max_steps": 1530,
44
  "num_input_tokens_seen": 0,
45
  "num_train_epochs": 10,
46
- "save_steps": 50,
47
  "stateful_callbacks": {
48
  "EarlyStoppingCallback": {
49
  "args": {
@@ -51,7 +36,7 @@
51
  "early_stopping_threshold": 0.0
52
  },
53
  "attributes": {
54
- "early_stopping_patience_counter": 1
55
  }
56
  },
57
  "TrainerControl": {
 
1
  {
2
+ "best_metric": 0.11874232441186905,
3
+ "best_model_checkpoint": "mgh6/TCS_Pair_base/checkpoint-10",
4
+ "epoch": 0.06514657980456026,
5
+ "eval_steps": 10,
6
+ "global_step": 10,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.06514657980456026,
13
+ "grad_norm": 2.679584264755249,
14
+ "learning_rate": 0.0009934640522875817,
15
+ "loss": 6.8323,
16
+ "step": 10
17
  },
18
  {
19
+ "epoch": 0.06514657980456026,
20
+ "eval_loss": 0.11874232441186905,
21
+ "eval_runtime": 0.1734,
22
+ "eval_samples_per_second": 230.735,
23
+ "eval_steps_per_second": 5.768,
24
+ "step": 10
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
25
  }
26
  ],
27
+ "logging_steps": 10,
28
  "max_steps": 1530,
29
  "num_input_tokens_seen": 0,
30
  "num_train_epochs": 10,
31
+ "save_steps": 10,
32
  "stateful_callbacks": {
33
  "EarlyStoppingCallback": {
34
  "args": {
 
36
  "early_stopping_threshold": 0.0
37
  },
38
  "attributes": {
39
+ "early_stopping_patience_counter": 0
40
  }
41
  },
42
  "TrainerControl": {
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed8892a6ebe12874b1e27051fb6dccb01d1190c645673e179ca706515b004c6e
3
  size 5240
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5beade62aada710acad234d8207eb11ac44f66d433b38da8f5e0430bdedea5fc
3
  size 5240