mgh6 committed on
Commit
d7b886d
·
verified ·
1 Parent(s): e474a39

Training in progress, step 100, checkpoint

Browse files
last-checkpoint/config.json CHANGED
@@ -23,7 +23,7 @@
23
  "position_embedding_type": "rotary",
24
  "token_dropout": true,
25
  "torch_dtype": "float32",
26
- "transformers_version": "4.36.1",
27
  "use_cache": true,
28
  "vocab_list": null,
29
  "vocab_size": 33
 
23
  "position_embedding_type": "rotary",
24
  "token_dropout": true,
25
  "torch_dtype": "float32",
26
+ "transformers_version": "4.45.2",
27
  "use_cache": true,
28
  "vocab_list": null,
29
  "vocab_size": 33
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:517b7a2aaaea838cb419a14f1b515d8b5cf1ed9fde5bf86d6fb0c135a3fcfda0
3
  size 136000488
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3cd9a570af82105305cf26766d7851aa7b4e32c4acb1dcdebd64cd9be4301098
3
  size 136000488
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6ee99e2558f0635b821e5f0474f85cc00393edabfccf6bb4110621fc826ded64
3
  size 268176506
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1eda6ad8e7e768db6abb9e04b52a008b2ecbe0f771c73b2c2ef7955c8d156e46
3
  size 268176506
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ee83cb0b382b6f7013b8e905a6b67eda9661bf7137607a26a8510616916ff33d
3
- size 14512
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ad6436ce5e8229a5c4ab20ebe8cb7f55bf37abeb42cc6031740224925ccece0
3
+ size 15024
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7cf5a1d1bb94d2ab14807987fb6e7f78b0a603abb98dc702e91c99346c1c8745
3
- size 14512
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30ce71d1ff265e905b2803194965013784a4a1c2ebcd76de912d912dd5430327
3
+ size 15024
last-checkpoint/rng_state_2.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac4ea73b7e3e12f80c898b525181786b56f8cafbf02cf3e2661eb5c2237f1786
3
+ size 15024
last-checkpoint/rng_state_3.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df5ac7dd4844d948bc63bc160ee8e329c029b596511f3d1234b31a48caf5cc47
3
+ size 15024
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0943229aeeb46312acb472f3efe5d902161c82efbe50119969078cb1567edce6
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf0d25366e7e2e728cd627802a5543527b6178cf70866baa22ea5a7d28baa2af
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,35 +1,57 @@
1
  {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
- "epoch": 0.12421588721197441,
5
- "eval_steps": 500,
6
- "global_step": 500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
- "epoch": 0.12,
13
- "learning_rate": 9.958592132505176e-05,
14
- "loss": 1.3838,
15
- "step": 500
 
16
  },
17
  {
18
- "epoch": 0.12,
19
- "eval_loss": 1.3269665241241455,
20
- "eval_runtime": 63.2116,
21
- "eval_samples_per_second": 255.634,
22
- "eval_steps_per_second": 15.978,
23
- "step": 500
24
  }
25
  ],
26
- "logging_steps": 500,
27
- "max_steps": 120750,
28
  "num_input_tokens_seen": 0,
29
- "num_train_epochs": 30,
30
- "save_steps": 500,
31
- "total_flos": 5001938240274432.0,
32
- "train_batch_size": 8,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
33
  "trial_name": null,
34
  "trial_params": null
35
  }
 
1
  {
2
+ "best_metric": 1.1609667539596558,
3
+ "best_model_checkpoint": "mgh6/TCS_MLM/checkpoint-100",
4
+ "epoch": 0.13386880856760375,
5
+ "eval_steps": 100,
6
+ "global_step": 100,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
  {
12
+ "epoch": 0.13386880856760375,
13
+ "grad_norm": 0.18324387073516846,
14
+ "learning_rate": 0.0009866131191432397,
15
+ "loss": 1.432,
16
+ "step": 100
17
  },
18
  {
19
+ "epoch": 0.13386880856760375,
20
+ "eval_loss": 1.1609667539596558,
21
+ "eval_runtime": 6.3619,
22
+ "eval_samples_per_second": 894.697,
23
+ "eval_steps_per_second": 3.615,
24
+ "step": 100
25
  }
26
  ],
27
+ "logging_steps": 100,
28
+ "max_steps": 7470,
29
  "num_input_tokens_seen": 0,
30
+ "num_train_epochs": 10,
31
+ "save_steps": 100,
32
+ "stateful_callbacks": {
33
+ "EarlyStoppingCallback": {
34
+ "args": {
35
+ "early_stopping_patience": 5,
36
+ "early_stopping_threshold": 0.0
37
+ },
38
+ "attributes": {
39
+ "early_stopping_patience_counter": 0
40
+ }
41
+ },
42
+ "TrainerControl": {
43
+ "args": {
44
+ "should_epoch_stop": false,
45
+ "should_evaluate": false,
46
+ "should_log": false,
47
+ "should_save": true,
48
+ "should_training_stop": false
49
+ },
50
+ "attributes": {}
51
+ }
52
+ },
53
+ "total_flos": 3631227076608000.0,
54
+ "train_batch_size": 64,
55
  "trial_name": null,
56
  "trial_params": null
57
  }
last-checkpoint/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5d5da2bb0b25e23c2716dc60237e84cea2973b9882dcc6ff60ec43fea4464a78
3
- size 4728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a3c35d00b3a9f09f09bbbd95adfdc6deaf5070563e785852debaae072505dcb
3
+ size 5240