lilyray committed on
Commit
5a5765d
·
verified ·
1 Parent(s): 1ac507d

Training in progress, epoch 2

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5822060e3c3a7ebd53d16d93cb50d2a5cfd7bad9d36edadaceeb261b16e3f07b
3
  size 437958648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67f65ebac087eecb3136c25266c13fe1748c83541d47af3665a593199e8fbbbf
3
  size 437958648
run-0/checkpoint-358/config.json CHANGED
@@ -9,52 +9,8 @@
9
  "hidden_act": "gelu",
10
  "hidden_dropout_prob": 0.1,
11
  "hidden_size": 768,
12
- "id2label": {
13
- "0": "LABEL_0",
14
- "1": "LABEL_1",
15
- "2": "LABEL_2",
16
- "3": "LABEL_3",
17
- "4": "LABEL_4",
18
- "5": "LABEL_5",
19
- "6": "LABEL_6",
20
- "7": "LABEL_7",
21
- "8": "LABEL_8",
22
- "9": "LABEL_9",
23
- "10": "LABEL_10",
24
- "11": "LABEL_11",
25
- "12": "LABEL_12",
26
- "13": "LABEL_13",
27
- "14": "LABEL_14",
28
- "15": "LABEL_15",
29
- "16": "LABEL_16",
30
- "17": "LABEL_17",
31
- "18": "LABEL_18",
32
- "19": "LABEL_19"
33
- },
34
  "initializer_range": 0.02,
35
  "intermediate_size": 3072,
36
- "label2id": {
37
- "LABEL_0": 0,
38
- "LABEL_1": 1,
39
- "LABEL_10": 10,
40
- "LABEL_11": 11,
41
- "LABEL_12": 12,
42
- "LABEL_13": 13,
43
- "LABEL_14": 14,
44
- "LABEL_15": 15,
45
- "LABEL_16": 16,
46
- "LABEL_17": 17,
47
- "LABEL_18": 18,
48
- "LABEL_19": 19,
49
- "LABEL_2": 2,
50
- "LABEL_3": 3,
51
- "LABEL_4": 4,
52
- "LABEL_5": 5,
53
- "LABEL_6": 6,
54
- "LABEL_7": 7,
55
- "LABEL_8": 8,
56
- "LABEL_9": 9
57
- },
58
  "layer_norm_eps": 1e-12,
59
  "max_position_embeddings": 512,
60
  "model_type": "bert",
 
9
  "hidden_act": "gelu",
10
  "hidden_dropout_prob": 0.1,
11
  "hidden_size": 768,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12
  "initializer_range": 0.02,
13
  "intermediate_size": 3072,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
14
  "layer_norm_eps": 1e-12,
15
  "max_position_embeddings": 512,
16
  "model_type": "bert",
run-0/checkpoint-358/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:72271a98ada970df47cd57bfbd4c33eb65e05fb14cb2ea7bf120b4542b53b217
3
- size 438014016
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67f65ebac087eecb3136c25266c13fe1748c83541d47af3665a593199e8fbbbf
3
+ size 437958648
run-0/checkpoint-358/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a0ed4b296a7a4a44743d3b8e9ccc1ab801744d507fdd9cac2d034648b6104f4
3
- size 876149114
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3e3d0aba04ad0e517ef1c40249cfc00da0057c2c9df2644889c84eb16cdb733
3
+ size 876038394
run-0/checkpoint-358/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:72340d53a573e35b8a2892a74e8a02c506aa351bd83a86e183b25bf359bda426
3
- size 14308
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be6a2abdc636a987f2524cd4857edadf7650cb9e40eb358dcc1c55bc8335346e
3
+ size 14244
run-0/checkpoint-358/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9b86cf7e053c2579534fed3f160f846f769dd4b4c1af244f53ae21315dfe462a
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d80a787c544b76e19fce4aa5a7af8bca8cf13afd6c290f7a34439d52dcc83275
3
  size 1064
run-0/checkpoint-358/trainer_state.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "best_metric": 0.6224137544631958,
3
  "best_model_checkpoint": "./results/run-0/checkpoint-358",
4
- "epoch": 1.0,
5
  "eval_steps": 500,
6
  "global_step": 358,
7
  "is_hyper_param_search": true,
@@ -10,26 +10,35 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_accuracy": 0.6795138888888889,
14
- "eval_loss": 0.6224137544631958,
15
- "eval_runtime": 10.0132,
16
- "eval_samples_per_second": 95.375,
17
- "eval_steps_per_second": 11.984,
 
 
 
 
 
 
 
 
 
18
  "step": 358
19
  }
20
  ],
21
  "logging_steps": 500,
22
- "max_steps": 716,
23
  "num_input_tokens_seen": 0,
24
  "num_train_epochs": 2,
25
  "save_steps": 500,
26
  "total_flos": 0,
27
- "train_batch_size": 8,
28
  "trial_name": null,
29
  "trial_params": {
30
- "learning_rate": 1.2830875674148802e-05,
31
  "num_train_epochs": 2,
32
- "per_device_train_batch_size": 8,
33
- "seed": 14
34
  }
35
  }
 
1
  {
2
+ "best_metric": 0.6166871786117554,
3
  "best_model_checkpoint": "./results/run-0/checkpoint-358",
4
+ "epoch": 2.0,
5
  "eval_steps": 500,
6
  "global_step": 358,
7
  "is_hyper_param_search": true,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_accuracy": 0.6253472222222222,
14
+ "eval_loss": 0.642154335975647,
15
+ "eval_runtime": 10.3326,
16
+ "eval_samples_per_second": 92.426,
17
+ "eval_steps_per_second": 11.614,
18
+ "step": 179
19
+ },
20
+ {
21
+ "epoch": 2.0,
22
+ "eval_accuracy": 0.6413194444444446,
23
+ "eval_loss": 0.6166871786117554,
24
+ "eval_runtime": 10.3148,
25
+ "eval_samples_per_second": 92.585,
26
+ "eval_steps_per_second": 11.634,
27
  "step": 358
28
  }
29
  ],
30
  "logging_steps": 500,
31
+ "max_steps": 358,
32
  "num_input_tokens_seen": 0,
33
  "num_train_epochs": 2,
34
  "save_steps": 500,
35
  "total_flos": 0,
36
+ "train_batch_size": 16,
37
  "trial_name": null,
38
  "trial_params": {
39
+ "learning_rate": 9.375386211631406e-06,
40
  "num_train_epochs": 2,
41
+ "per_device_train_batch_size": 16,
42
+ "seed": 4
43
  }
44
  }
run-0/checkpoint-358/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed7492942e77c037e56d91ad59372c979d1f8ff2bc44d6c8e69149791748c37a
3
  size 4920
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:362bc42377e8cdf8bb785935f0b5fbe5a696f30de3dafe660b2fe381b2a64dc6
3
  size 4920
runs/Mar09_23-14-00_aa189cdd2d19/events.out.tfevents.1710026630.aa189cdd2d19.2368.3 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f3f56ef902ddb4652d3084a3d86a3c0dd6d4da9d1e67283e4dc2e3d5e44640dc
3
- size 4885
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:823abab9c7a85287656f94527b6673e6a0a1dd6d604fd9331149aafd1612e315
3
+ size 5562