Silicon23 committed on
Commit
05c8f03
·
verified ·
1 Parent(s): cd9eb22

Training in progress, epoch 1

Browse files
Files changed (36) hide show
  1. model.safetensors +1 -1
  2. run-2/checkpoint-1101/config.json +2 -2
  3. run-2/checkpoint-1101/model.safetensors +2 -2
  4. run-2/checkpoint-1101/optimizer.pt +2 -2
  5. run-2/checkpoint-1101/rng_state.pth +1 -1
  6. run-2/checkpoint-1101/scheduler.pt +1 -1
  7. run-2/checkpoint-1101/special_tokens_map.json +35 -5
  8. run-2/checkpoint-1101/tokenizer.json +0 -0
  9. run-2/checkpoint-1101/tokenizer_config.json +5 -1
  10. run-2/checkpoint-1101/trainer_state.json +30 -30
  11. run-2/checkpoint-1101/training_args.bin +1 -1
  12. run-2/checkpoint-1101/vocab.txt +0 -0
  13. run-2/checkpoint-734/config.json +2 -2
  14. run-2/checkpoint-734/model.safetensors +2 -2
  15. run-2/checkpoint-734/optimizer.pt +2 -2
  16. run-2/checkpoint-734/rng_state.pth +1 -1
  17. run-2/checkpoint-734/scheduler.pt +1 -1
  18. run-2/checkpoint-734/special_tokens_map.json +35 -5
  19. run-2/checkpoint-734/tokenizer.json +0 -0
  20. run-2/checkpoint-734/tokenizer_config.json +5 -1
  21. run-2/checkpoint-734/trainer_state.json +20 -20
  22. run-2/checkpoint-734/training_args.bin +1 -1
  23. run-2/checkpoint-734/vocab.txt +0 -0
  24. run-3/checkpoint-184/config.json +27 -0
  25. run-3/checkpoint-184/model.safetensors +3 -0
  26. run-3/checkpoint-184/optimizer.pt +3 -0
  27. run-3/checkpoint-184/rng_state.pth +3 -0
  28. run-3/checkpoint-184/scheduler.pt +3 -0
  29. run-3/checkpoint-184/special_tokens_map.json +37 -0
  30. run-3/checkpoint-184/tokenizer.json +0 -0
  31. run-3/checkpoint-184/tokenizer_config.json +59 -0
  32. run-3/checkpoint-184/trainer_state.json +47 -0
  33. run-3/checkpoint-184/training_args.bin +3 -0
  34. run-3/checkpoint-184/vocab.txt +0 -0
  35. runs/Aug01_14-25-19_1d376fbba8fb/events.out.tfevents.1722522793.1d376fbba8fb.12065.6 +3 -0
  36. training_args.bin +1 -1
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fadc71a72125e03f5838a56bfadbd4602fa066c074a14f472a32a55cecf283e9
3
  size 433270768
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:390b87a07ea0f9d6a4d87537c546b85c20c7024933ff57eb2812b09c2682daad
3
  size 433270768
run-2/checkpoint-1101/config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "google-bert/bert-base-uncased",
3
  "architectures": [
4
  "BertForSequenceClassification"
5
  ],
@@ -23,5 +23,5 @@
23
  "transformers_version": "4.42.4",
24
  "type_vocab_size": 2,
25
  "use_cache": true,
26
- "vocab_size": 30522
27
  }
 
1
  {
2
+ "_name_or_path": "AIMH/mental-bert-base-cased",
3
  "architectures": [
4
  "BertForSequenceClassification"
5
  ],
 
23
  "transformers_version": "4.42.4",
24
  "type_vocab_size": 2,
25
  "use_cache": true,
26
+ "vocab_size": 28996
27
  }
run-2/checkpoint-1101/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f779546e5d9b6f9135ee088f0f2964d2cf38ba87e922bee184ea20d63557abfe
3
- size 437958648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58532fc3e6e1a792d6eb422fdeaa2ba2aec556a1473580e392c144e6dacd0dd3
3
+ size 433270768
run-2/checkpoint-1101/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6eab4a8bec2860524e20618eb23b1dbd2dc3e704b1d873cf473fd144e519e89d
3
- size 876038394
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:186aefc95e967cccdee9c7e6d071af5f570d869ed965183ee610232d59082858
3
+ size 866662650
run-2/checkpoint-1101/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:933286e0cb9dcea1f2c440bb26c48c8f37234f07f09a7914eca4e8dc98672017
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62544c3cadf55a8d18579328e5981c8ef34e618dca083fe5c9460fac4bcc9ee2
3
  size 14244
run-2/checkpoint-1101/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:77cb59fcda7e06ca900ff873508b1edd0916052514a9aa26ce5a07cecd3ad2a6
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:64ac2d15bb8efc796f5dc6b11142a1c7de8e9e03a6bed927a5bb8c773c4277b1
3
  size 1064
run-2/checkpoint-1101/special_tokens_map.json CHANGED
@@ -1,7 +1,37 @@
1
  {
2
- "cls_token": "[CLS]",
3
- "mask_token": "[MASK]",
4
- "pad_token": "[PAD]",
5
- "sep_token": "[SEP]",
6
- "unk_token": "[UNK]"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7
  }
 
1
  {
2
+ "cls_token": {
3
+ "content": "[CLS]",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "mask_token": {
10
+ "content": "[MASK]",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "[PAD]",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "sep_token": {
24
+ "content": "[SEP]",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "unk_token": {
31
+ "content": "[UNK]",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ }
37
  }
run-2/checkpoint-1101/tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
run-2/checkpoint-1101/tokenizer_config.json CHANGED
@@ -43,13 +43,17 @@
43
  },
44
  "clean_up_tokenization_spaces": true,
45
  "cls_token": "[CLS]",
46
- "do_lower_case": true,
47
  "mask_token": "[MASK]",
 
48
  "model_max_length": 512,
49
  "pad_token": "[PAD]",
50
  "sep_token": "[SEP]",
 
51
  "strip_accents": null,
52
  "tokenize_chinese_chars": true,
53
  "tokenizer_class": "BertTokenizer",
 
 
54
  "unk_token": "[UNK]"
55
  }
 
43
  },
44
  "clean_up_tokenization_spaces": true,
45
  "cls_token": "[CLS]",
46
+ "do_lower_case": false,
47
  "mask_token": "[MASK]",
48
+ "max_length": 512,
49
  "model_max_length": 512,
50
  "pad_token": "[PAD]",
51
  "sep_token": "[SEP]",
52
+ "stride": 0,
53
  "strip_accents": null,
54
  "tokenize_chinese_chars": true,
55
  "tokenizer_class": "BertTokenizer",
56
+ "truncation_side": "right",
57
+ "truncation_strategy": "longest_first",
58
  "unk_token": "[UNK]"
59
  }
run-2/checkpoint-1101/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "best_metric": 0.861878453038674,
3
- "best_model_checkpoint": "BERTForDetectingDepression-Twitter2015/run-2/checkpoint-734",
4
  "epoch": 3.0,
5
  "eval_steps": 500,
6
  "global_step": 1101,
@@ -10,50 +10,50 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_accuracy": 0.8207489257213014,
14
- "eval_loss": 0.41005730628967285,
15
- "eval_runtime": 1.5429,
16
- "eval_samples_per_second": 1055.797,
17
- "eval_steps_per_second": 66.109,
18
  "step": 367
19
  },
20
  {
21
  "epoch": 1.3623978201634879,
22
- "grad_norm": 9.666861534118652,
23
- "learning_rate": 1.831949194907621e-05,
24
- "loss": 0.5034,
25
  "step": 500
26
  },
27
  {
28
  "epoch": 2.0,
29
- "eval_accuracy": 0.861878453038674,
30
- "eval_loss": 0.5616857409477234,
31
- "eval_runtime": 1.528,
32
- "eval_samples_per_second": 1066.087,
33
- "eval_steps_per_second": 66.753,
34
  "step": 734
35
  },
36
  {
37
  "epoch": 2.7247956403269757,
38
- "grad_norm": 0.05537036433815956,
39
- "learning_rate": 1.1458259009347293e-05,
40
- "loss": 0.3057,
41
  "step": 1000
42
  },
43
  {
44
  "epoch": 3.0,
45
- "eval_accuracy": 0.8575813382443217,
46
- "eval_loss": 0.6872314810752869,
47
- "eval_runtime": 1.521,
48
- "eval_samples_per_second": 1070.983,
49
- "eval_steps_per_second": 67.06,
50
  "step": 1101
51
  }
52
  ],
53
  "logging_steps": 500,
54
- "max_steps": 1835,
55
  "num_input_tokens_seen": 0,
56
- "num_train_epochs": 5,
57
  "save_steps": 500,
58
  "stateful_callbacks": {
59
  "TrainerControl": {
@@ -62,18 +62,18 @@
62
  "should_evaluate": false,
63
  "should_log": false,
64
  "should_save": true,
65
- "should_training_stop": false
66
  },
67
  "attributes": {}
68
  }
69
  },
70
- "total_flos": 81016621722120.0,
71
  "train_batch_size": 4,
72
  "trial_name": null,
73
  "trial_params": {
74
- "learning_rate": 2.518072488880513e-05,
75
- "num_train_epochs": 5,
76
  "per_device_train_batch_size": 4,
77
- "seed": 4
78
  }
79
  }
 
1
  {
2
+ "best_metric": 0.8256599140577041,
3
+ "best_model_checkpoint": "BERTForDetectingDepression-Twitter2015/run-2/checkpoint-1101",
4
  "epoch": 3.0,
5
  "eval_steps": 500,
6
  "global_step": 1101,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_accuracy": 0.7808471454880295,
14
+ "eval_loss": 0.4515644609928131,
15
+ "eval_runtime": 1.6125,
16
+ "eval_samples_per_second": 1010.242,
17
+ "eval_steps_per_second": 63.256,
18
  "step": 367
19
  },
20
  {
21
  "epoch": 1.3623978201634879,
22
+ "grad_norm": 3.5979933738708496,
23
+ "learning_rate": 2.9911866451614284e-06,
24
+ "loss": 0.5208,
25
  "step": 500
26
  },
27
  {
28
  "epoch": 2.0,
29
+ "eval_accuracy": 0.8066298342541437,
30
+ "eval_loss": 0.448224276304245,
31
+ "eval_runtime": 1.6212,
32
+ "eval_samples_per_second": 1004.815,
33
+ "eval_steps_per_second": 62.917,
34
  "step": 734
35
  },
36
  {
37
  "epoch": 2.7247956403269757,
38
+ "grad_norm": 4.29625940322876,
39
+ "learning_rate": 5.026786209006726e-07,
40
+ "loss": 0.325,
41
  "step": 1000
42
  },
43
  {
44
  "epoch": 3.0,
45
+ "eval_accuracy": 0.8256599140577041,
46
+ "eval_loss": 0.4320577085018158,
47
+ "eval_runtime": 1.678,
48
+ "eval_samples_per_second": 970.776,
49
+ "eval_steps_per_second": 60.785,
50
  "step": 1101
51
  }
52
  ],
53
  "logging_steps": 500,
54
+ "max_steps": 1101,
55
  "num_input_tokens_seen": 0,
56
+ "num_train_epochs": 3,
57
  "save_steps": 500,
58
  "stateful_callbacks": {
59
  "TrainerControl": {
 
62
  "should_evaluate": false,
63
  "should_log": false,
64
  "should_save": true,
65
+ "should_training_stop": true
66
  },
67
  "attributes": {}
68
  }
69
  },
70
+ "total_flos": 90217286439240.0,
71
  "train_batch_size": 4,
72
  "trial_name": null,
73
  "trial_params": {
74
+ "learning_rate": 5.479694669422184e-06,
75
+ "num_train_epochs": 3,
76
  "per_device_train_batch_size": 4,
77
+ "seed": 23
78
  }
79
  }
run-2/checkpoint-1101/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b3af0b514cbeb65fed5983531cf5e1fc2aae93ff3c4176583420eb7605bc7fb0
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebd0369de99427537c423d0dcd390a5465d1461d045302bfffcb8614bb9235cc
3
  size 5176
run-2/checkpoint-1101/vocab.txt CHANGED
The diff for this file is too large to render. See raw diff
 
run-2/checkpoint-734/config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "google-bert/bert-base-uncased",
3
  "architectures": [
4
  "BertForSequenceClassification"
5
  ],
@@ -23,5 +23,5 @@
23
  "transformers_version": "4.42.4",
24
  "type_vocab_size": 2,
25
  "use_cache": true,
26
- "vocab_size": 30522
27
  }
 
1
  {
2
+ "_name_or_path": "AIMH/mental-bert-base-cased",
3
  "architectures": [
4
  "BertForSequenceClassification"
5
  ],
 
23
  "transformers_version": "4.42.4",
24
  "type_vocab_size": 2,
25
  "use_cache": true,
26
+ "vocab_size": 28996
27
  }
run-2/checkpoint-734/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:16836ad2bed7e1c06c29ab9c278ea0801ebece4460836e1f4a03eeb6dcadf70b
3
- size 437958648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22de66c13813794a8111aa89a923c1d57e9437dbd057535fe4d3bbc6ce22b39f
3
+ size 433270768
run-2/checkpoint-734/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d2951dc23e785ac921ccd98c3cfea9770023d11ffb4c2af318f973dd2610a452
3
- size 876038394
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6140149df5f589df3e3669009c769099a8006618fa3a6e91c1a1b4891cd5abb7
3
+ size 866662650
run-2/checkpoint-734/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b878d34a0236f2e6d5b32621550cff1a52197ba912466b784bfa5f7f8b32056f
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c39c2ac1c613684f4984d47e60b07a0f89176826248f03f52a9539dd84aa196
3
  size 14244
run-2/checkpoint-734/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ddbeda33f6d7c4029fa8fca87e9c1c94c8a03667a2ebe8e9ab9c63b2250fb03
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3ab0ad8872c70c5a562dd2d5915ea3f7511b921e537935b427e8eb886434452
3
  size 1064
run-2/checkpoint-734/special_tokens_map.json CHANGED
@@ -1,7 +1,37 @@
1
  {
2
- "cls_token": "[CLS]",
3
- "mask_token": "[MASK]",
4
- "pad_token": "[PAD]",
5
- "sep_token": "[SEP]",
6
- "unk_token": "[UNK]"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7
  }
 
1
  {
2
+ "cls_token": {
3
+ "content": "[CLS]",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "mask_token": {
10
+ "content": "[MASK]",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "[PAD]",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "sep_token": {
24
+ "content": "[SEP]",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "unk_token": {
31
+ "content": "[UNK]",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ }
37
  }
run-2/checkpoint-734/tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
run-2/checkpoint-734/tokenizer_config.json CHANGED
@@ -43,13 +43,17 @@
43
  },
44
  "clean_up_tokenization_spaces": true,
45
  "cls_token": "[CLS]",
46
- "do_lower_case": true,
47
  "mask_token": "[MASK]",
 
48
  "model_max_length": 512,
49
  "pad_token": "[PAD]",
50
  "sep_token": "[SEP]",
 
51
  "strip_accents": null,
52
  "tokenize_chinese_chars": true,
53
  "tokenizer_class": "BertTokenizer",
 
 
54
  "unk_token": "[UNK]"
55
  }
 
43
  },
44
  "clean_up_tokenization_spaces": true,
45
  "cls_token": "[CLS]",
46
+ "do_lower_case": false,
47
  "mask_token": "[MASK]",
48
+ "max_length": 512,
49
  "model_max_length": 512,
50
  "pad_token": "[PAD]",
51
  "sep_token": "[SEP]",
52
+ "stride": 0,
53
  "strip_accents": null,
54
  "tokenize_chinese_chars": true,
55
  "tokenizer_class": "BertTokenizer",
56
+ "truncation_side": "right",
57
+ "truncation_strategy": "longest_first",
58
  "unk_token": "[UNK]"
59
  }
run-2/checkpoint-734/trainer_state.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "best_metric": 0.861878453038674,
3
  "best_model_checkpoint": "BERTForDetectingDepression-Twitter2015/run-2/checkpoint-734",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
@@ -10,34 +10,34 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_accuracy": 0.8207489257213014,
14
- "eval_loss": 0.41005730628967285,
15
- "eval_runtime": 1.5429,
16
- "eval_samples_per_second": 1055.797,
17
- "eval_steps_per_second": 66.109,
18
  "step": 367
19
  },
20
  {
21
  "epoch": 1.3623978201634879,
22
- "grad_norm": 9.666861534118652,
23
- "learning_rate": 1.831949194907621e-05,
24
- "loss": 0.5034,
25
  "step": 500
26
  },
27
  {
28
  "epoch": 2.0,
29
- "eval_accuracy": 0.861878453038674,
30
- "eval_loss": 0.5616857409477234,
31
- "eval_runtime": 1.528,
32
- "eval_samples_per_second": 1066.087,
33
- "eval_steps_per_second": 66.753,
34
  "step": 734
35
  }
36
  ],
37
  "logging_steps": 500,
38
- "max_steps": 1835,
39
  "num_input_tokens_seen": 0,
40
- "num_train_epochs": 5,
41
  "save_steps": 500,
42
  "stateful_callbacks": {
43
  "TrainerControl": {
@@ -51,13 +51,13 @@
51
  "attributes": {}
52
  }
53
  },
54
- "total_flos": 40395769218240.0,
55
  "train_batch_size": 4,
56
  "trial_name": null,
57
  "trial_params": {
58
- "learning_rate": 2.518072488880513e-05,
59
- "num_train_epochs": 5,
60
  "per_device_train_batch_size": 4,
61
- "seed": 4
62
  }
63
  }
 
1
  {
2
+ "best_metric": 0.8066298342541437,
3
  "best_model_checkpoint": "BERTForDetectingDepression-Twitter2015/run-2/checkpoint-734",
4
  "epoch": 2.0,
5
  "eval_steps": 500,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_accuracy": 0.7808471454880295,
14
+ "eval_loss": 0.4515644609928131,
15
+ "eval_runtime": 1.6125,
16
+ "eval_samples_per_second": 1010.242,
17
+ "eval_steps_per_second": 63.256,
18
  "step": 367
19
  },
20
  {
21
  "epoch": 1.3623978201634879,
22
+ "grad_norm": 3.5979933738708496,
23
+ "learning_rate": 2.9911866451614284e-06,
24
+ "loss": 0.5208,
25
  "step": 500
26
  },
27
  {
28
  "epoch": 2.0,
29
+ "eval_accuracy": 0.8066298342541437,
30
+ "eval_loss": 0.448224276304245,
31
+ "eval_runtime": 1.6212,
32
+ "eval_samples_per_second": 1004.815,
33
+ "eval_steps_per_second": 62.917,
34
  "step": 734
35
  }
36
  ],
37
  "logging_steps": 500,
38
+ "max_steps": 1101,
39
  "num_input_tokens_seen": 0,
40
+ "num_train_epochs": 3,
41
  "save_steps": 500,
42
  "stateful_callbacks": {
43
  "TrainerControl": {
 
51
  "attributes": {}
52
  }
53
  },
54
+ "total_flos": 45391795937400.0,
55
  "train_batch_size": 4,
56
  "trial_name": null,
57
  "trial_params": {
58
+ "learning_rate": 5.479694669422184e-06,
59
+ "num_train_epochs": 3,
60
  "per_device_train_batch_size": 4,
61
+ "seed": 23
62
  }
63
  }
run-2/checkpoint-734/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b3af0b514cbeb65fed5983531cf5e1fc2aae93ff3c4176583420eb7605bc7fb0
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebd0369de99427537c423d0dcd390a5465d1461d045302bfffcb8614bb9235cc
3
  size 5176
run-2/checkpoint-734/vocab.txt CHANGED
The diff for this file is too large to render. See raw diff
 
run-3/checkpoint-184/config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "AIMH/mental-bert-base-cased",
3
+ "architectures": [
4
+ "BertForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "gradient_checkpointing": false,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 768,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 3072,
14
+ "layer_norm_eps": 1e-12,
15
+ "max_position_embeddings": 512,
16
+ "model_type": "bert",
17
+ "num_attention_heads": 12,
18
+ "num_hidden_layers": 12,
19
+ "pad_token_id": 0,
20
+ "position_embedding_type": "absolute",
21
+ "problem_type": "single_label_classification",
22
+ "torch_dtype": "float32",
23
+ "transformers_version": "4.42.4",
24
+ "type_vocab_size": 2,
25
+ "use_cache": true,
26
+ "vocab_size": 28996
27
+ }
run-3/checkpoint-184/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:390b87a07ea0f9d6a4d87537c546b85c20c7024933ff57eb2812b09c2682daad
3
+ size 433270768
run-3/checkpoint-184/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b24fdf61dfde76f8c765621c48bb88cb407a2f76018dfe8bc773783315b77ed8
3
+ size 866662650
run-3/checkpoint-184/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:681ec4e61374fa9e2aab11d316c063600df1f5046025c108beada34b2dff2d47
3
+ size 14244
run-3/checkpoint-184/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd64a2b79ba8923b1e6ed89d8956bba3c4abe9090f3931e4252c9fb7fcfdce95
3
+ size 1064
run-3/checkpoint-184/special_tokens_map.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": {
3
+ "content": "[CLS]",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "mask_token": {
10
+ "content": "[MASK]",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": {
17
+ "content": "[PAD]",
18
+ "lstrip": false,
19
+ "normalized": false,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
+ "sep_token": {
24
+ "content": "[SEP]",
25
+ "lstrip": false,
26
+ "normalized": false,
27
+ "rstrip": false,
28
+ "single_word": false
29
+ },
30
+ "unk_token": {
31
+ "content": "[UNK]",
32
+ "lstrip": false,
33
+ "normalized": false,
34
+ "rstrip": false,
35
+ "single_word": false
36
+ }
37
+ }
run-3/checkpoint-184/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
run-3/checkpoint-184/tokenizer_config.json ADDED
@@ -0,0 +1,59 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "100": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "101": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "102": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "103": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "clean_up_tokenization_spaces": true,
45
+ "cls_token": "[CLS]",
46
+ "do_lower_case": false,
47
+ "mask_token": "[MASK]",
48
+ "max_length": 512,
49
+ "model_max_length": 512,
50
+ "pad_token": "[PAD]",
51
+ "sep_token": "[SEP]",
52
+ "stride": 0,
53
+ "strip_accents": null,
54
+ "tokenize_chinese_chars": true,
55
+ "tokenizer_class": "BertTokenizer",
56
+ "truncation_side": "right",
57
+ "truncation_strategy": "longest_first",
58
+ "unk_token": "[UNK]"
59
+ }
run-3/checkpoint-184/trainer_state.json ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.8465316144874155,
3
+ "best_model_checkpoint": "BERTForDetectingDepression-Twitter2015/run-3/checkpoint-184",
4
+ "epoch": 1.0,
5
+ "eval_steps": 500,
6
+ "global_step": 184,
7
+ "is_hyper_param_search": true,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 1.0,
13
+ "eval_accuracy": 0.8465316144874155,
14
+ "eval_loss": 0.4355960190296173,
15
+ "eval_runtime": 1.6102,
16
+ "eval_samples_per_second": 1011.674,
17
+ "eval_steps_per_second": 63.346,
18
+ "step": 184
19
+ }
20
+ ],
21
+ "logging_steps": 500,
22
+ "max_steps": 368,
23
+ "num_input_tokens_seen": 0,
24
+ "num_train_epochs": 2,
25
+ "save_steps": 500,
26
+ "stateful_callbacks": {
27
+ "TrainerControl": {
28
+ "args": {
29
+ "should_epoch_stop": false,
30
+ "should_evaluate": false,
31
+ "should_log": false,
32
+ "should_save": true,
33
+ "should_training_stop": false
34
+ },
35
+ "attributes": {}
36
+ }
37
+ },
38
+ "total_flos": 0,
39
+ "train_batch_size": 8,
40
+ "trial_name": null,
41
+ "trial_params": {
42
+ "learning_rate": 9.899372834750846e-05,
43
+ "num_train_epochs": 2,
44
+ "per_device_train_batch_size": 8,
45
+ "seed": 35
46
+ }
47
+ }
run-3/checkpoint-184/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24e46e8eb76ff9978b97b6569c3ac0be7c5dc09979dbba62178dbf785d19e67c
3
+ size 5176
run-3/checkpoint-184/vocab.txt ADDED
The diff for this file is too large to render. See raw diff
 
runs/Aug01_14-25-19_1d376fbba8fb/events.out.tfevents.1722522793.1d376fbba8fb.12065.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f8a2ed30a8a9722b0d9f5f4d492153d65867329454e353ef638efc271abd324
3
+ size 5948
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ebd0369de99427537c423d0dcd390a5465d1461d045302bfffcb8614bb9235cc
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24e46e8eb76ff9978b97b6569c3ac0be7c5dc09979dbba62178dbf785d19e67c
3
  size 5176