Silicon23 committed on
Commit
6793279
·
verified ·
1 Parent(s): 4d7ecca

Training in progress, epoch 1

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:704ef4bcd8ea60bbc53294ab7df6ba3b1e6831e8ce251571ce2b56c4a1de6259
3
  size 437958648
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3acc66ee228a8fbaec1ea30a8cc721d05dae8b55d25d5c9b87dff31e5fa8b625
3
  size 437958648
run-3/checkpoint-184/config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "AIMH/mental-bert-base-cased",
3
  "architectures": [
4
  "BertForSequenceClassification"
5
  ],
@@ -23,5 +23,5 @@
23
  "transformers_version": "4.42.4",
24
  "type_vocab_size": 2,
25
  "use_cache": true,
26
- "vocab_size": 28996
27
  }
 
1
  {
2
+ "_name_or_path": "google-bert/bert-base-uncased",
3
  "architectures": [
4
  "BertForSequenceClassification"
5
  ],
 
23
  "transformers_version": "4.42.4",
24
  "type_vocab_size": 2,
25
  "use_cache": true,
26
+ "vocab_size": 30522
27
  }
run-3/checkpoint-184/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:390b87a07ea0f9d6a4d87537c546b85c20c7024933ff57eb2812b09c2682daad
3
- size 433270768
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5dd2efb9eeb705ea8b16b5da79358c1da34cf3a2882fd7eb9b8c9c9d434e92f
3
+ size 437958648
run-3/checkpoint-184/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b24fdf61dfde76f8c765621c48bb88cb407a2f76018dfe8bc773783315b77ed8
3
- size 866662650
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24c2b27b2223fd37b2fa33684f10cc9d3177ca08579859056399040a6095f444
3
+ size 876038394
run-3/checkpoint-184/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:681ec4e61374fa9e2aab11d316c063600df1f5046025c108beada34b2dff2d47
3
- size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:077a14d29ff2d9c856ffdd614b5eef79bea88d73063d9977a539a6dc593de297
3
+ size 14308
run-3/checkpoint-184/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bd64a2b79ba8923b1e6ed89d8956bba3c4abe9090f3931e4252c9fb7fcfdce95
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e904389b286fdd080046e19448f588d09db351c91af423321259880cd786278e
3
  size 1064
run-3/checkpoint-184/special_tokens_map.json CHANGED
@@ -1,37 +1,7 @@
1
  {
2
- "cls_token": {
3
- "content": "[CLS]",
4
- "lstrip": false,
5
- "normalized": false,
6
- "rstrip": false,
7
- "single_word": false
8
- },
9
- "mask_token": {
10
- "content": "[MASK]",
11
- "lstrip": false,
12
- "normalized": false,
13
- "rstrip": false,
14
- "single_word": false
15
- },
16
- "pad_token": {
17
- "content": "[PAD]",
18
- "lstrip": false,
19
- "normalized": false,
20
- "rstrip": false,
21
- "single_word": false
22
- },
23
- "sep_token": {
24
- "content": "[SEP]",
25
- "lstrip": false,
26
- "normalized": false,
27
- "rstrip": false,
28
- "single_word": false
29
- },
30
- "unk_token": {
31
- "content": "[UNK]",
32
- "lstrip": false,
33
- "normalized": false,
34
- "rstrip": false,
35
- "single_word": false
36
- }
37
  }
 
1
  {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7
  }
run-3/checkpoint-184/tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
run-3/checkpoint-184/tokenizer_config.json CHANGED
@@ -43,17 +43,13 @@
43
  },
44
  "clean_up_tokenization_spaces": true,
45
  "cls_token": "[CLS]",
46
- "do_lower_case": false,
47
  "mask_token": "[MASK]",
48
- "max_length": 512,
49
  "model_max_length": 512,
50
  "pad_token": "[PAD]",
51
  "sep_token": "[SEP]",
52
- "stride": 0,
53
  "strip_accents": null,
54
  "tokenize_chinese_chars": true,
55
  "tokenizer_class": "BertTokenizer",
56
- "truncation_side": "right",
57
- "truncation_strategy": "longest_first",
58
  "unk_token": "[UNK]"
59
  }
 
43
  },
44
  "clean_up_tokenization_spaces": true,
45
  "cls_token": "[CLS]",
46
+ "do_lower_case": true,
47
  "mask_token": "[MASK]",
 
48
  "model_max_length": 512,
49
  "pad_token": "[PAD]",
50
  "sep_token": "[SEP]",
 
51
  "strip_accents": null,
52
  "tokenize_chinese_chars": true,
53
  "tokenizer_class": "BertTokenizer",
 
 
54
  "unk_token": "[UNK]"
55
  }
run-3/checkpoint-184/trainer_state.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "best_metric": 0.8465316144874155,
3
  "best_model_checkpoint": "BERTForDetectingDepression-Twitter2015/run-3/checkpoint-184",
4
- "epoch": 1.0,
5
  "eval_steps": 500,
6
  "global_step": 184,
7
  "is_hyper_param_search": true,
@@ -10,16 +10,25 @@
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
- "eval_accuracy": 0.8465316144874155,
14
- "eval_loss": 0.4355960190296173,
15
- "eval_runtime": 1.6102,
16
- "eval_samples_per_second": 1011.674,
17
- "eval_steps_per_second": 63.346,
 
 
 
 
 
 
 
 
 
18
  "step": 184
19
  }
20
  ],
21
  "logging_steps": 500,
22
- "max_steps": 368,
23
  "num_input_tokens_seen": 0,
24
  "num_train_epochs": 2,
25
  "save_steps": 500,
@@ -30,18 +39,18 @@
30
  "should_evaluate": false,
31
  "should_log": false,
32
  "should_save": true,
33
- "should_training_stop": false
34
  },
35
  "attributes": {}
36
  }
37
  },
38
  "total_flos": 0,
39
- "train_batch_size": 8,
40
  "trial_name": null,
41
  "trial_params": {
42
- "learning_rate": 9.899372834750846e-05,
43
  "num_train_epochs": 2,
44
- "per_device_train_batch_size": 8,
45
- "seed": 35
46
  }
47
  }
 
1
  {
2
+ "best_metric": 0.7796193984039288,
3
  "best_model_checkpoint": "BERTForDetectingDepression-Twitter2015/run-3/checkpoint-184",
4
+ "epoch": 2.0,
5
  "eval_steps": 500,
6
  "global_step": 184,
7
  "is_hyper_param_search": true,
 
10
  "log_history": [
11
  {
12
  "epoch": 1.0,
13
+ "eval_accuracy": 0.7630448127685697,
14
+ "eval_loss": 0.46627277135849,
15
+ "eval_runtime": 1.4592,
16
+ "eval_samples_per_second": 1116.36,
17
+ "eval_steps_per_second": 69.901,
18
+ "step": 92
19
+ },
20
+ {
21
+ "epoch": 2.0,
22
+ "eval_accuracy": 0.7796193984039288,
23
+ "eval_loss": 0.4434141218662262,
24
+ "eval_runtime": 1.5862,
25
+ "eval_samples_per_second": 1026.96,
26
+ "eval_steps_per_second": 64.303,
27
  "step": 184
28
  }
29
  ],
30
  "logging_steps": 500,
31
+ "max_steps": 184,
32
  "num_input_tokens_seen": 0,
33
  "num_train_epochs": 2,
34
  "save_steps": 500,
 
39
  "should_evaluate": false,
40
  "should_log": false,
41
  "should_save": true,
42
+ "should_training_stop": true
43
  },
44
  "attributes": {}
45
  }
46
  },
47
  "total_flos": 0,
48
+ "train_batch_size": 16,
49
  "trial_name": null,
50
  "trial_params": {
51
+ "learning_rate": 2.159233393188895e-05,
52
  "num_train_epochs": 2,
53
+ "per_device_train_batch_size": 16,
54
+ "seed": 21
55
  }
56
  }
run-3/checkpoint-184/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24e46e8eb76ff9978b97b6569c3ac0be7c5dc09979dbba62178dbf785d19e67c
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0791269d577f31b2938387964641e880ef29f7b001df66e39e8233adc4c9474
3
  size 5176
run-3/checkpoint-184/vocab.txt CHANGED
The diff for this file is too large to render. See raw diff
 
run-4/checkpoint-23/config.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "google-bert/bert-base-uncased",
3
+ "architectures": [
4
+ "BertForSequenceClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "classifier_dropout": null,
8
+ "gradient_checkpointing": false,
9
+ "hidden_act": "gelu",
10
+ "hidden_dropout_prob": 0.1,
11
+ "hidden_size": 768,
12
+ "initializer_range": 0.02,
13
+ "intermediate_size": 3072,
14
+ "layer_norm_eps": 1e-12,
15
+ "max_position_embeddings": 512,
16
+ "model_type": "bert",
17
+ "num_attention_heads": 12,
18
+ "num_hidden_layers": 12,
19
+ "pad_token_id": 0,
20
+ "position_embedding_type": "absolute",
21
+ "problem_type": "single_label_classification",
22
+ "torch_dtype": "float32",
23
+ "transformers_version": "4.42.4",
24
+ "type_vocab_size": 2,
25
+ "use_cache": true,
26
+ "vocab_size": 30522
27
+ }
run-4/checkpoint-23/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3acc66ee228a8fbaec1ea30a8cc721d05dae8b55d25d5c9b87dff31e5fa8b625
3
+ size 437958648
run-4/checkpoint-23/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a961d86fd5c541e3200b35dded450f82e4d2cba58a2359dfe098b3c027759450
3
+ size 876038394
run-4/checkpoint-23/rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6b5374b258a782a1c42464a3d348e037829ea94a82bd72abab9d1afc627506d
3
+ size 14244
run-4/checkpoint-23/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b77d79df43f49cd96a21a5d961fa56ca220a3195e3ffc35d77697df9dac9e4eb
3
+ size 1064
run-4/checkpoint-23/special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
run-4/checkpoint-23/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
run-4/checkpoint-23/tokenizer_config.json ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "100": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "101": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "102": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "103": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "clean_up_tokenization_spaces": true,
45
+ "cls_token": "[CLS]",
46
+ "do_lower_case": true,
47
+ "mask_token": "[MASK]",
48
+ "model_max_length": 512,
49
+ "pad_token": "[PAD]",
50
+ "sep_token": "[SEP]",
51
+ "strip_accents": null,
52
+ "tokenize_chinese_chars": true,
53
+ "tokenizer_class": "BertTokenizer",
54
+ "unk_token": "[UNK]"
55
+ }
run-4/checkpoint-23/trainer_state.json ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.5979128299570289,
3
+ "best_model_checkpoint": "BERTForDetectingDepression-Twitter2015/run-4/checkpoint-23",
4
+ "epoch": 1.0,
5
+ "eval_steps": 500,
6
+ "global_step": 23,
7
+ "is_hyper_param_search": true,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 1.0,
13
+ "eval_accuracy": 0.5979128299570289,
14
+ "eval_loss": 0.678537905216217,
15
+ "eval_runtime": 1.4893,
16
+ "eval_samples_per_second": 1093.811,
17
+ "eval_steps_per_second": 68.489,
18
+ "step": 23
19
+ }
20
+ ],
21
+ "logging_steps": 500,
22
+ "max_steps": 69,
23
+ "num_input_tokens_seen": 0,
24
+ "num_train_epochs": 3,
25
+ "save_steps": 500,
26
+ "stateful_callbacks": {
27
+ "TrainerControl": {
28
+ "args": {
29
+ "should_epoch_stop": false,
30
+ "should_evaluate": false,
31
+ "should_log": false,
32
+ "should_save": true,
33
+ "should_training_stop": false
34
+ },
35
+ "attributes": {}
36
+ }
37
+ },
38
+ "total_flos": 0,
39
+ "train_batch_size": 64,
40
+ "trial_name": null,
41
+ "trial_params": {
42
+ "learning_rate": 2.9236721941091785e-06,
43
+ "num_train_epochs": 3,
44
+ "per_device_train_batch_size": 64,
45
+ "seed": 12
46
+ }
47
+ }
run-4/checkpoint-23/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20e5d749933754adfcd491676d87575b65895093b05afc38cb0180cdd1806f56
3
+ size 5176
run-4/checkpoint-23/vocab.txt ADDED
The diff for this file is too large to render. See raw diff
 
runs/Aug02_03-09-56_8953887c6028/events.out.tfevents.1722568629.8953887c6028.1235.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e5cbcb06b43be72942d3502453a7046f18942f5900b2f60325164d701b9cde4
3
+ size 6223
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d0791269d577f31b2938387964641e880ef29f7b001df66e39e8233adc4c9474
3
  size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20e5d749933754adfcd491676d87575b65895093b05afc38cb0180cdd1806f56
3
  size 5176