Silicon23 committed on Aug 2, 2024

Commit

2df4513

verified ·

1 Parent(s): 29c2df1

Training in progress, epoch 1

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

model.safetensors +1 -1
run-0/checkpoint-138/config.json +27 -0
run-0/checkpoint-138/model.safetensors +3 -0
run-0/checkpoint-138/optimizer.pt +3 -0
run-0/checkpoint-138/rng_state.pth +3 -0
run-0/checkpoint-138/scheduler.pt +3 -0
run-0/checkpoint-138/special_tokens_map.json +7 -0
run-0/checkpoint-138/tokenizer.json +0 -0
run-0/checkpoint-138/tokenizer_config.json +55 -0
run-0/checkpoint-138/trainer_state.json +65 -0
run-0/checkpoint-138/training_args.bin +3 -0
run-0/checkpoint-138/vocab.txt +0 -0
run-0/checkpoint-92/config.json +27 -0
run-0/checkpoint-92/model.safetensors +3 -0
run-0/checkpoint-92/optimizer.pt +3 -0
run-0/checkpoint-92/rng_state.pth +3 -0
run-0/checkpoint-92/scheduler.pt +3 -0
run-0/checkpoint-92/special_tokens_map.json +7 -0
run-0/checkpoint-92/tokenizer.json +0 -0
run-0/checkpoint-92/tokenizer_config.json +55 -0
run-0/checkpoint-92/trainer_state.json +56 -0
run-0/checkpoint-92/training_args.bin +3 -0
run-0/checkpoint-92/vocab.txt +0 -0
run-1/checkpoint-115/config.json +27 -0
run-1/checkpoint-115/model.safetensors +3 -0
run-1/checkpoint-115/optimizer.pt +3 -0
run-1/checkpoint-115/rng_state.pth +3 -0
run-1/checkpoint-115/scheduler.pt +3 -0
run-1/checkpoint-115/special_tokens_map.json +7 -0
run-1/checkpoint-115/tokenizer.json +0 -0
run-1/checkpoint-115/tokenizer_config.json +55 -0
run-1/checkpoint-115/trainer_state.json +83 -0
run-1/checkpoint-115/training_args.bin +3 -0
run-1/checkpoint-115/vocab.txt +0 -0
run-1/checkpoint-23/config.json +27 -0
run-1/checkpoint-23/model.safetensors +3 -0
run-1/checkpoint-23/optimizer.pt +3 -0
run-1/checkpoint-23/rng_state.pth +3 -0
run-1/checkpoint-23/scheduler.pt +3 -0
run-1/checkpoint-23/special_tokens_map.json +7 -0
run-1/checkpoint-23/tokenizer.json +0 -0
run-1/checkpoint-23/tokenizer_config.json +55 -0
run-1/checkpoint-23/trainer_state.json +47 -0
run-1/checkpoint-23/training_args.bin +3 -0
run-1/checkpoint-23/vocab.txt +0 -0
run-1/checkpoint-46/config.json +2 -2
run-1/checkpoint-46/model.safetensors +2 -2
run-1/checkpoint-46/optimizer.pt +2 -2
run-1/checkpoint-46/rng_state.pth +2 -2
run-1/checkpoint-46/scheduler.pt +1 -1

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f0950bccb6e8f42ff8aaf183690786f4f587f3e867be81f34f2e747546f1f694
 size 437958648

 version https://git-lfs.github.com/spec/v1
+oid sha256:e2a3600272e96e508d95cd7d0fd4b74d14a69bf837314e079cf130d77ecb3317
 size 437958648

run-0/checkpoint-138/config.json ADDED Viewed

	@@ -0,0 +1,27 @@

+{
+  "_name_or_path": "google-bert/bert-base-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.42.4",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

run-0/checkpoint-138/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5dbf8b7bb52b22fabaeff1fad1884fcb9fcbefc79c054ab5f513ba8dbb49de65
+size 437958648

run-0/checkpoint-138/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b512fd546f75ddfaacc16badd6b502b618262232831aa7635939d990df20c4cf
+size 876038394

run-0/checkpoint-138/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2e8ecd154d55702ed68fc41ceef15cb10a21893a89828613680e414311fa1854
+size 14308

run-0/checkpoint-138/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4029d4852946489c5a724dd947a32439cf547712bf02327b54e8f09e18d217ad
+size 1064

run-0/checkpoint-138/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-0/checkpoint-138/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-0/checkpoint-138/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

run-0/checkpoint-138/trainer_state.json ADDED Viewed

	@@ -0,0 +1,65 @@

+{
+  "best_metric": 0.6789441375076735,
+  "best_model_checkpoint": "BERTForDetectingDepression-Twitter2015/run-0/checkpoint-138",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 138,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.6187845303867403,
+      "eval_loss": 0.677045464515686,
+      "eval_runtime": 1.5174,
+      "eval_samples_per_second": 1073.531,
+      "eval_steps_per_second": 67.219,
+      "step": 46
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.6642111724984653,
+      "eval_loss": 0.6484399437904358,
+      "eval_runtime": 1.475,
+      "eval_samples_per_second": 1104.382,
+      "eval_steps_per_second": 69.151,
+      "step": 92
+    },
+    {
+      "epoch": 3.0,
+      "eval_accuracy": 0.6789441375076735,
+      "eval_loss": 0.6311272978782654,
+      "eval_runtime": 1.5486,
+      "eval_samples_per_second": 1051.891,
+      "eval_steps_per_second": 65.864,
+      "step": 138
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 138,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 2.2663564697926915e-06,
+    "num_train_epochs": 3,
+    "per_device_train_batch_size": 32,
+    "seed": 14
+  }
+}

run-0/checkpoint-138/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:837929207f0b87e3e725511aaedbea183a5274d57f3b1b522598d3b04a5f07f3
+size 5176

run-0/checkpoint-138/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-0/checkpoint-92/config.json ADDED Viewed

	@@ -0,0 +1,27 @@

+{
+  "_name_or_path": "google-bert/bert-base-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.42.4",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

run-0/checkpoint-92/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:026ee48e0cf3df0d2bef65cc3c1807d8cafaa676d2d85937b5cd5364ee373b86
+size 437958648

run-0/checkpoint-92/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e0192798ed32647f48c44b20c85c5f19a33c6aea50695de9147cd29e9f60a5d7
+size 876038394

run-0/checkpoint-92/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7fb4e9720d55f98334341af4c3b61159260bbef267c474db89d3c3c8dea14f5a
+size 14308

run-0/checkpoint-92/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f1e80f81925f9d805c8ec1205135b1649c03f930eaa068b7b25681ba2bfc6fa6
+size 1064

run-0/checkpoint-92/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-0/checkpoint-92/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-0/checkpoint-92/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

run-0/checkpoint-92/trainer_state.json ADDED Viewed

	@@ -0,0 +1,56 @@

+{
+  "best_metric": 0.6642111724984653,
+  "best_model_checkpoint": "BERTForDetectingDepression-Twitter2015/run-0/checkpoint-92",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 92,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.6187845303867403,
+      "eval_loss": 0.677045464515686,
+      "eval_runtime": 1.5174,
+      "eval_samples_per_second": 1073.531,
+      "eval_steps_per_second": 67.219,
+      "step": 46
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.6642111724984653,
+      "eval_loss": 0.6484399437904358,
+      "eval_runtime": 1.475,
+      "eval_samples_per_second": 1104.382,
+      "eval_steps_per_second": 69.151,
+      "step": 92
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 138,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 0,
+  "train_batch_size": 32,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 2.2663564697926915e-06,
+    "num_train_epochs": 3,
+    "per_device_train_batch_size": 32,
+    "seed": 14
+  }
+}

run-0/checkpoint-92/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:837929207f0b87e3e725511aaedbea183a5274d57f3b1b522598d3b04a5f07f3
+size 5176

run-0/checkpoint-92/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-1/checkpoint-115/config.json ADDED Viewed

	@@ -0,0 +1,27 @@

+{
+  "_name_or_path": "google-bert/bert-base-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.42.4",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

run-1/checkpoint-115/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c5e6fc5fe1da3684a3a006ea683bb96ed5863b38fdd49e6442c434ae74cf24da
+size 437958648

run-1/checkpoint-115/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0d0c1124a2903d09bbce354ea2ac2b170be98000e57d38e53fa95efd3dd81ebb
+size 876038394

run-1/checkpoint-115/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2ee419a7bbda5a4c1c2e5021a889b682984c20c35dcb9baf6728157769e86872
+size 14308

run-1/checkpoint-115/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a2c2df8857b6a5107644eba751f3ebd133f3275664b8e32d47687421b2a44b08
+size 1064

run-1/checkpoint-115/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-1/checkpoint-115/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-1/checkpoint-115/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

run-1/checkpoint-115/trainer_state.json ADDED Viewed

	@@ -0,0 +1,83 @@

+{
+  "best_metric": 0.761817065684469,
+  "best_model_checkpoint": "BERTForDetectingDepression-Twitter2015/run-1/checkpoint-115",
+  "epoch": 5.0,
+  "eval_steps": 500,
+  "global_step": 115,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.6642111724984653,
+      "eval_loss": 0.6271333694458008,
+      "eval_runtime": 1.4666,
+      "eval_samples_per_second": 1110.761,
+      "eval_steps_per_second": 69.55,
+      "step": 23
+    },
+    {
+      "epoch": 2.0,
+      "eval_accuracy": 0.7188459177409454,
+      "eval_loss": 0.5219240784645081,
+      "eval_runtime": 1.5,
+      "eval_samples_per_second": 1085.998,
+      "eval_steps_per_second": 68.0,
+      "step": 46
+    },
+    {
+      "epoch": 3.0,
+      "eval_accuracy": 0.7415592387968079,
+      "eval_loss": 0.47888997197151184,
+      "eval_runtime": 1.4904,
+      "eval_samples_per_second": 1092.984,
+      "eval_steps_per_second": 68.437,
+      "step": 69
+    },
+    {
+      "epoch": 4.0,
+      "eval_accuracy": 0.7483118477593615,
+      "eval_loss": 0.4670851230621338,
+      "eval_runtime": 1.5143,
+      "eval_samples_per_second": 1075.722,
+      "eval_steps_per_second": 67.356,
+      "step": 92
+    },
+    {
+      "epoch": 5.0,
+      "eval_accuracy": 0.761817065684469,
+      "eval_loss": 0.4600331485271454,
+      "eval_runtime": 1.5741,
+      "eval_samples_per_second": 1034.87,
+      "eval_steps_per_second": 64.799,
+      "step": 115
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 115,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 6.9782836266139365e-06,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 64,
+    "seed": 14
+  }
+}

run-1/checkpoint-115/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1fc052e058e0609700f4d71cef9b05f3a649bb73e2cb1fa9b826998feb955cce
+size 5176

run-1/checkpoint-115/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-1/checkpoint-23/config.json ADDED Viewed

	@@ -0,0 +1,27 @@

+{
+  "_name_or_path": "google-bert/bert-base-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.42.4",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

run-1/checkpoint-23/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3dc1d1256baafc947da02e08de244f6ef734bb9d040a77a53b980f908f3b01ea
+size 437958648

run-1/checkpoint-23/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:55ebe142b0f28c27a4b17f530c60b6118539865507e1bb9be63fdfb09428dd7c
+size 876038394

run-1/checkpoint-23/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8adece8090459f26eab2fc804d4ef31922b8e56c6cf9a7588bab1f0364f48b33
+size 14308

run-1/checkpoint-23/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ee95a1c37f8ac4d9c53fe171baff3651d7f3b83675dbd8ad69cca835ca30f34b
+size 1064

run-1/checkpoint-23/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-1/checkpoint-23/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-1/checkpoint-23/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

run-1/checkpoint-23/trainer_state.json ADDED Viewed

	@@ -0,0 +1,47 @@

+{
+  "best_metric": 0.6642111724984653,
+  "best_model_checkpoint": "BERTForDetectingDepression-Twitter2015/run-1/checkpoint-23",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 23,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_accuracy": 0.6642111724984653,
+      "eval_loss": 0.6271333694458008,
+      "eval_runtime": 1.4666,
+      "eval_samples_per_second": 1110.761,
+      "eval_steps_per_second": 69.55,
+      "step": 23
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 115,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 6.9782836266139365e-06,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 64,
+    "seed": 14
+  }
+}

run-1/checkpoint-23/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1fc052e058e0609700f4d71cef9b05f3a649bb73e2cb1fa9b826998feb955cce
+size 5176

run-1/checkpoint-23/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-1/checkpoint-46/config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "AIMH/mental-bert-base-cased",
   "architectures": [
     "BertForSequenceClassification"
   ],
@@ -23,5 +23,5 @@
   "transformers_version": "4.42.4",
   "type_vocab_size": 2,
   "use_cache": true,
-  "vocab_size": 28996
 }

 {
+  "_name_or_path": "google-bert/bert-base-uncased",
   "architectures": [
     "BertForSequenceClassification"
   ],
   "transformers_version": "4.42.4",
   "type_vocab_size": 2,
   "use_cache": true,
+  "vocab_size": 30522
 }

run-1/checkpoint-46/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dc917e584973edc749cf694c1228f611a6882a562c84dfbe1aff346e9cb16bcd
-size 433270768

 version https://git-lfs.github.com/spec/v1
+oid sha256:4163412194623739457773b30f405c0e8b5f6414abe78bf60a38bd8cea092426
+size 437958648

run-1/checkpoint-46/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b2f2217fb0fcd8060d966470a3c91c46cc7bf5c372277d447ed5fb517e2b69e0
-size 866662650

 version https://git-lfs.github.com/spec/v1
+oid sha256:c7e533af6af1ce210e1fb52cf9ead6151c788ddd91459e191fbcf345fd9f02a9
+size 876038394

run-1/checkpoint-46/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3741068fe73763fea3a5f64541b64a384c4ecbb4560207f9ece1de7c171e503e
-size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:6908d76e4b94598f7d7d295f3110d78f44327859ae99e6f608f73aa224224364
+size 14308

run-1/checkpoint-46/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0773ccd18bf9c6a00d48af6c1c6112e2af9a5be3524a5aa8341b6fa206346db9
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:e2e6c1efd917b07685110ab129135faf25a14970b3e6d6b6e96f57377e6f487f
 size 1064