End of training

Browse files

Files changed (4) hide show

README.md +16 -11
config.json +16 -33
model.safetensors +2 -2
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -6,20 +6,22 @@ tags:
 - generated_from_trainer
 metrics:
 - accuracy
 model-index:
-- name: results
   results: []
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 should probably proofread and complete it, then remove this comment. -->
-# results
 This model is a fine-tuned version of [monologg/koelectra-base-v3-discriminator](https://huggingface.co/monologg/koelectra-base-v3-discriminator) on an unspecified dataset (no dataset name was provided to the Trainer).
 It achieves the following results on the evaluation set:
-- Loss: 2.0903
-- Accuracy: 0.3669
 ## Model description
@@ -44,16 +46,19 @@ The following hyperparameters were used during training:
 - seed: 42
 - optimizer: AdamW, fused PyTorch implementation (`OptimizerNames.ADAMW_TORCH_FUSED`), with betas=(0.9, 0.999), epsilon=1e-08, and no additional optimizer arguments
 - lr_scheduler_type: linear
-- num_epochs: 4
 ### Training results
-| Training Loss | Epoch | Step | Validation Loss | Accuracy |
-|:-------------:|:-----:|:----:|:---------------:|:--------:|
-| 2.5615        | 1.0   | 1554 | 2.5777          | 0.1532   |
-| 2.3007        | 2.0   | 3108 | 2.3464          | 0.2561   |
-| 1.9241        | 3.0   | 4662 | 2.1408          | 0.3367   |
-| 1.6816        | 4.0   | 6216 | 2.0903          | 0.3669   |
 ### Framework versions

 - generated_from_trainer
 metrics:
 - accuracy
+- f1
 model-index:
+- name: MyMbti_classification_model
   results: []
 ---
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 should probably proofread and complete it, then remove this comment. -->
+# MyMbti_classification_model
 This model is a fine-tuned version of [monologg/koelectra-base-v3-discriminator](https://huggingface.co/monologg/koelectra-base-v3-discriminator) on an unspecified dataset (no dataset name was provided to the Trainer).
 It achieves the following results on the evaluation set:
+- Loss: 0.6564
+- Accuracy: 0.5676
+- F1: 0.6406
 ## Model description
 - seed: 42
 - optimizer: AdamW, fused PyTorch implementation (`OptimizerNames.ADAMW_TORCH_FUSED`), with betas=(0.9, 0.999), epsilon=1e-08, and no additional optimizer arguments
 - lr_scheduler_type: linear
+- num_epochs: 5
 ### Training results
+| Training Loss | Epoch  | Step | Validation Loss | Accuracy | F1     |
+|:-------------:|:------:|:----:|:---------------:|:--------:|:------:|
+| 0.6612        | 0.0669 | 200  | 0.6585          | 0.4970   | 0.4306 |
+| 0.6569        | 0.1339 | 400  | 0.6563          | 0.4951   | 0.4099 |
+| 0.6547        | 0.2008 | 600  | 0.6564          | 0.5676   | 0.6406 |
+| 0.653         | 0.2677 | 800  | 0.6533          | 0.5289   | 0.5172 |
+| 0.6554        | 0.3347 | 1000 | 0.6524          | 0.5400   | 0.5435 |
+| 0.6558        | 0.4016 | 1200 | 0.6552          | 0.5416   | 0.4878 |
+| 0.6516        | 0.4685 | 1400 | 0.6549          | 0.5438   | 0.4847 |
 ### Framework versions

config.json CHANGED Viewed

@@ -3,48 +3,30 @@
     "ElectraForSequenceClassification"
   ],
   "attention_probs_dropout_prob": 0.1,
   "classifier_dropout": null,
   "embedding_size": 768,
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 768,
   "id2label": {
-    "0": "LABEL_0",
-    "1": "LABEL_1",
-    "2": "LABEL_2",
-    "3": "LABEL_3",
-    "4": "LABEL_4",
-    "5": "LABEL_5",
-    "6": "LABEL_6",
-    "7": "LABEL_7",
-    "8": "LABEL_8",
-    "9": "LABEL_9",
-    "10": "LABEL_10",
-    "11": "LABEL_11",
-    "12": "LABEL_12",
-    "13": "LABEL_13",
-    "14": "LABEL_14",
-    "15": "LABEL_15"
   },
   "initializer_range": 0.02,
   "intermediate_size": 3072,
   "label2id": {
-    "LABEL_0": 0,
-    "LABEL_1": 1,
-    "LABEL_10": 10,
-    "LABEL_11": 11,
-    "LABEL_12": 12,
-    "LABEL_13": 13,
-    "LABEL_14": 14,
-    "LABEL_15": 15,
-    "LABEL_2": 2,
-    "LABEL_3": 3,
-    "LABEL_4": 4,
-    "LABEL_5": 5,
-    "LABEL_6": 6,
-    "LABEL_7": 7,
-    "LABEL_8": 8,
-    "LABEL_9": 9
   },
   "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,
@@ -53,11 +35,12 @@
   "num_hidden_layers": 12,
   "pad_token_id": 0,
   "position_embedding_type": "absolute",
-  "problem_type": "single_label_classification",
   "summary_activation": "gelu",
   "summary_last_dropout": 0.1,
   "summary_type": "first",
   "summary_use_proj": true,
   "torch_dtype": "float32",
   "transformers_version": "4.55.2",
   "type_vocab_size": 2,

     "ElectraForSequenceClassification"
   ],
   "attention_probs_dropout_prob": 0.1,
+  "axis_names": [
+    "IE",
+    "SN",
+    "TF",
+    "JP"
+  ],
   "classifier_dropout": null,
   "embedding_size": 768,
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 768,
   "id2label": {
+    "0": "IE",
+    "1": "SN",
+    "2": "TF",
+    "3": "JP"
   },
   "initializer_range": 0.02,
   "intermediate_size": 3072,
   "label2id": {
+    "IE": 0,
+    "JP": 3,
+    "SN": 1,
+    "TF": 2
   },
   "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,
   "num_hidden_layers": 12,
   "pad_token_id": 0,
   "position_embedding_type": "absolute",
+  "problem_type": "multi_label_classification",
   "summary_activation": "gelu",
   "summary_last_dropout": 0.1,
   "summary_type": "first",
   "summary_use_proj": true,
+  "task_type": "multilabel_4axis",
   "torch_dtype": "float32",
   "transformers_version": "4.55.2",
   "type_vocab_size": 2,

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0db04dc9c8d456584eac7f334388de3e6b2982f5807dadbfd487c5b13912bb45
-size 451758736

 version https://git-lfs.github.com/spec/v1
+oid sha256:7eac4d6bde09291ae691e27527969fba10a06eb4b13409899a89a41711444e5a
+size 451721824

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6de89322b112bf904d1abd35dc5efa4d54d4aea70192130afedd0da28083425e
 size 5713

 version https://git-lfs.github.com/spec/v1
+oid sha256:5bf668bbab69941c0ced64b8a84b99b1af55159f6b0ee1a0bac514355441169b
 size 5713