Upload fine-tuned KcELECTRA emotion model (6 classes)

Files changed (6) hide show

config.json ADDED Viewed

+{
+  "add_cross_attention": false,
+  "architectures": [
+    "ElectraForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "bos_token_id": null,
+  "classifier_dropout": null,
+  "dtype": "float32",
+  "embedding_size": 768,
+  "eos_token_id": null,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "LABEL_0",
+    "1": "LABEL_1",
+    "2": "LABEL_2",
+    "3": "LABEL_3",
+    "4": "LABEL_4",
+    "5": "LABEL_5"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "is_decoder": false,
+  "label2id": {
+    "LABEL_0": 0,
+    "LABEL_1": 1,
+    "LABEL_2": 2,
+    "LABEL_3": 3,
+    "LABEL_4": 4,
+    "LABEL_5": 5
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "electra",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "summary_activation": "gelu",
+  "summary_last_dropout": 0.1,
+  "summary_type": "first",
+  "summary_use_proj": true,
+  "tie_word_embeddings": true,
+  "tokenizer_class": "BertTokenizer",
+  "transformers_version": "5.3.0",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 54343
+}

metrics.json ADDED Viewed

+{
+  "train_loss": [
+    1.3997176137407767,
+    1.060374002843689,
+    0.9424460485780697,
+    0.8126668618181824,
+    0.6781947357485433,
+    0.550816770938434,
+    0.44699311838975775,
+    0.3649046599144829,
+    0.3023313081891379,
+    0.2600003223730046
+  ],
+  "val_loss": [
+    0.8864293653661242,
+    0.7893356407920902,
+    0.7794545379180747,
+    0.7466167671462665,
+    0.7812407450356449,
+    0.8254531650051761,
+    0.888769704875393,
+    0.9474576842129374,
+    0.9978417330421507,
+    1.0494976064163404
+  ],
+  "val_acc": [
+    0.6776622985389366,
+    0.707486067178792,
+    0.7135110709444193,
+    0.7315860822413014,
+    0.7299292062057539,
+    0.7330923331827083,
+    0.7368579605362253,
+    0.7404729627956017,
+    0.7388160867600543,
+    0.7395692122307577
+  ]
+}

model.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:ba11952764f0efacca1bfd00eaabd65e43d927a1d9448e6ff1285753a02115c2
+size 511149648

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

+{
+  "backend": "tokenizers",
+  "cls_token": "[CLS]",
+  "do_basic_tokenize": true,
+  "do_lower_case": false,
+  "is_local": false,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "never_split": null,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

training_curve.png ADDED Viewed