Dat1710 committed
Commit 237b4b2 · verified · 1 Parent(s): 96944c7

Upload folder using huggingface_hub

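The commit message indicates the checkpoint folder was pushed with `huggingface_hub`'s `upload_folder` API. A minimal sketch of such a call, assuming a local checkpoint directory; the target repo id is not shown in this commit, so the one below is a placeholder:

```python
from huggingface_hub import HfApi

api = HfApi()  # picks up the token from `huggingface-cli login`

# Uploads every file in the folder as a single commit; large binaries
# (best_model.pth, model.safetensors) are stored via Git LFS automatically.
api.upload_folder(
    folder_path="./checkpoint",                # local folder (assumption)
    repo_id="Dat1710/extractive-summarizer",   # hypothetical repo id
    repo_type="model",
    commit_message="Upload folder using huggingface_hub",
)
```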
added_tokens.json ADDED
@@ -0,0 +1,3 @@
+ {
+   "<mask>": 64000
+ }
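`added_tokens.json` registers `<mask>` at id 64000, one past the 64,000 BPE ids (0-63999) of the PhoBERT base vocabulary. A quick sanity check once the tokenizer is loaded, using the same hypothetical repo id as above:

```python
from transformers import AutoTokenizer

tok = AutoTokenizer.from_pretrained("Dat1710/extractive-summarizer")  # hypothetical
assert tok.convert_tokens_to_ids("<mask>") == 64000
```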
best_model.pth ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:9d0ec680e3d53c5873c628000ab6960d16c1e2f53056772175f1cafa10ae1f8c
+ size 540083162
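`best_model.pth` is tracked with Git LFS, so the diff records only the three-line pointer (spec version, SHA-256 oid, and byte size, here ≈540 MB). `hf_hub_download` resolves the pointer to the real object; again the repo id is a placeholder:

```python
import torch
from huggingface_hub import hf_hub_download

# Fetches the actual 540 MB object, not the LFS pointer text.
path = hf_hub_download(
    repo_id="Dat1710/extractive-summarizer",  # hypothetical
    filename="best_model.pth",
)
state = torch.load(path, map_location="cpu")
```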
bpe.codes ADDED
The diff for this file is too large to render. See raw diff
 
config.json ADDED
@@ -0,0 +1,7 @@
+ {
+   "model_type": "ExtractiveSummarizationModel",
+   "base_model": "VoVanPhuc/sup-SimCSE-VietNamese-phobert-base",
+   "max_length": 256,
+   "max_sentences": 6,
+   "num_labels": 2
+ }
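`ExtractiveSummarizationModel` is a custom `model_type`, so `AutoModel.from_pretrained` will not resolve this config on its own. The fields suggest a sentence-level keep/drop classifier (`num_labels: 2`) over up to 6 sentences of at most 256 tokens each, built on the Vietnamese SimCSE PhoBERT encoder. A plausible reconstruction under those assumptions; the actual class definition is not part of this commit:

```python
import torch.nn as nn
from transformers import AutoModel

class ExtractiveSummarizationModel(nn.Module):
    """Sketch: score each sentence keep/drop with the PhoBERT-SimCSE encoder."""

    def __init__(self,
                 base_model="VoVanPhuc/sup-SimCSE-VietNamese-phobert-base",
                 num_labels=2):
        super().__init__()
        self.encoder = AutoModel.from_pretrained(base_model)
        self.classifier = nn.Linear(self.encoder.config.hidden_size, num_labels)

    def forward(self, input_ids, attention_mask):
        # input_ids: (batch * max_sentences, max_length), one row per sentence
        out = self.encoder(input_ids=input_ids, attention_mask=attention_mask)
        cls = out.last_hidden_state[:, 0]   # <s> embedding of each sentence
        return self.classifier(cls)         # keep/drop logits per sentence
```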
model.safetensors ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:ac6d41c0d0599e160719cec4b3c6a0a3910f75687fec659e53c19e001aa3f843
+ size 540023352
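`model.safetensors` is a second LFS-tracked weight file, presumably the same parameters serialized in the safetensors format (540,023,352 bytes vs. 540,083,162 for the pickle-based `.pth`). It can be read without invoking `torch.load`'s pickle machinery:

```python
from safetensors.torch import load_file

state_dict = load_file("model.safetensors")  # local path after download
print({k: tuple(v.shape) for k, v in list(state_dict.items())[:5]})
```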
special_tokens_map.json ADDED
@@ -0,0 +1,9 @@
+ {
+   "bos_token": "<s>",
+   "cls_token": "<s>",
+   "eos_token": "</s>",
+   "mask_token": "<mask>",
+   "pad_token": "<pad>",
+   "sep_token": "</s>",
+   "unk_token": "<unk>"
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,55 @@
+ {
+   "added_tokens_decoder": {
+     "0": {
+       "content": "<s>",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "1": {
+       "content": "<pad>",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "2": {
+       "content": "</s>",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "3": {
+       "content": "<unk>",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     },
+     "64000": {
+       "content": "<mask>",
+       "lstrip": false,
+       "normalized": false,
+       "rstrip": false,
+       "single_word": false,
+       "special": true
+     }
+   },
+   "bos_token": "<s>",
+   "clean_up_tokenization_spaces": false,
+   "cls_token": "<s>",
+   "eos_token": "</s>",
+   "extra_special_tokens": {},
+   "mask_token": "<mask>",
+   "model_max_length": 256,
+   "pad_token": "<pad>",
+   "sep_token": "</s>",
+   "tokenizer_class": "PhobertTokenizer",
+   "unk_token": "<unk>"
+ }
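Together with `vocab.txt`, `bpe.codes`, `special_tokens_map.json`, and `added_tokens.json`, this config makes the repo loadable through `AutoTokenizer`, which dispatches to `PhobertTokenizer` and truncates at `model_max_length` 256 (matching `max_length` in `config.json`). PhoBERT tokenizers expect word-segmented Vietnamese (syllables of a compound joined by underscores), so raw text should pass through a segmenter such as VnCoreNLP first. A usage sketch with the hypothetical repo id:

```python
from transformers import AutoTokenizer

tok = AutoTokenizer.from_pretrained("Dat1710/extractive-summarizer")  # hypothetical
# Input is assumed pre-segmented, e.g. "thủ_đô" as one word.
enc = tok("Hà_Nội là thủ_đô của Việt_Nam .",
          max_length=256, truncation=True, return_tensors="pt")
print(enc["input_ids"].shape)
```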
training_history.json ADDED
@@ -0,0 +1,30 @@
+ {
+   "train_losses": [
+     0.5307241083458066,
+     0.42265801821276544,
+     0.28383589831739664,
+     0.18120389145310037,
+     0.12248440267366822
+   ],
+   "val_losses": [
+     0.4832361350059509,
+     0.48715638515353205,
+     0.4948434266000986,
+     0.6831720430944115,
+     0.813050055058673
+   ],
+   "val_accuracies": [
+     0.7677911844373307,
+     0.7823196257079537,
+     0.8091603053435115,
+     0.8079290815070179,
+     0.8059591233686284
+   ],
+   "val_f1_scores": [
+     0.8186189651856126,
+     0.8418038654259127,
+     0.8512190439623728,
+     0.8513719512195121,
+     0.8478176902278872
+   ]
+ }
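Five epochs are recorded. Training loss falls monotonically (0.531 to 0.122) while validation loss bottoms out at epoch 1 and climbs afterwards, a classic overfitting pattern; validation F1 peaks at epoch 4 (0.8514) and accuracy at epoch 3 (0.8092), so `best_model.pth` was presumably checkpointed from one of the middle epochs. A short sketch to plot the curves:

```python
import json
import matplotlib.pyplot as plt

with open("training_history.json") as f:
    hist = json.load(f)
epochs = range(1, len(hist["train_losses"]) + 1)

fig, (ax1, ax2) = plt.subplots(1, 2, figsize=(10, 4))
ax1.plot(epochs, hist["train_losses"], label="train loss")
ax1.plot(epochs, hist["val_losses"], label="val loss")
ax1.set_xlabel("epoch"); ax1.legend()
ax2.plot(epochs, hist["val_accuracies"], label="val accuracy")
ax2.plot(epochs, hist["val_f1_scores"], label="val F1")
ax2.set_xlabel("epoch"); ax2.legend()
plt.tight_layout()
plt.show()
```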
vocab.txt ADDED
The diff for this file is too large to render. See raw diff