End of training

Browse files

Files changed (7) hide show

README.md +91 -0
dict.txt +0 -0
model.safetensors +1 -1
sentencepiece.bpe.model +3 -0
special_tokens_map.json +51 -0
tokenizer_config.json +56 -0
training_args.bin +1 -1

README.md ADDED Viewed

	@@ -0,0 +1,91 @@

+---
+library_name: transformers
+license: mit
+base_model: FiveC/BartTay
+tags:
+- generated_from_trainer
+metrics:
+- sacrebleu
+model-index:
+- name: BartTayFinal-test
+  results: []
+---
+<!-- This model card has been generated automatically according to the information the Trainer had access to. You
+should probably proofread and complete it, then remove this comment. -->
+# BartTayFinal-test
+This model is a fine-tuned version of [FiveC/BartTay](https://huggingface.co/FiveC/BartTay) on an unknown dataset.
+It achieves the following results on the evaluation set:
+- Loss: 0.1284
+- Sacrebleu: 17.1154
+## Model description
+More information needed
+## Intended uses & limitations
+More information needed
+## Training and evaluation data
+More information needed
+## Training procedure
+### Training hyperparameters
+The following hyperparameters were used during training:
+- learning_rate: 2e-05
+- train_batch_size: 16
+- eval_batch_size: 16
+- seed: 42
+- optimizer: AdamW (fused PyTorch implementation, `OptimizerNames.ADAMW_TORCH_FUSED`) with betas=(0.9, 0.999) and epsilon=1e-08; no additional optimizer arguments
+- lr_scheduler_type: linear
+- num_epochs: 3
+- mixed_precision_training: Native AMP
+### Training results
+| Training Loss | Epoch  | Step | Validation Loss | Sacrebleu |
+|:-------------:|:------:|:----:|:---------------:|:---------:|
+| 0.2531        | 0.0996 | 128  | 0.2094          | 0.1428    |
+| 0.2268        | 0.1992 | 256  | 0.1940          | 1.0998    |
+| 0.2106        | 0.2988 | 384  | 0.1869          | 2.8366    |
+| 0.1997        | 0.3984 | 512  | 0.1815          | 3.3156    |
+| 0.2056        | 0.4981 | 640  | 0.1811          | 2.6645    |
+| 0.1913        | 0.5977 | 768  | 0.1758          | 4.2371    |
+| 0.1852        | 0.6973 | 896  | 0.1677          | 6.2441    |
+| 0.1870        | 0.7969 | 1024 | 0.1631          | 6.8860    |
+| 0.1730        | 0.8965 | 1152 | 0.1581          | 7.9818    |
+| 0.1710        | 0.9961 | 1280 | 0.1569          | 8.3053    |
+| 0.1547        | 1.0957 | 1408 | 0.1559          | 9.2269    |
+| 0.1546        | 1.1953 | 1536 | 0.1496          | 10.2844   |
+| 0.1475        | 1.2949 | 1664 | 0.1478          | 11.3408   |
+| 0.1542        | 1.3946 | 1792 | 0.1454          | 11.5532   |
+| 0.1532        | 1.4942 | 1920 | 0.1431          | 12.3223   |
+| 0.1453        | 1.5938 | 2048 | 0.1410          | 12.8742   |
+| 0.1465        | 1.6934 | 2176 | 0.1381          | 13.6623   |
+| 0.1486        | 1.7930 | 2304 | 0.1379          | 14.0894   |
+| 0.1432        | 1.8926 | 2432 | 0.1353          | 15.0525   |
+| 0.1399        | 1.9922 | 2560 | 0.1334          | 14.8205   |
+| 0.1325        | 2.0918 | 2688 | 0.1340          | 15.4056   |
+| 0.1280        | 2.1914 | 2816 | 0.1325          | 16.1499   |
+| 0.1238        | 2.2911 | 2944 | 0.1320          | 15.7701   |
+| 0.1307        | 2.3907 | 3072 | 0.1302          | 16.3446   |
+| 0.1260        | 2.4903 | 3200 | 0.1307          | 16.6955   |
+| 0.1264        | 2.5899 | 3328 | 0.1296          | 16.8372   |
+| 0.1200        | 2.6895 | 3456 | 0.1296          | 16.9080   |
+| 0.1271        | 2.7891 | 3584 | 0.1291          | 16.7139   |
+| 0.1196        | 2.8887 | 3712 | 0.1286          | 17.0726   |
+| 0.1244        | 2.9883 | 3840 | 0.1284          | 17.1154   |
+### Framework versions
+- Transformers 4.57.1
+- Pytorch 2.8.0+cu126
+- Datasets 4.0.0
+- Tokenizers 0.22.1

dict.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8b0fe15462287b03ae86f81cbd4716f3364b0f77656c45f40c89e6a81737b297
 size 1583480280

 version https://git-lfs.github.com/spec/v1
+oid sha256:fd35ce75ebc0ea976ab42326abe895822a80726f78cfc763e2bdc0ed1ba0e827
 size 1583480280

sentencepiece.bpe.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cfc8146abe2a0488e9e2a0c56de7952f7c11ab059eca145a0a727afce0db2865
+size 5069051

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,51 @@

+{
+  "bos_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "cls_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "mask_token": {
+    "content": "<mask>",
+    "lstrip": true,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": {
+    "content": "<pad>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "sep_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,56 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<pad>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "40029": {
+      "content": "<mask>",
+      "lstrip": true,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": false,
+  "cls_token": "<s>",
+  "eos_token": "</s>",
+  "extra_special_tokens": {},
+  "mask_token": "<mask>",
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "<pad>",
+  "sep_token": "</s>",
+  "sp_model_kwargs": {},
+  "tokenizer_class": "BartphoTokenizer",
+  "unk_token": "<unk>"
+}

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:66ca2557e3b6eda36de18f7f19c557f83999d16ce2143a0f43881beb5bc43887
 size 5969

 version https://git-lfs.github.com/spec/v1
+oid sha256:7680a1d34a65b8a6efa920d2bcc5a95253e4d6b194d5e275a3f1a4be0ef0b969
 size 5969