End of training

Browse files

Files changed (9) hide show

README.md +13 -12
all_results.json +7 -7
config.json +1 -1
generation_config.json +1 -1
model.safetensors +1 -1
test_results.json +7 -7
tokenizer.json +2 -2
tokenizer_config.json +0 -1
training_args.bin +2 -2

README.md CHANGED Viewed

@@ -3,6 +3,8 @@ library_name: transformers
 license: cc-by-nc-4.0
 base_model: facebook/nllb-200-distilled-600M
 tags:
 - generated_from_trainer
 metrics:
 - bleu
@@ -14,13 +16,14 @@ model-index:
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 should probably proofread and complete it, then remove this comment. -->
 # nllb-dry-run
 This model is a fine-tuned version of [facebook/nllb-200-distilled-600M](https://huggingface.co/facebook/nllb-200-distilled-600M) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Loss: 3.6589
-- Bleu: 2.6974
-- Chrf: 19.3271
 ## Model description
@@ -51,18 +54,16 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch  | Step | Validation Loss | Bleu   | Chrf    |
 |:-------------:|:------:|:----:|:---------------:|:------:|:-------:|
-| No log        | 0.3125 | 10   | 3.4706          | 2.5602 | 16.3473 |
-| No log        | 0.625  | 20   | 3.3367          | 3.8875 | 19.2715 |
-| No log        | 0.9375 | 30   | 3.3101          | 5.7749 | 18.7760 |
-| No log        | 1.25   | 40   | 3.2497          | 4.1533 | 21.2912 |
-| No log        | 1.5625 | 50   | 3.5124          | 4.0060 | 19.0293 |
-| No log        | 1.875  | 60   | 3.3710          | 3.9858 | 21.0020 |
-| No log        | 2.1875 | 70   | 3.6589          | 2.6974 | 19.3271 |
 ### Framework versions
-- Transformers 5.7.0
 - Pytorch 2.8.0+cu128
-- Datasets 4.8.5
 - Tokenizers 0.22.2

 license: cc-by-nc-4.0
 base_model: facebook/nllb-200-distilled-600M
 tags:
+- trackio
+- trackio:https://huggingface.co/spaces/madoss/trackio
 - generated_from_trainer
 metrics:
 - bleu
 <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 should probably proofread and complete it, then remove this comment. -->
+<a href="https://huggingface.co/spaces/madoss/trackio" target="_blank"><img src="https://raw.githubusercontent.com/gradio-app/trackio/refs/heads/main/trackio/assets/badge.png" alt="Visualize in Trackio" title="Visualize in Trackio" style="height: 40px;"/></a>
 # nllb-dry-run
 This model is a fine-tuned version of [facebook/nllb-200-distilled-600M](https://huggingface.co/facebook/nllb-200-distilled-600M) on an unknown dataset.
 It achieves the following results on the evaluation set:
+- Loss: 3.5119
+- Bleu: 3.4640
+- Chrf: 18.8077
 ## Model description
 | Training Loss | Epoch  | Step | Validation Loss | Bleu   | Chrf    |
 |:-------------:|:------:|:----:|:---------------:|:------:|:-------:|
+| No log        | 0.3125 | 10   | 3.4697          | 2.3857 | 15.3837 |
+| No log        | 0.625  | 20   | 3.3382          | 3.7821 | 19.2101 |
+| No log        | 0.9375 | 30   | 3.3116          | 5.8430 | 18.9142 |
+| No log        | 1.25   | 40   | 3.2531          | 3.6516 | 19.1025 |
+| No log        | 1.5625 | 50   | 3.5119          | 3.4640 | 18.8077 |
 ### Framework versions
+- Transformers 5.5.4
 - Pytorch 2.8.0+cu128
+- Datasets 4.8.4
 - Tokenizers 0.22.2

all_results.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
-    "epoch": 2.1875,
-    "test_bleu": 0.7201604351112776,
-    "test_chrf": 16.004319571347093,
-    "test_loss": 4.11027193069458,
-    "test_runtime": 4.0659,
-    "test_samples_per_second": 2.459,
-    "test_steps_per_second": 0.738
 }

 {
+    "epoch": 1.5625,
+    "test_bleu": 2.3686059277426317,
+    "test_chrf": 19.996465593863476,
+    "test_loss": 4.228389739990234,
+    "test_runtime": 6.6284,
+    "test_samples_per_second": 1.509,
+    "test_steps_per_second": 0.453
 }

config.json CHANGED Viewed

@@ -27,7 +27,7 @@
   "scale_embedding": true,
   "tie_word_embeddings": true,
   "tokenizer_class": "NllbTokenizer",
-  "transformers_version": "5.7.0",
   "use_cache": false,
   "vocab_size": 256206
 }

   "scale_embedding": true,
   "tie_word_embeddings": true,
   "tokenizer_class": "NllbTokenizer",
+  "transformers_version": "5.5.4",
   "use_cache": false,
   "vocab_size": 256206
 }

generation_config.json CHANGED Viewed

@@ -32,7 +32,7 @@
   "temperature": 1.0,
   "top_k": 50,
   "top_p": 1.0,
-  "transformers_version": "5.7.0",
   "typical_p": 1.0,
   "use_cache": true
 }

   "temperature": 1.0,
   "top_k": 50,
   "top_p": 1.0,
+  "transformers_version": "5.5.4",
   "typical_p": 1.0,
   "use_cache": true
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:410c7bac8e64c1ebcae22aa1d6e7cc6845f43ae9104a6c277e963251217236f9
 size 2460354912

 version https://git-lfs.github.com/spec/v1
+oid sha256:6f7f5620207bfc05b93aefecc44aa76e1fafb516a279ce755d0acd91bbe0ca91
 size 2460354912

test_results.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
-    "epoch": 2.1875,
-    "test_bleu": 0.7201604351112776,
-    "test_chrf": 16.004319571347093,
-    "test_loss": 4.11027193069458,
-    "test_runtime": 4.0659,
-    "test_samples_per_second": 2.459,
-    "test_steps_per_second": 0.738
 }

 {
+    "epoch": 1.5625,
+    "test_bleu": 2.3686059277426317,
+    "test_chrf": 19.996465593863476,
+    "test_loss": 4.228389739990234,
+    "test_runtime": 6.6284,
+    "test_samples_per_second": 1.509,
+    "test_steps_per_second": 0.453
 }

tokenizer.json CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f39ebb5b95428adcefc2fac66b01cb90204197fcb1871fbce2f03f74ea671164
-size 32240136

 version https://git-lfs.github.com/spec/v1
+oid sha256:a033dad7cd9f5a295fff4a20fe14f7b2c6dc7152c670c79d07e502891d460fe7
+size 32240233

tokenizer_config.json CHANGED Viewed

@@ -209,7 +209,6 @@
   ],
   "is_local": false,
   "legacy_behaviour": false,
-  "local_files_only": false,
   "mask_token": "<mask>",
   "model_max_length": 1024,
   "pad_token": "<pad>",

   ],
   "is_local": false,
   "legacy_behaviour": false,
   "mask_token": "<mask>",
   "model_max_length": 1024,
   "pad_token": "<pad>",

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8e263635a31ac91ac2fbd2a517c781c92f0e88fa0cea7d2c688b6a2e2a310c5c
-size 5457

 version https://git-lfs.github.com/spec/v1
+oid sha256:270f2e120330b110cc57777d90e42017aa5dcd4d8ae3ac8792a08da0702b4137
+size 5393