dymax
/

SmolLM2-FT-MyDataset

Text Generation

Generated from Trainer

text-generation-inference

Model card Files and versions

Training metrics Community

dymax committed on Jun 19, 2025

Commit

e43e924

·

verified ·

1 Parent(s): f191cd2

End of training

Files changed (4) hide show

README.md +3 -2
model.safetensors +1 -1
special_tokens_map.json +17 -23
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -1,4 +1,5 @@
 ---
 library_name: transformers
 model_name: SmolLM2-FT-MyDataset
 tags:
@@ -12,7 +13,7 @@ licence: license
 # Model Card for SmolLM2-FT-MyDataset
-This model is a fine-tuned version of [None](https://huggingface.co/None).
 It has been trained using [TRL](https://github.com/huggingface/trl).
 ## Quick start
@@ -35,7 +36,7 @@ This model was trained with SFT.
 ### Framework versions
-- TRL: 0.18.1
 - Transformers: 4.52.4
 - Pytorch: 2.6.0+cu124
 - Datasets: 3.6.0

 ---
+base_model: HuggingFaceTB/SmolLM2-135M
 library_name: transformers
 model_name: SmolLM2-FT-MyDataset
 tags:
 # Model Card for SmolLM2-FT-MyDataset
+This model is a fine-tuned version of [HuggingFaceTB/SmolLM2-135M](https://huggingface.co/HuggingFaceTB/SmolLM2-135M).
 It has been trained using [TRL](https://github.com/huggingface/trl).
 ## Quick start
 ### Framework versions
+- TRL: 0.18.2
 - Transformers: 4.52.4
 - Pytorch: 2.6.0+cu124
 - Datasets: 3.6.0

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:75db70dec3f6eb373e3bd753964814b3bef3c41f78be78f2bca9fc4cc0d1b355
 size 538090408

 version https://git-lfs.github.com/spec/v1
+oid sha256:6757dd214fd3fa772b70ee726e777a14e0be23a4e7e1d8708df778e1e9507152
 size 538090408

special_tokens_map.json CHANGED Viewed

@@ -1,29 +1,23 @@
 {
   "additional_special_tokens": [
-    "<|im_start|>",
-    "<|im_end|>"
   ],
-  "bos_token": {
-    "content": "<|im_start|>",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "eos_token": {
-    "content": "<|im_end|>",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "pad_token": {
-    "content": "<|im_end|>",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
   "unk_token": {
     "content": "<|endoftext|>",
     "lstrip": false,

 {
   "additional_special_tokens": [
+    {
+      "content": "<|im_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "<|im_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false
+    }
   ],
+  "bos_token": "<|im_start|>",
+  "eos_token": "<|im_end|>",
+  "pad_token": "<|im_end|>",
   "unk_token": {
     "content": "<|endoftext|>",
     "lstrip": false,

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:813d9222d8cbf3e31fdc84714babe109ea8516bbc2bcfe1d6a359eb13dcbbcd3
 size 5560

 version https://git-lfs.github.com/spec/v1
+oid sha256:016edfbd8658b7a28714e7e9581744ae1e2ade895e07f59d820c3e8257af3ed6
 size 5560