End of training

Files changed (6) hide show

README.md CHANGED Viewed

@@ -27,14 +27,15 @@ print(output["score"])
 ## Training procedure
 This model was trained with Reward.
 ### Framework versions
-- TRL: 0.28.0
 - Transformers: 4.57.1
 - Pytorch: 2.8.0+cu126
 - Datasets: 4.4.2

 ## Training procedure
 This model was trained with Reward.
 ### Framework versions
+- TRL: 0.29.0
 - Transformers: 4.57.1
 - Pytorch: 2.8.0+cu126
 - Datasets: 4.4.2

chat_template.jinja ADDED Viewed

+{#- Chat template: renders each user/assistant message as an im_start ... im_end turn. -#}
+{#- Messages with any other role fall through the if/elif below and produce no output. -#}
+{%- for message in messages -%}
+    {#- Non-string content is replaced by an empty string. -#}
+    {%- set content = message.content if message.content is string else "" -%}
+    {%- if message.role == "user" -%}
+        {{ "<|im_start|>" + message.role + "
+"  + content + "<|im_end|>
+" }}
+    {%- elif message.role == "assistant" -%}
+        {#- Assistant turn: leading newlines are stripped from the content, and the turn is wrapped in the generation / endgeneration tags. -#}
+        {#- NOTE(review): the generation / endgeneration tags have no whitespace-control dashes, so nearby indentation or newlines may be emitted depending on the environment's trim_blocks / lstrip_blocks settings; confirm against the rendered output. -#}
+        {% generation %}
+        {{ "<|im_start|>assistant
+" + content.lstrip("
+") + "<|im_end|>
+" }}
+        {% endgeneration %}
+    {%- endif -%}
+{%- endfor -%}
+{# ───── generation prompt ───── #}
+{%- if add_generation_prompt -%}
+    {#- Opens an assistant turn and appends an empty think block (opening tag, newline, closing tag, newline). -#}
+    {{ "<|im_start|>assistant
+" + "<think>
+</think>
+"  }}
+{%- endif -%}

config.json CHANGED Viewed

@@ -13,8 +13,14 @@
   "head_dim": 256,
   "hidden_activation": "gelu_pytorch_tanh",
   "hidden_size": 640,
   "initializer_range": 0.02,
   "intermediate_size": 2048,
   "layer_types": [
     "sliding_attention",
     "sliding_attention",
@@ -50,5 +56,5 @@
   "transformers_version": "4.57.1",
   "use_bidirectional_attention": false,
   "use_cache": true,
-  "vocab_size": 262144
 }

   "head_dim": 256,
   "hidden_activation": "gelu_pytorch_tanh",
   "hidden_size": 640,
+  "id2label": {
+    "0": "LABEL_0"
+  },
   "initializer_range": 0.02,
   "intermediate_size": 2048,
+  "label2id": {
+    "LABEL_0": 0
+  },
   "layer_types": [
     "sliding_attention",
     "sliding_attention",
   "transformers_version": "4.57.1",
   "use_bidirectional_attention": false,
   "use_cache": true,
+  "vocab_size": 262147
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:871111223cf6a7a79cb58bb88ff6cb1b759e35c3f528cb457a05e612d34abe4e
-size 1072424464

 version https://git-lfs.github.com/spec/v1
+oid sha256:64388433a90441a8ad7fac8ddb0580075d9e01b1870e8a3ef61ae97c5ae27116
+size 1072429584

runs/Mar01_20-10-48_df9c3a37a31c/events.out.tfevents.1772395950.df9c3a37a31c.88.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:4ec92990c1870e3fef93372dd68510e12033d2ecf36bea52fe9f8cc14e1348ca
+size 43238

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9659243eb1bb3a1fbfe97b53f4731b09985897293928cf01902a7924e29be502
-size 6097

 version https://git-lfs.github.com/spec/v1
+oid sha256:ca59eb1c06f1689cc0023b60fa26ad801750128409443858acc2f28d661fd513
+size 6033