AngelRaychev
/

0.5B-policy-iteration_7

Text Generation

Generated from Trainer

text-generation-inference

Model card Files Files and versions

AngelRaychev committed on May 14, 2025

Commit

2266c7e

·

verified ·

1 Parent(s): d00ad67

End of training

Files changed (3) hide show

config.json +1 -1
pytorch_model.bin +1 -1
training_args.bin +1 -1

config.json CHANGED Viewed

@@ -11,7 +11,7 @@
   "intermediate_size": 4864,
   "max_position_embeddings": 32768,
   "max_window_layers": 24,
-  "model_card": "\nFinal Loss: 0.1673\nBatch Size: 256\nLearning Rate: 5e-06\nDataset Size: 12591\n",
   "model_type": "qwen2",
   "num_attention_heads": 14,
   "num_hidden_layers": 24,

   "intermediate_size": 4864,
   "max_position_embeddings": 32768,
   "max_window_layers": 24,
+  "model_card": "\nFinal Loss: 0.1683\nBatch Size: 512\nLearning Rate: 5e-06\nDataset Size: 12591\n",
   "model_type": "qwen2",
   "num_attention_heads": 14,
   "num_hidden_layers": 24,

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d3df4b903008bb467bcf7c9fb24cdc8101f1b73e469cafee3fd95af2d7559efc
 size 988163026

 version https://git-lfs.github.com/spec/v1
+oid sha256:7aeaf1b527ead357df85a12973c6d4a6a15acf31cdeca477b3471820323852f6
 size 988163026

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d2cee0c878a3284dba884d3cacae6a86ae7b4c078fac42091f7e16d39de570d4
 size 5624

 version https://git-lfs.github.com/spec/v1
+oid sha256:6a29d96aa638a5c5562064d795ce2f91fe93f5a8b7f696ad71e36378cecae230
 size 5624