Upload Qwen3ForCausalLM
- config.json +1 -41
- model.safetensors +1 -1
config.json
CHANGED
@@ -13,40 +13,6 @@
   "initializer_range": 0.02,
   "intermediate_size": 32,
   "layer_types": [
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
-    "full_attention",
     "full_attention",
     "full_attention"
   ],
@@ -57,13 +23,7 @@
   "num_hidden_layers": 2,
   "num_key_value_heads": 2,
   "rms_norm_eps": 1e-06,
-  "rope_scaling": {
-    "mrope_section": [
-      2
-    ],
-    "rope_type": "default",
-    "type": "default"
-  },
+  "rope_scaling": null,
   "rope_theta": 1000000,
   "sliding_window": null,
   "tie_word_embeddings": false,
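The net effect of this change is that layer_types now lists exactly one entry per layer (2 entries for num_hidden_layers = 2, both full attention) and the mrope-style rope_scaling block is replaced with null. A minimal sanity check of the edited config, assuming a local checkout of this repo; the script and the checks are illustrative, not part of the commit:

import json

# Illustrative consistency check: after this commit, layer_types should
# have exactly num_hidden_layers entries and rope_scaling should be null.
with open("config.json") as f:  # assumes config.json in the working directory
    cfg = json.load(f)

assert cfg["num_hidden_layers"] == 2
assert len(cfg["layer_types"]) == cfg["num_hidden_layers"]
assert all(t == "full_attention" for t in cfg["layer_types"])
assert cfg["rope_scaling"] is None
print("config.json is internally consistent")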
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:835d9e71035ff7e2261b3a8e4d693a86921caa3b07210aee6501bd22d6bc82dc
 size 4917896
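model.safetensors is a Git LFS pointer file, so only the recorded oid and size change in this commit. After pulling the actual weights (e.g. via git lfs pull), the blob can be checked against the pointer. A sketch, assuming the file sits in the current directory; the expected values below are taken from the updated pointer:

import hashlib
import os

# Expected values from the updated LFS pointer in this commit.
EXPECTED_SHA256 = "835d9e71035ff7e2261b3a8e4d693a86921caa3b07210aee6501bd22d6bc82dc"
EXPECTED_SIZE = 4917896

assert os.path.getsize("model.safetensors") == EXPECTED_SIZE

h = hashlib.sha256()
with open("model.safetensors", "rb") as f:
    # Hash in 1 MiB chunks to avoid loading the whole file into memory.
    for chunk in iter(lambda: f.read(1 << 20), b""):
        h.update(chunk)

assert h.hexdigest() == EXPECTED_SHA256
print("model.safetensors matches the LFS pointer")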