bezzam
/

Qwen3-ASR-1.7B

Text Generation

Model card | Files and versions

bezzam (HF Staff) committed 25 days ago

Commit

62e9718

·

verified ·

1 Parent(s): 928ba58

Upload Qwen3ASRForConditionalGeneration

Files changed (2) hide show

config.json +35 -10
model.safetensors +2 -2

config.json CHANGED Viewed

@@ -41,27 +41,52 @@
     "hidden_size": 2048,
     "initializer_range": 0.02,
     "intermediate_size": 6144,
     "max_position_embeddings": 65536,
-    "model_type": "qwen3_asr_text",
     "num_attention_heads": 16,
     "num_hidden_layers": 28,
     "num_key_value_heads": 8,
     "pad_token_id": null,
     "rms_norm_eps": 1e-06,
     "rope_parameters": {
-      "interleaved": true,
-      "mrope_interleaved": true,
-      "mrope_section": [
-        24,
-        20,
-        20
-      ],
       "rope_theta": 1000000,
-      "rope_type": "default",
-      "type": "default"
     },
     "tie_word_embeddings": true,
     "use_cache": true,
     "vocab_size": 151936
   },
   "transformers_version": "5.5.0.dev0"

     "hidden_size": 2048,
     "initializer_range": 0.02,
     "intermediate_size": 6144,
+    "layer_types": [
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention",
+      "full_attention"
+    ],
     "max_position_embeddings": 65536,
+    "max_window_layers": 28,
+    "model_type": "qwen3",
     "num_attention_heads": 16,
     "num_hidden_layers": 28,
     "num_key_value_heads": 8,
     "pad_token_id": null,
     "rms_norm_eps": 1e-06,
     "rope_parameters": {
       "rope_theta": 1000000,
+      "rope_type": "default"
     },
+    "sliding_window": null,
     "tie_word_embeddings": true,
     "use_cache": true,
+    "use_sliding_window": false,
     "vocab_size": 151936
   },
   "transformers_version": "5.5.0.dev0"

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b499ebc2de7e9d023636f77be0dc35b4e655bd22fa27d7401fd94a43cbd38f46
-size 4698515936

 version https://git-lfs.github.com/spec/v1
+oid sha256:361730b2a606a75eb9d495c5dc531b11337c0b59a68c7775d19e5094f90713e0
+size 4076190632