aarabil
/

Qwen3-Embedding-0.6B

Feature Extraction

text-generation-inference

Model card Files Files and versions

aarabil committed on Sep 7, 2025

Commit

3a8569b

·

verified ·

1 Parent(s): dc1dc8e

Upload model

Files changed (2) hide show

config.json +33 -3
model.safetensors +2 -2

config.json CHANGED Viewed

@@ -1,16 +1,47 @@
 {
   "architectures": [
-    "Qwen3ForCausalLM"
   ],
   "attention_bias": false,
   "attention_dropout": 0.0,
   "bos_token_id": 151643,
   "eos_token_id": 151643,
   "head_dim": 128,
   "hidden_act": "silu",
   "hidden_size": 1024,
   "initializer_range": 0.02,
   "intermediate_size": 3072,
   "max_position_embeddings": 32768,
   "max_window_layers": 28,
   "model_type": "qwen3",
@@ -22,8 +53,7 @@
   "rope_theta": 1000000,
   "sliding_window": null,
   "tie_word_embeddings": true,
-  "torch_dtype": "float32",
-  "transformers_version": "4.52.4",
   "use_cache": true,
   "use_sliding_window": false,
   "vocab_size": 151669

 {
   "architectures": [
+    "Qwen3Model"
   ],
   "attention_bias": false,
   "attention_dropout": 0.0,
   "bos_token_id": 151643,
+  "dtype": "float32",
   "eos_token_id": 151643,
   "head_dim": 128,
   "hidden_act": "silu",
   "hidden_size": 1024,
   "initializer_range": 0.02,
   "intermediate_size": 3072,
+  "layer_types": [
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention",
+    "full_attention"
+  ],
   "max_position_embeddings": 32768,
   "max_window_layers": 28,
   "model_type": "qwen3",
   "rope_theta": 1000000,
   "sliding_window": null,
   "tie_word_embeddings": true,
+  "transformers_version": "4.56.0",
   "use_cache": true,
   "use_sliding_window": false,
   "vocab_size": 151669

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b37cc0fe306b402a94e75ebe116c60e9feef0ec2405d28fb2d29b2f805abb64e
-size 2383141336

 version https://git-lfs.github.com/spec/v1
+oid sha256:fea1a806ad4460c25fe92c57617d33d3e92499ebd024cb102bb7052cb91dd509
+size 2383139480