Update models
Browse files
- .gitattributes +13 -0
- Qwen2.5-Math-1.5B-Instruct-Q2_K.gguf +3 -0
- Qwen2.5-Math-1.5B-Instruct-Q3_K_L.gguf +3 -0
- Qwen2.5-Math-1.5B-Instruct-Q3_K_M.gguf +3 -0
- Qwen2.5-Math-1.5B-Instruct-Q3_K_S.gguf +3 -0
- Qwen2.5-Math-1.5B-Instruct-Q4_0.gguf +3 -0
- Qwen2.5-Math-1.5B-Instruct-Q4_K_M.gguf +3 -0
- Qwen2.5-Math-1.5B-Instruct-Q4_K_S.gguf +3 -0
- Qwen2.5-Math-1.5B-Instruct-Q5_0.gguf +3 -0
- Qwen2.5-Math-1.5B-Instruct-Q5_K_M.gguf +3 -0
- Qwen2.5-Math-1.5B-Instruct-Q5_K_S.gguf +3 -0
- Qwen2.5-Math-1.5B-Instruct-Q6_K.gguf +3 -0
- Qwen2.5-Math-1.5B-Instruct-Q8_0.gguf +3 -0
- Qwen2.5-Math-1.5B-Instruct-f16.gguf +3 -0
- config.json +27 -0
.gitattributes
CHANGED
|
@@ -33,3 +33,16 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
| 34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
| 35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
| 36 |
+
Qwen2.5-Math-1.5B-Instruct-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
|
| 37 |
+
Qwen2.5-Math-1.5B-Instruct-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
|
| 38 |
+
Qwen2.5-Math-1.5B-Instruct-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
| 39 |
+
Qwen2.5-Math-1.5B-Instruct-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
| 40 |
+
Qwen2.5-Math-1.5B-Instruct-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
|
| 41 |
+
Qwen2.5-Math-1.5B-Instruct-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
| 42 |
+
Qwen2.5-Math-1.5B-Instruct-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
| 43 |
+
Qwen2.5-Math-1.5B-Instruct-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
|
| 44 |
+
Qwen2.5-Math-1.5B-Instruct-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
| 45 |
+
Qwen2.5-Math-1.5B-Instruct-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
| 46 |
+
Qwen2.5-Math-1.5B-Instruct-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
|
| 47 |
+
Qwen2.5-Math-1.5B-Instruct-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
|
| 48 |
+
Qwen2.5-Math-1.5B-Instruct-f16.gguf filter=lfs diff=lfs merge=lfs -text
|
Qwen2.5-Math-1.5B-Instruct-Q2_K.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:128c79c7638ef0d706b9d1848ce9532b798b49b09fe9f0784f1fd3b83d2b2408
|
| 3 |
+
size 676304928
|
Qwen2.5-Math-1.5B-Instruct-Q3_K_L.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a952483ac97a181ba0f1ee26863ea2027f07ac3a4020d644be31ee78b088844b
|
| 3 |
+
size 880162848
|
Qwen2.5-Math-1.5B-Instruct-Q3_K_M.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f318bc30fb48d6042cd4d0a24d26abe56e5b38b03cb59bff511dcafc4575b1b9
|
| 3 |
+
size 824178720
|
Qwen2.5-Math-1.5B-Instruct-Q3_K_S.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1cc90862576ec6064d01af20a302dd9fb1ddd3b9012a33b2f7a380574a6ed064
|
| 3 |
+
size 760944672
|
Qwen2.5-Math-1.5B-Instruct-Q4_0.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d99708da6261b0444376210c1d313ac485a184bad4d203504974e41b72a5b5b0
|
| 3 |
+
size 934955040
|
Qwen2.5-Math-1.5B-Instruct-Q4_K_M.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:336d6f6973034fea14fae3164649dd8d81fb1df06dee3aa12de26cfb04715759
|
| 3 |
+
size 986048544
|
Qwen2.5-Math-1.5B-Instruct-Q4_K_S.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2779466c5852b11f63389abde0b1f130c5749614227bd930b5a15dcecd143b45
|
| 3 |
+
size 940312608
|
Qwen2.5-Math-1.5B-Instruct-Q5_0.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:74681aa30a576aec0601df54144fa9e2aa6ab8ce6ed6357e464ed910d54ca33a
|
| 3 |
+
size 1098729504
|
Qwen2.5-Math-1.5B-Instruct-Q5_K_M.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:66b73a573f2d7a091b9ccbd464fdc2a83d69003a6708b5fc5811845a839361de
|
| 3 |
+
size 1125050400
|
Qwen2.5-Math-1.5B-Instruct-Q5_K_S.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f689c71bf0c4781884add84c807b450203671fda825d3b799b23774a7cbdacc8
|
| 3 |
+
size 1098729504
|
Qwen2.5-Math-1.5B-Instruct-Q6_K.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:472d3de5fd86e80d0ad714e888c1e869bcab3d88554fd0f3e9fdf5659cf30cc8
|
| 3 |
+
size 1272739872
|
Qwen2.5-Math-1.5B-Instruct-Q8_0.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f1a95bbe6e3d3c9502f302dba2b8a40a7a79332c063a0752c78de0a017ff8fbf
|
| 3 |
+
size 1646573088
|
Qwen2.5-Math-1.5B-Instruct-f16.gguf
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aa0a19c14acb67de8a9a0e271d5cc0334c8ccec9e68103324e3a13f6c98d07c2
|
| 3 |
+
size 3093669408
|
config.json
ADDED
|
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"Qwen2ForCausalLM"
|
| 4 |
+
],
|
| 5 |
+
"attention_dropout": 0.0,
|
| 6 |
+
"bos_token_id": 151643,
|
| 7 |
+
"eos_token_id": 151645,
|
| 8 |
+
"hidden_act": "silu",
|
| 9 |
+
"hidden_size": 1536,
|
| 10 |
+
"initializer_range": 0.02,
|
| 11 |
+
"intermediate_size": 8960,
|
| 12 |
+
"max_position_embeddings": 4096,
|
| 13 |
+
"max_window_layers": 21,
|
| 14 |
+
"model_type": "qwen2",
|
| 15 |
+
"num_attention_heads": 12,
|
| 16 |
+
"num_hidden_layers": 28,
|
| 17 |
+
"num_key_value_heads": 2,
|
| 18 |
+
"rms_norm_eps": 1e-06,
|
| 19 |
+
"rope_theta": 10000.0,
|
| 20 |
+
"sliding_window": 4096,
|
| 21 |
+
"tie_word_embeddings": true,
|
| 22 |
+
"torch_dtype": "bfloat16",
|
| 23 |
+
"transformers_version": "4.43.1",
|
| 24 |
+
"use_cache": true,
|
| 25 |
+
"use_sliding_window": false,
|
| 26 |
+
"vocab_size": 151936
|
| 27 |
+
}
|