Upload folder using huggingface_hub
Browse files- README.md +13 -26
- mergekit_config.yml +0 -9
- model-00001-of-00004.safetensors +1 -1
- model-00002-of-00004.safetensors +1 -1
- model-00003-of-00004.safetensors +1 -1
- model-00004-of-00004.safetensors +1 -1
README.md
CHANGED
|
@@ -1,18 +1,16 @@
|
|
| 1 |
---
|
| 2 |
base_model:
|
| 3 |
-
-
|
| 4 |
-
- Qwen/Qwen2.5-Coder-7B
|
| 5 |
-
- prithivMLmods/QwQ-MathOct-7B
|
| 6 |
-
- Qwen/Qwen2.5-Math-7B
|
| 7 |
-
- prithivMLmods/QwQ-LCoT2-7B-Instruct
|
| 8 |
- EVA-UNIT-01/EVA-Qwen2.5-7B-v0.1
|
|
|
|
| 9 |
- Qwen/Qwen2.5-7B-Instruct-1M
|
| 10 |
-
- Qwen/Qwen2.5-
|
| 11 |
-
- Qwen/Qwen2.5-7B
|
| 12 |
-
- fblgit/cybertron-v4-qw7B-UNAMGS
|
| 13 |
- deepseek-ai/DeepSeek-R1-Distill-Qwen-7B
|
|
|
|
|
|
|
|
|
|
| 14 |
- huihui-ai/Qwen2.5-7B-Instruct-abliterated
|
| 15 |
-
-
|
| 16 |
library_name: transformers
|
| 17 |
tags:
|
| 18 |
- mergekit
|
|
@@ -31,18 +29,16 @@ This model was merged using the [TIES](https://arxiv.org/abs/2306.01708) merge m
|
|
| 31 |
### Models Merged
|
| 32 |
|
| 33 |
The following models were included in the merge:
|
| 34 |
-
* [Rombo-Org/Rombo-LLM-V2.5-Qwen-7b](https://huggingface.co/Rombo-Org/Rombo-LLM-V2.5-Qwen-7b)
|
| 35 |
-
* [Qwen/Qwen2.5-Coder-7B](https://huggingface.co/Qwen/Qwen2.5-Coder-7B)
|
| 36 |
-
* [prithivMLmods/QwQ-MathOct-7B](https://huggingface.co/prithivMLmods/QwQ-MathOct-7B)
|
| 37 |
-
* [Qwen/Qwen2.5-Math-7B](https://huggingface.co/Qwen/Qwen2.5-Math-7B)
|
| 38 |
-
* [prithivMLmods/QwQ-LCoT2-7B-Instruct](https://huggingface.co/prithivMLmods/QwQ-LCoT2-7B-Instruct)
|
| 39 |
* [EVA-UNIT-01/EVA-Qwen2.5-7B-v0.1](https://huggingface.co/EVA-UNIT-01/EVA-Qwen2.5-7B-v0.1)
|
|
|
|
| 40 |
* [Qwen/Qwen2.5-7B-Instruct-1M](https://huggingface.co/Qwen/Qwen2.5-7B-Instruct-1M)
|
| 41 |
-
* [Qwen/Qwen2.5-7B](https://huggingface.co/Qwen/Qwen2.5-7B)
|
| 42 |
-
* [fblgit/cybertron-v4-qw7B-UNAMGS](https://huggingface.co/fblgit/cybertron-v4-qw7B-UNAMGS)
|
| 43 |
* [deepseek-ai/DeepSeek-R1-Distill-Qwen-7B](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B)
|
|
|
|
|
|
|
|
|
|
| 44 |
* [huihui-ai/Qwen2.5-7B-Instruct-abliterated](https://huggingface.co/huihui-ai/Qwen2.5-7B-Instruct-abliterated)
|
| 45 |
-
* [
|
| 46 |
|
| 47 |
### Configuration
|
| 48 |
|
|
@@ -50,12 +46,6 @@ The following YAML configuration was used to produce this model:
|
|
| 50 |
|
| 51 |
```yaml
|
| 52 |
models:
|
| 53 |
-
- model: Qwen/Qwen2.5-7B-Instruct
|
| 54 |
-
parameters:
|
| 55 |
-
weight: 1
|
| 56 |
-
- model: Qwen/Qwen2.5-7B
|
| 57 |
-
parameters:
|
| 58 |
-
weight: 1
|
| 59 |
- model: Qwen/Qwen2.5-Math-7B
|
| 60 |
parameters:
|
| 61 |
weight: 1
|
|
@@ -86,9 +76,6 @@ models:
|
|
| 86 |
- model: prithivMLmods/QwQ-LCoT2-7B-Instruct
|
| 87 |
parameters:
|
| 88 |
weight: 1
|
| 89 |
-
- model: prithivMLmods/QwQ-MathOct-7B
|
| 90 |
-
parameters:
|
| 91 |
-
weight: 1
|
| 92 |
merge_method: ties
|
| 93 |
base_model: Qwen/Qwen2.5-7B-Instruct
|
| 94 |
parameters:
|
|
|
|
| 1 |
---
|
| 2 |
base_model:
|
| 3 |
+
- Qwen/Qwen2.5-7B-Instruct
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4 |
- EVA-UNIT-01/EVA-Qwen2.5-7B-v0.1
|
| 5 |
+
- HumanLLMs/Human-Like-Qwen2.5-7B-Instruct
|
| 6 |
- Qwen/Qwen2.5-7B-Instruct-1M
|
| 7 |
+
- Qwen/Qwen2.5-Math-7B
|
|
|
|
|
|
|
| 8 |
- deepseek-ai/DeepSeek-R1-Distill-Qwen-7B
|
| 9 |
+
- Qwen/Qwen2.5-Coder-7B
|
| 10 |
+
- fblgit/cybertron-v4-qw7B-UNAMGS
|
| 11 |
+
- prithivMLmods/QwQ-LCoT2-7B-Instruct
|
| 12 |
- huihui-ai/Qwen2.5-7B-Instruct-abliterated
|
| 13 |
+
- Rombo-Org/Rombo-LLM-V2.5-Qwen-7b
|
| 14 |
library_name: transformers
|
| 15 |
tags:
|
| 16 |
- mergekit
|
|
|
|
| 29 |
### Models Merged
|
| 30 |
|
| 31 |
The following models were included in the merge:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 32 |
* [EVA-UNIT-01/EVA-Qwen2.5-7B-v0.1](https://huggingface.co/EVA-UNIT-01/EVA-Qwen2.5-7B-v0.1)
|
| 33 |
+
* [HumanLLMs/Human-Like-Qwen2.5-7B-Instruct](https://huggingface.co/HumanLLMs/Human-Like-Qwen2.5-7B-Instruct)
|
| 34 |
* [Qwen/Qwen2.5-7B-Instruct-1M](https://huggingface.co/Qwen/Qwen2.5-7B-Instruct-1M)
|
| 35 |
+
* [Qwen/Qwen2.5-Math-7B](https://huggingface.co/Qwen/Qwen2.5-Math-7B)
|
|
|
|
| 36 |
* [deepseek-ai/DeepSeek-R1-Distill-Qwen-7B](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B)
|
| 37 |
+
* [Qwen/Qwen2.5-Coder-7B](https://huggingface.co/Qwen/Qwen2.5-Coder-7B)
|
| 38 |
+
* [fblgit/cybertron-v4-qw7B-UNAMGS](https://huggingface.co/fblgit/cybertron-v4-qw7B-UNAMGS)
|
| 39 |
+
* [prithivMLmods/QwQ-LCoT2-7B-Instruct](https://huggingface.co/prithivMLmods/QwQ-LCoT2-7B-Instruct)
|
| 40 |
* [huihui-ai/Qwen2.5-7B-Instruct-abliterated](https://huggingface.co/huihui-ai/Qwen2.5-7B-Instruct-abliterated)
|
| 41 |
+
* [Rombo-Org/Rombo-LLM-V2.5-Qwen-7b](https://huggingface.co/Rombo-Org/Rombo-LLM-V2.5-Qwen-7b)
|
| 42 |
|
| 43 |
### Configuration
|
| 44 |
|
|
|
|
| 46 |
|
| 47 |
```yaml
|
| 48 |
models:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 49 |
- model: Qwen/Qwen2.5-Math-7B
|
| 50 |
parameters:
|
| 51 |
weight: 1
|
|
|
|
| 76 |
- model: prithivMLmods/QwQ-LCoT2-7B-Instruct
|
| 77 |
parameters:
|
| 78 |
weight: 1
|
|
|
|
|
|
|
|
|
|
| 79 |
merge_method: ties
|
| 80 |
base_model: Qwen/Qwen2.5-7B-Instruct
|
| 81 |
parameters:
|
mergekit_config.yml
CHANGED
|
@@ -1,10 +1,4 @@
|
|
| 1 |
models:
|
| 2 |
-
- model: Qwen/Qwen2.5-7B-Instruct
|
| 3 |
-
parameters:
|
| 4 |
-
weight: 1
|
| 5 |
-
- model: Qwen/Qwen2.5-7B
|
| 6 |
-
parameters:
|
| 7 |
-
weight: 1
|
| 8 |
- model: Qwen/Qwen2.5-Math-7B
|
| 9 |
parameters:
|
| 10 |
weight: 1
|
|
@@ -35,9 +29,6 @@ models:
|
|
| 35 |
- model: prithivMLmods/QwQ-LCoT2-7B-Instruct
|
| 36 |
parameters:
|
| 37 |
weight: 1
|
| 38 |
-
- model: prithivMLmods/QwQ-MathOct-7B
|
| 39 |
-
parameters:
|
| 40 |
-
weight: 1
|
| 41 |
merge_method: ties
|
| 42 |
base_model: Qwen/Qwen2.5-7B-Instruct
|
| 43 |
parameters:
|
|
|
|
| 1 |
models:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2 |
- model: Qwen/Qwen2.5-Math-7B
|
| 3 |
parameters:
|
| 4 |
weight: 1
|
|
|
|
| 29 |
- model: prithivMLmods/QwQ-LCoT2-7B-Instruct
|
| 30 |
parameters:
|
| 31 |
weight: 1
|
|
|
|
|
|
|
|
|
|
| 32 |
merge_method: ties
|
| 33 |
base_model: Qwen/Qwen2.5-7B-Instruct
|
| 34 |
parameters:
|
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4970978712
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ebbf92d8fa7099e76e5c3aa282db8c73cec827a1e1b98e419af2c13611cd5074
|
| 3 |
size 4970978712
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751032
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1ae6864ff524d844d57dd536aa40d329f504ff42f0c43a1b61c685b308c8e083
|
| 3 |
size 4932751032
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4991495808
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:565df93157b48ced2098f2289cdfa91335398e8c89452e72c729d279cd149099
|
| 3 |
size 4991495808
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 330326240
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f0c8c30e087abc96f0a87093b0e671f75e94a65c96aee06923fc8afb4064e81d
|
| 3 |
size 330326240
|