Upload model

Browse files

Files changed (6) hide show

README.md +34 -7
config.json +1 -1
mergekit_config.yml +24 -3
model-00001-of-00001.safetensors +1 -1
tokenizer.json +2 -2
tokenizer_config.json +1 -0

README.md CHANGED Viewed

@@ -1,28 +1,34 @@
 ---
 base_model:
 - starnet/19star03
-- lionking927/s11-m1-0303
 - starnet/15star03
 library_name: transformers
 tags:
 - mergekit
 - merge
 ---
-# output
 This is a merge of pre-trained language models created using [mergekit](https://github.com/cg123/mergekit).
 ## Merge Details
 ### Merge Method
-This model was merged using the [TIES](https://arxiv.org/abs/2306.01708) merge method using [starnet/15star03](https://huggingface.co/starnet/15star03) as a base.
 ### Models Merged
 The following models were included in the merge:
 * [starnet/19star03](https://huggingface.co/starnet/19star03)
-* [lionking927/s11-m1-0303](https://huggingface.co/lionking927/s11-m1-0303)
 ### Configuration
@@ -30,7 +36,7 @@ The following YAML configuration was used to produce this model:
 ```yaml
 models:
-  - model: starnet/15star03
     parameters:
       density: [1, 0.7, 0.1] # density gradient
       weight: 1.0
@@ -38,7 +44,28 @@ models:
     parameters:
       density: 0.5
       weight: [0, 0.3, 0.7, 1] # weight gradient
-  - model: lionking927/s11-m1-0303
     parameters:
       density: 0.33
       weight:
@@ -46,7 +73,7 @@ models:
           value: 0.5
         - value: 0
 merge_method: ties
-base_model: starnet/15star03
 parameters:
   normalize: true
   int8_mask: true

 ---
 base_model:
+- aks1s/13Aks-18
 - starnet/19star03
+- OwOpeepeepoopoo/ZZZZZsubmission7
+- OwOpeepeepoopoo/ZZZZZsubmission5
 - starnet/15star03
+- irusl/05Ir-4
 library_name: transformers
 tags:
 - mergekit
 - merge
 ---
+# output_2
 This is a merge of pre-trained language models created using [mergekit](https://github.com/cg123/mergekit).
 ## Merge Details
 ### Merge Method
+This model was merged using the [TIES](https://arxiv.org/abs/2306.01708) merge method using [irusl/05Ir-4](https://huggingface.co/irusl/05Ir-4) as a base.
 ### Models Merged
 The following models were included in the merge:
+* [aks1s/13Aks-18](https://huggingface.co/aks1s/13Aks-18)
 * [starnet/19star03](https://huggingface.co/starnet/19star03)
+* [OwOpeepeepoopoo/ZZZZZsubmission7](https://huggingface.co/OwOpeepeepoopoo/ZZZZZsubmission7)
+* [OwOpeepeepoopoo/ZZZZZsubmission5](https://huggingface.co/OwOpeepeepoopoo/ZZZZZsubmission5)
+* [starnet/15star03](https://huggingface.co/starnet/15star03)
 ### Configuration
 ```yaml
 models:
+  - model: irusl/05Ir-4
     parameters:
       density: [1, 0.7, 0.1] # density gradient
       weight: 1.0
     parameters:
       density: 0.5
       weight: [0, 0.3, 0.7, 1] # weight gradient
+  - model: starnet/15star03
+    parameters:
+      density: 0.33
+      weight:
+        - filter: mlp
+          value: 0.5
+        - value: 0
+  - model: aks1s/13Aks-18
+    parameters:
+      density: 0.33
+      weight:
+        - filter: mlp
+          value: 0.5
+        - value: 0
+  - model: OwOpeepeepoopoo/ZZZZZsubmission7
+    parameters:
+      density: 0.33
+      weight:
+        - filter: mlp
+          value: 0.5
+        - value: 0
+  - model: OwOpeepeepoopoo/ZZZZZsubmission5
     parameters:
       density: 0.33
       weight:
           value: 0.5
         - value: 0
 merge_method: ties
+base_model: irusl/05Ir-4
 parameters:
   normalize: true
   int8_mask: true

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "starnet/15star03",
   "architectures": [
     "StableLmForCausalLM"
   ],

 {
+  "_name_or_path": "irusl/05Ir-4",
   "architectures": [
     "StableLmForCausalLM"
   ],

mergekit_config.yml CHANGED Viewed

@@ -1,5 +1,5 @@
 models:
-  - model: starnet/15star03
     parameters:
       density: [1, 0.7, 0.1] # density gradient
       weight: 1.0
@@ -7,7 +7,28 @@ models:
     parameters:
       density: 0.5
       weight: [0, 0.3, 0.7, 1] # weight gradient
-  - model: lionking927/s11-m1-0303
     parameters:
       density: 0.33
       weight:
@@ -15,7 +36,7 @@ models:
           value: 0.5
         - value: 0
 merge_method: ties
-base_model: starnet/15star03
 parameters:
   normalize: true
   int8_mask: true

 models:
+  - model: irusl/05Ir-4
     parameters:
       density: [1, 0.7, 0.1] # density gradient
       weight: 1.0
     parameters:
       density: 0.5
       weight: [0, 0.3, 0.7, 1] # weight gradient
+  - model: starnet/15star03
+    parameters:
+      density: 0.33
+      weight:
+        - filter: mlp
+          value: 0.5
+        - value: 0
+  - model: aks1s/13Aks-18
+    parameters:
+      density: 0.33
+      weight:
+        - filter: mlp
+          value: 0.5
+        - value: 0
+  - model: OwOpeepeepoopoo/ZZZZZsubmission7
+    parameters:
+      density: 0.33
+      weight:
+        - filter: mlp
+          value: 0.5
+        - value: 0
+  - model: OwOpeepeepoopoo/ZZZZZsubmission5
     parameters:
       density: 0.33
       weight:
           value: 0.5
         - value: 0
 merge_method: ties
+base_model: irusl/05Ir-4
 parameters:
   normalize: true
   int8_mask: true

model-00001-of-00001.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0a79c3d9cc401e05fc6565283c5dde1951cee752180b701a7d82c46f87a098df
 size 3289069184

 version https://git-lfs.github.com/spec/v1
+oid sha256:e739e741d073e503685db1a5c3be3acc11b18ef5306efa408d781b6d0579d2d4
 size 3289069184

tokenizer.json CHANGED Viewed

@@ -2,13 +2,13 @@
   "version": "1.0",
   "truncation": {
     "direction": "Right",
-    "max_length": 3896,
     "strategy": "LongestFirst",
     "stride": 0
   },
   "padding": {
     "strategy": {
-      "Fixed": 3896
     },
     "direction": "Left",
     "pad_to_multiple_of": null,

   "version": "1.0",
   "truncation": {
     "direction": "Right",
+    "max_length": 3696,
     "strategy": "LongestFirst",
     "stride": 0
   },
   "padding": {
     "strategy": {
+      "Fixed": 3696
     },
     "direction": "Left",
     "pad_to_multiple_of": null,

tokenizer_config.json CHANGED Viewed

@@ -1,4 +1,5 @@
 {
   "add_prefix_space": false,
   "added_tokens_decoder": {
     "100256": {

 {
+  "add_bos_token": true,
   "add_prefix_space": false,
   "added_tokens_decoder": {
     "100256": {