Upload folder using huggingface_hub
Browse files- README.md +6 -6
- mergekit_moe_config.yml +6 -6
README.md
CHANGED
|
@@ -20,10 +20,10 @@ tags:
|
|
| 20 |
#parameters:
|
| 21 |
# t:
|
| 22 |
# - filter: self_attn
|
| 23 |
-
# value: [0.
|
| 24 |
# - filter: mlp
|
| 25 |
-
# value: [0.
|
| 26 |
-
# - value: 0.
|
| 27 |
#dtype: bfloat16
|
| 28 |
#random_seed: 0
|
| 29 |
|
|
@@ -38,10 +38,10 @@ tags:
|
|
| 38 |
#parameters:
|
| 39 |
# t:
|
| 40 |
# - filter: self_attn
|
| 41 |
-
# value: [0.
|
| 42 |
# - filter: mlp
|
| 43 |
-
# value: [0.
|
| 44 |
-
# - value: 0.
|
| 45 |
#dtype: float16
|
| 46 |
#random_seed: 0
|
| 47 |
|
|
|
|
| 20 |
#parameters:
|
| 21 |
# t:
|
| 22 |
# - filter: self_attn
|
| 23 |
+
# value: [0.6606117722434863, 0.01708760797547526, 0.8948656675765086, 0.47128075561315386, 0.5692245310177902]
|
| 24 |
# - filter: mlp
|
| 25 |
+
# value: [0.33938822775651367, 0.9829123920245247, 0.10513433242349135, 0.5287192443868461, 0.43077546898220975]
|
| 26 |
+
# - value: 0.14995989969007373
|
| 27 |
#dtype: bfloat16
|
| 28 |
#random_seed: 0
|
| 29 |
|
|
|
|
| 38 |
#parameters:
|
| 39 |
# t:
|
| 40 |
# - filter: self_attn
|
| 41 |
+
# value: [0.6606117722434863, 0.01708760797547526, 0.8948656675765086, 0.47128075561315386, 0.5692245310177902]
|
| 42 |
# - filter: mlp
|
| 43 |
+
# value: [0.33938822775651367, 0.9829123920245247, 0.10513433242349135, 0.5287192443868461, 0.43077546898220975]
|
| 44 |
+
# - value: 0.14995989969007373
|
| 45 |
#dtype: float16
|
| 46 |
#random_seed: 0
|
| 47 |
|
mergekit_moe_config.yml
CHANGED
|
@@ -10,10 +10,10 @@
|
|
| 10 |
#parameters:
|
| 11 |
# t:
|
| 12 |
# - filter: self_attn
|
| 13 |
-
# value: [0.
|
| 14 |
# - filter: mlp
|
| 15 |
-
# value: [0.
|
| 16 |
-
# - value: 0.
|
| 17 |
#dtype: bfloat16
|
| 18 |
#random_seed: 0
|
| 19 |
|
|
@@ -28,10 +28,10 @@
|
|
| 28 |
#parameters:
|
| 29 |
# t:
|
| 30 |
# - filter: self_attn
|
| 31 |
-
# value: [0.
|
| 32 |
# - filter: mlp
|
| 33 |
-
# value: [0.
|
| 34 |
-
# - value: 0.
|
| 35 |
#dtype: float16
|
| 36 |
#random_seed: 0
|
| 37 |
|
|
|
|
| 10 |
#parameters:
|
| 11 |
# t:
|
| 12 |
# - filter: self_attn
|
| 13 |
+
# value: [0.6606117722434863, 0.01708760797547526, 0.8948656675765086, 0.47128075561315386, 0.5692245310177902]
|
| 14 |
# - filter: mlp
|
| 15 |
+
# value: [0.33938822775651367, 0.9829123920245247, 0.10513433242349135, 0.5287192443868461, 0.43077546898220975]
|
| 16 |
+
# - value: 0.14995989969007373
|
| 17 |
#dtype: bfloat16
|
| 18 |
#random_seed: 0
|
| 19 |
|
|
|
|
| 28 |
#parameters:
|
| 29 |
# t:
|
| 30 |
# - filter: self_attn
|
| 31 |
+
# value: [0.6606117722434863, 0.01708760797547526, 0.8948656675765086, 0.47128075561315386, 0.5692245310177902]
|
| 32 |
# - filter: mlp
|
| 33 |
+
# value: [0.33938822775651367, 0.9829123920245247, 0.10513433242349135, 0.5287192443868461, 0.43077546898220975]
|
| 34 |
+
# - value: 0.14995989969007373
|
| 35 |
#dtype: float16
|
| 36 |
#random_seed: 0
|
| 37 |
|