Push model using huggingface_hub.
Browse files
- config.json +1 -0
- model.safetensors +1 -1
config.json
CHANGED
|
@@ -79,6 +79,7 @@
|
|
| 79 |
"num_layers": 21,
|
| 80 |
"residual_gate_type": "elementwise",
|
| 81 |
"residual_per_slot_gate": true,
|
|
|
|
| 82 |
"seq_len": 8192,
|
| 83 |
"stm_size": 4096,
|
| 84 |
"use_flash_attention": false,
|
|
|
|
| 79 |
"num_layers": 21,
|
| 80 |
"residual_gate_type": "elementwise",
|
| 81 |
"residual_per_slot_gate": true,
|
| 82 |
+
"rope_base": 100000,
|
| 83 |
"seq_len": 8192,
|
| 84 |
"stm_size": 4096,
|
| 85 |
"use_flash_attention": false,
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 6099558592
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:59612cdd21216f17ccc3ea9ddbe05e76e5198888748b15a785692f15dd3e87f7
|
| 3 |
size 6099558592
|