AdamF92 committed on
Commit
59608f3
·
verified ·
1 Parent(s): d17b9ba

Push model using huggingface_hub.

Browse files
Files changed (3) hide show
  1. README.md +12 -0
  2. config.json +1 -1
  3. model.safetensors +2 -2
README.md ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ pipeline_tag: text-generation
4
+ tags:
5
+ - model_hub_mixin
6
+ - pytorch_model_hub_mixin
7
+ ---
8
+
9
+ This model has been pushed to the Hub using the [PyTorchModelHubMixin](https://huggingface.co/docs/huggingface_hub/package_reference/mixins#huggingface_hub.PyTorchModelHubMixin) integration:
10
+ - Code: [More Information Needed]
11
+ - Paper: [More Information Needed]
12
+ - Docs: [More Information Needed]
config.json CHANGED
@@ -31,7 +31,7 @@
31
  "dense",
32
  "moe"
33
  ],
34
- "stm_size": 4096,
35
  "use_attention_output_bias": false,
36
  "use_flash_attention": true,
37
  "use_gated": true,
 
31
  "dense",
32
  "moe"
33
  ],
34
+ "stm_size": 8192,
35
  "use_attention_output_bias": false,
36
  "use_flash_attention": true,
37
  "use_gated": true,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2e7ba42775d06d2150c8bd380ff47b6a6a6c23aff03e4aea974f7f30da7f72b1
3
- size 5860365104
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf7d67025934ef0acebfc67241443252fdd159ca84f5cff9a150852e114ad1ca
3
+ size 5772284720