BICORP committed on
Commit
a7ee440
·
verified ·
1 Parent(s): 61adf34

Upload 2 files

Browse files
config.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"max_batch_size": 2, "max_seq_len": 8192, "dtype": "bf16", "vocab_size": 5557, "dim": 2096, "inter_dim": 1048, "moe_inter_dim": 548, "n_layers": 12, "n_dense_layers": 1, "n_heads": 16, "n_routed_experts": 32, "n_shared_experts": 2, "n_activated_experts": 6, "score_func": "softmax", "route_scale": 1.0, "q_lora_rank": 0, "kv_lora_rank": 512, "qk_nope_head_dim": 128, "qk_rope_head_dim": 64, "v_head_dim": 128, "original_seq_len": 4096, "rope_theta": 10000.0, "rope_factor": 40, "beta_fast": 32, "beta_slow": 1, "mscale": 1.0}
transformer_model-00001-of-00001-bf16.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be0fe8480a58f30a28e8c2d40d5f3854b6f24786adc6ca12b983d3e3fbb991d9
3
+ size 2137883416