Doctor-Shotgun committed on
Commit
38b9432
·
verified ·
1 Parent(s): 955fdd4

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes. See the raw diff.
Files changed (50) hide show
  1. config.json +113 -0
  2. model-00001.safetensors +3 -0
  3. model-00002.safetensors +3 -0
  4. model-00003.safetensors +3 -0
  5. model-00004.safetensors +3 -0
  6. model-00005.safetensors +3 -0
  7. model-00006.safetensors +3 -0
  8. model-00007.safetensors +3 -0
  9. model-00008.safetensors +3 -0
  10. model-00009.safetensors +3 -0
  11. model-00010.safetensors +3 -0
  12. model-00011.safetensors +3 -0
  13. model-00012.safetensors +3 -0
  14. model-00013.safetensors +3 -0
  15. model-00014.safetensors +3 -0
  16. model-00015.safetensors +3 -0
  17. model-00016.safetensors +3 -0
  18. model-00017.safetensors +3 -0
  19. model-00018.safetensors +3 -0
  20. model-00019.safetensors +3 -0
  21. model-00020.safetensors +3 -0
  22. model-00021.safetensors +3 -0
  23. model-00022.safetensors +3 -0
  24. model-00023.safetensors +3 -0
  25. model-00024.safetensors +3 -0
  26. model-00025.safetensors +3 -0
  27. model-00026.safetensors +3 -0
  28. model-00027.safetensors +3 -0
  29. model-00028.safetensors +3 -0
  30. model-00029.safetensors +3 -0
  31. model-00030.safetensors +3 -0
  32. model-00031.safetensors +3 -0
  33. model-00032.safetensors +3 -0
  34. model-00033.safetensors +3 -0
  35. model-00034.safetensors +3 -0
  36. model-00035.safetensors +3 -0
  37. model-00036.safetensors +3 -0
  38. model-00037.safetensors +3 -0
  39. model-00038.safetensors +3 -0
  40. model-00039.safetensors +3 -0
  41. model-00040.safetensors +3 -0
  42. model-00041.safetensors +3 -0
  43. model-00042.safetensors +3 -0
  44. model-00043.safetensors +3 -0
  45. model-00044.safetensors +3 -0
  46. model-00045.safetensors +3 -0
  47. model-00046.safetensors +3 -0
  48. model-00047.safetensors +3 -0
  49. model-00048.safetensors +3 -0
  50. model-00049.safetensors +3 -0
config.json ADDED
@@ -0,0 +1,113 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "MiniMaxM2ForCausalLM"
4
+ ],
5
+ "attn_type_list": [
6
+ 1,
7
+ 1,
8
+ 1,
9
+ 1,
10
+ 1,
11
+ 1,
12
+ 1,
13
+ 1,
14
+ 1,
15
+ 1,
16
+ 1,
17
+ 1,
18
+ 1,
19
+ 1,
20
+ 1,
21
+ 1,
22
+ 1,
23
+ 1,
24
+ 1,
25
+ 1,
26
+ 1,
27
+ 1,
28
+ 1,
29
+ 1,
30
+ 1,
31
+ 1,
32
+ 1,
33
+ 1,
34
+ 1,
35
+ 1,
36
+ 1,
37
+ 1,
38
+ 1,
39
+ 1,
40
+ 1,
41
+ 1,
42
+ 1,
43
+ 1,
44
+ 1,
45
+ 1,
46
+ 1,
47
+ 1,
48
+ 1,
49
+ 1,
50
+ 1,
51
+ 1,
52
+ 1,
53
+ 1,
54
+ 1,
55
+ 1,
56
+ 1,
57
+ 1,
58
+ 1,
59
+ 1,
60
+ 1,
61
+ 1,
62
+ 1,
63
+ 1,
64
+ 1,
65
+ 1,
66
+ 1,
67
+ 1
68
+ ],
69
+ "auto_map": {
70
+ "AutoConfig": "configuration_minimax_m2.MiniMaxM2Config",
71
+ "AutoModelForCausalLM": "modeling_minimax_m2.MiniMaxM2ForCausalLM"
72
+ },
73
+ "head_dim": 128,
74
+ "hidden_act": "silu",
75
+ "hidden_size": 3072,
76
+ "intermediate_size": 1536,
77
+ "max_position_embeddings": 196608,
78
+ "model_type": "minimax_m2",
79
+ "mtp_transformer_layers": 1,
80
+ "num_attention_heads": 48,
81
+ "num_experts_per_tok": 8,
82
+ "num_hidden_layers": 62,
83
+ "num_key_value_heads": 8,
84
+ "num_local_experts": 256,
85
+ "num_mtp_modules": 3,
86
+ "qk_norm_type": "per_layer",
87
+ "quantization_config": {
88
+ "activation_scheme": "dynamic",
89
+ "fmt": "float8_e4m3fn",
90
+ "quant_method": "fp8",
91
+ "weight_block_size": [
92
+ 128,
93
+ 128
94
+ ],
95
+ "modules_to_not_convert": [
96
+ "gate",
97
+ "e_score_correction_bias",
98
+ "lm_head"
99
+ ]
100
+ },
101
+ "rms_norm_eps": 1e-06,
102
+ "rope_theta": 5000000,
103
+ "rotary_dim": 64,
104
+ "scoring_func": "sigmoid",
105
+ "shared_intermediate_size": 0,
106
+ "tie_word_embeddings": false,
107
+ "transformers_version": "4.46.1",
108
+ "use_cache": true,
109
+ "use_mtp": true,
110
+ "use_qk_norm": true,
111
+ "use_routing_bias": true,
112
+ "vocab_size": 200064
113
+ }
model-00001.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5de8077213accff91b38a4e4fd0e516b71a8fcc50e7f45610b0268e396f95407
3
+ size 1777468168
model-00002.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1da7bf8eddd07db6a5cb73918d43965b680c056546022e1eea1c474895ac5981
3
+ size 1777468168
model-00003.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3567e44e12b03ed82e1f97cd5307bad634767869e908711e73a0983e1cb52200
3
+ size 1777468080
model-00004.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e369f892bd1e17bcde868dd1d664624988193de1211fb36ac949f7195db257c0
3
+ size 1777468168
model-00005.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a229748e6ac274cf3d3eeb90050846962bc229e590000bd758bfe5ed4d8ec07
3
+ size 1777468000
model-00006.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4382ceee9f2818706b5d4ca396ffcb032d15165434c920307760e301eb50852c
3
+ size 1777468168
model-00007.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b47844b9c106ed811868fa2507901c4f5b077c05c76cf7d96d79ad9427ac632
3
+ size 1777468032
model-00008.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:266aaed8b5f34e5770dd07edf0039772a8c655b6c322f6c95e561afd14a9b3eb
3
+ size 1777468168
model-00009.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49c48d66650c430a69fbb34869b7e52f70aa1b00578f70424881455e172f50a7
3
+ size 1777468168
model-00010.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82e2dfe3d40b369813f0b5bf202597d3e5187c487049caef1edf4324e4163c08
3
+ size 1777468168
model-00011.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4953f65cdd2839d32a5cf70d2ce97e8a1892cef3482ea52ad2d43d36d2bfe2c
3
+ size 1777468168
model-00012.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:54754136048c7be202a0a22e616057d6ed375ed229e3d58b0b2e685edb7fd88a
3
+ size 1777468168
model-00013.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77242200334156c2a24ab7137445339ab46ee59d340614972d5fb93424249b24
3
+ size 1777468168
model-00014.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c128a67041a5cd0666bc993800f6ce7f052a3599e0c2f7a15f6142390900c568
3
+ size 1777468240
model-00015.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:141a37a9d88a531d39e888689f9f2b38ca0bc58e8136271934919ae3030e5233
3
+ size 1777468240
model-00016.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d574242dd6f0bfb2d06837cfa7d863ac09e2559208e50702341729b8876bf43
3
+ size 1777468240
model-00017.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:70e525c0ed663ef7ff6bc52af57d1f61f4040fbdf881f43cd79805228edd6a3d
3
+ size 1777468240
model-00018.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dcf6f8ac7ddbdecb4656e149543b17d05616da840b71aca71a7eaf7ba657e0c7
3
+ size 1777468240
model-00019.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4522d36db3a17800c16914a62f4de4b07af96886cdc025c57d9abcf6b4eb75e2
3
+ size 1777468240
model-00020.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c9d7ab43b275f83e9d703823963dbae4cfe3a7ae6aa65fd1aa6c137f03b3556
3
+ size 1777468240
model-00021.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40f4576fbf009b045d547b14add0740d15919415107f827920a00995b0f4a4b6
3
+ size 1777469832
model-00022.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20f44b115e8099d88c9461df7ff34d08f08d238f4bd1db3cd26185506567efec
3
+ size 1777471216
model-00023.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5706b6fe7635834596b4e7d52275f4264672dfb566b3882c008714bc439023e4
3
+ size 1777471168
model-00024.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:721e18f1ce5df9d0c103ef054e495113d1d6a6812542087eb4d8804e735ee621
3
+ size 1777471168
model-00025.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab14a28c0f0b5b53b7011098961f7b3799841744c0e22d42af783a50ac626c17
3
+ size 1777471168
model-00026.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5820e7db15e7e8e455b88b195243670678a6389f7707e2089336b62358d21ec9
3
+ size 1777471168
model-00027.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f10ccdf4c12ec72311b97d7030ea6ca8888b9371972ccaeaa262f3e1753bf3b
3
+ size 1777471168
model-00028.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b942ad04e210b1b9d67121ded266494b5f2336669f04686589df4e92d5c025aa
3
+ size 1777471168
model-00029.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8aaaa25713fc4389c5acd11034af14682a9640402c2e7fdcf220126352a282a3
3
+ size 1777471168
model-00030.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d4c49719fd444bf1c45f0df107d677f0e06913045fcd7c22a4d9b672e6aedbf1
3
+ size 1777471168
model-00031.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d1819aa55743c0134f415230cbc2af7aacc37ffa702472e78afeac9c239c7f0
3
+ size 1777471168
model-00032.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dfc7aaba1cf41a6c314890447aed3a67ee6de6c1121e73ad21d8aa451eb5537e
3
+ size 1777471168
model-00033.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98bc232a5fb9d7d5eaed73ca07c78303180f52cfdd9805c8d2dfb2613d31e4c6
3
+ size 1777471168
model-00034.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68656ea95fc0c745582c5ec4439693e6b3c1713ae5a307ed28168a1200014f53
3
+ size 1777471168
model-00035.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4515364140fa9be08db3f9f5be5435a6ae5a5a4d3a3dfcecfcb13cf1540d0b92
3
+ size 1777471216
model-00036.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22787db1c6132fe70bc12d87895d662cb057ce722178129977b73269cf52cbd9
3
+ size 1777471240
model-00037.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49fded37a8eeca98000b1deb526f762422ab7ffa77e9ae2f7a6d48937daf00a4
3
+ size 1777471240
model-00038.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f41f443804771da9bd29a6950d6231b94c7b0bd2d0e86bae7af8a406a3bcdb6
3
+ size 1777471240
model-00039.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:29726e93720f644d7be7f2f274bca7daca0f4a1bcc4f8db45bf6776d73638227
3
+ size 1777471240
model-00040.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbc454b83547445d0e5f83899d72c07b27fe52f6767ffa066836593e258a3531
3
+ size 1777471240
model-00041.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a6676a9f1a55ab9d8dabcc7c132c57824677c54c45afa1bd06f2ec44dbd4fb7
3
+ size 1777471240
model-00042.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81a94b36bd130e8672e0b89dcfa001fab36bedf1e3db2ae54c8e957cce337d92
3
+ size 1777471248
model-00043.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ce3ec9c7b38f7b70500a6e9bcf7998fd331298fe09535826334129edee97d7a
3
+ size 1777471264
model-00044.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71c3910f818a63f6b0633bb14b7367de5c59d04df68b081b4642e7280c0a7133
3
+ size 1777471136
model-00045.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec16cf3d249b836861ec00f37f89988c7f5563bf3a4a68e30351dd2027947893
3
+ size 1777471168
model-00046.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9196f656ca08af47f5af5d392f2cc605cefe6436de97a6816047e2b51b42f9c7
3
+ size 1777471064
model-00047.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15fc5926a325b4e58b9cb4c2d4a5d696152f7ba3093710e7c9693fd8b58c506b
3
+ size 1777471168
model-00048.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e34f18af1da5eabcce11524f0e638ca7507d55e2d60bd1fcc84c243832019a08
3
+ size 1777470984
model-00049.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27e7bef87922cba48c40361d089e82acadff62eb8c11403ad7ec39f8d2da6d56
3
+ size 1777471168