davidgortega committed on
Commit
233e001
·
1 Parent(s): e3ab0d1

first commit

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. MLC32/added_tokens.json +42 -0
  2. MLC32/merges.txt +0 -0
  3. MLC32/mlc-chat-config.json +75 -0
  4. MLC32/ndarray-cache-b16.json +0 -0
  5. MLC32/ndarray-cache.json +0 -0
  6. MLC32/params_shard_0.bin +3 -0
  7. MLC32/params_shard_1.bin +3 -0
  8. MLC32/params_shard_10.bin +3 -0
  9. MLC32/params_shard_100.bin +3 -0
  10. MLC32/params_shard_101.bin +3 -0
  11. MLC32/params_shard_102.bin +3 -0
  12. MLC32/params_shard_103.bin +3 -0
  13. MLC32/params_shard_104.bin +3 -0
  14. MLC32/params_shard_105.bin +3 -0
  15. MLC32/params_shard_106.bin +3 -0
  16. MLC32/params_shard_107.bin +3 -0
  17. MLC32/params_shard_108.bin +3 -0
  18. MLC32/params_shard_109.bin +3 -0
  19. MLC32/params_shard_11.bin +3 -0
  20. MLC32/params_shard_110.bin +3 -0
  21. MLC32/params_shard_111.bin +3 -0
  22. MLC32/params_shard_112.bin +3 -0
  23. MLC32/params_shard_113.bin +3 -0
  24. MLC32/params_shard_12.bin +3 -0
  25. MLC32/params_shard_13.bin +3 -0
  26. MLC32/params_shard_14.bin +3 -0
  27. MLC32/params_shard_15.bin +3 -0
  28. MLC32/params_shard_16.bin +3 -0
  29. MLC32/params_shard_17.bin +3 -0
  30. MLC32/params_shard_18.bin +3 -0
  31. MLC32/params_shard_19.bin +3 -0
  32. MLC32/params_shard_2.bin +3 -0
  33. MLC32/params_shard_20.bin +3 -0
  34. MLC32/params_shard_21.bin +3 -0
  35. MLC32/params_shard_22.bin +3 -0
  36. MLC32/params_shard_23.bin +3 -0
  37. MLC32/params_shard_24.bin +3 -0
  38. MLC32/params_shard_25.bin +3 -0
  39. MLC32/params_shard_26.bin +3 -0
  40. MLC32/params_shard_27.bin +3 -0
  41. MLC32/params_shard_28.bin +3 -0
  42. MLC32/params_shard_29.bin +3 -0
  43. MLC32/params_shard_3.bin +3 -0
  44. MLC32/params_shard_30.bin +3 -0
  45. MLC32/params_shard_31.bin +3 -0
  46. MLC32/params_shard_32.bin +3 -0
  47. MLC32/params_shard_33.bin +3 -0
  48. MLC32/params_shard_34.bin +3 -0
  49. MLC32/params_shard_35.bin +3 -0
  50. MLC32/params_shard_36.bin +3 -0
MLC32/added_tokens.json ADDED
@@ -0,0 +1,42 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "\t\t": 50294,
3
+ "\t\t\t": 50293,
4
+ "\t\t\t\t": 50292,
5
+ "\t\t\t\t\t": 50291,
6
+ "\t\t\t\t\t\t": 50290,
7
+ "\t\t\t\t\t\t\t": 50289,
8
+ "\t\t\t\t\t\t\t\t": 50288,
9
+ "\t\t\t\t\t\t\t\t\t": 50287,
10
+ " ": 50286,
11
+ " ": 50285,
12
+ " ": 50284,
13
+ " ": 50283,
14
+ " ": 50282,
15
+ " ": 50281,
16
+ " ": 50280,
17
+ " ": 50279,
18
+ " ": 50278,
19
+ " ": 50277,
20
+ " ": 50276,
21
+ " ": 50275,
22
+ " ": 50274,
23
+ " ": 50273,
24
+ " ": 50272,
25
+ " ": 50271,
26
+ " ": 50270,
27
+ " ": 50269,
28
+ " ": 50268,
29
+ " ": 50267,
30
+ " ": 50266,
31
+ " ": 50265,
32
+ " ": 50264,
33
+ " ": 50263,
34
+ " ": 50262,
35
+ " ": 50261,
36
+ " ": 50260,
37
+ " ": 50259,
38
+ " ": 50258,
39
+ " ": 50257,
40
+ "<|im_end|>": 50295,
41
+ "<|im_start|>": 50296
42
+ }
MLC32/merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
MLC32/mlc-chat-config.json ADDED
@@ -0,0 +1,75 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "model_type": "phi-msft",
3
+ "quantization": "q0f32",
4
+ "model_config": {
5
+ "model_type": "phi-msft",
6
+ "vocab_size": 51200,
7
+ "n_positions": 2048,
8
+ "n_embd": 2560,
9
+ "n_layer": 32,
10
+ "n_inner": 10240,
11
+ "n_head": 32,
12
+ "rotary_dim": 32,
13
+ "position_embedding_base": 10000,
14
+ "layer_norm_epsilon": 1e-05,
15
+ "context_window_size": 2048,
16
+ "prefill_chunk_size": 2048,
17
+ "n_head_kv": 32,
18
+ "head_dim": 80,
19
+ "tensor_parallel_shards": 1
20
+ },
21
+ "vocab_size": 51200,
22
+ "context_window_size": 2048,
23
+ "sliding_window_size": -1,
24
+ "prefill_chunk_size": 2048,
25
+ "attention_sink_size": -1,
26
+ "tensor_parallel_shards": 1,
27
+ "mean_gen_len": 128,
28
+ "max_gen_len": 512,
29
+ "shift_fill_factor": 0.3,
30
+ "temperature": 0.7,
31
+ "presence_penalty": 0.0,
32
+ "frequency_penalty": 0.0,
33
+ "repetition_penalty": 1.0,
34
+ "top_p": 0.95,
35
+ "conv_template": {
36
+ "name": "chatml",
37
+ "system_template": "<|im_start|>system\n{system_message}",
38
+ "system_message": "A conversation between a user and an LLM-based AI assistant. The assistant gives helpful and honest answers.",
39
+ "add_role_after_system_message": true,
40
+ "roles": {
41
+ "user": "<|im_start|>user",
42
+ "assistant": "<|im_start|>assistant"
43
+ },
44
+ "role_templates": {
45
+ "user": "{user_message}",
46
+ "assistant": "{assistant_message}",
47
+ "tool": "{tool_message}"
48
+ },
49
+ "messages": [],
50
+ "seps": [
51
+ "<|im_end|>\n"
52
+ ],
53
+ "role_content_sep": "\n",
54
+ "role_empty_sep": "\n",
55
+ "stop_str": [
56
+ "<|im_end|>"
57
+ ],
58
+ "stop_token_ids": [
59
+ 2
60
+ ],
61
+ "function_string": "",
62
+ "use_function_calling": false
63
+ },
64
+ "pad_token_id": 0,
65
+ "bos_token_id": 1,
66
+ "eos_token_id": 2,
67
+ "tokenizer_files": [
68
+ "tokenizer.json",
69
+ "vocab.json",
70
+ "merges.txt",
71
+ "added_tokens.json",
72
+ "tokenizer_config.json"
73
+ ],
74
+ "version": "0.1.0"
75
+ }
MLC32/ndarray-cache-b16.json ADDED
The diff for this file is too large to render. See raw diff
 
MLC32/ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
MLC32/params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ba9ffed0d64ef572b721255dd7dcc7f5852c420f41073ae5d38ba7ca6e46d3b
3
+ size 262144000
MLC32/params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b11f7a95c291cc7e189727c00879b899ecb2d041a595e0b92edf83e5c95a2d90
3
+ size 39321600
MLC32/params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8bb15f1cb3536f6832426f207075ffbda11ed5d46fbd74cbcb2689a9879faf0f
3
+ size 52428800
MLC32/params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ce588a1d174b7263f2dc9ef467f50f210def6eba07dd07c926d89318490791d
3
+ size 26327040
MLC32/params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e08de8a0cfd5a77548d5f1867776f080cdcd82e34edb1e33ee55bd3ecbdf38f7
3
+ size 52428800
MLC32/params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db3d6e6ce698dd3b95732bc8236380f5ce91350ea33a644a8f760ac97c3cdca1
3
+ size 52428800
MLC32/params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8dfe8178b3d6edbb5a874c20b5173490acd856f89f268e37fa31f5b76f452960
3
+ size 39321600
MLC32/params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d2ddf5d08f4519e71e81ed9793bc9dc43ee0c913bd415c9c4744eb24d8c7541
3
+ size 52428800
MLC32/params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:694fee14ff88bfcf9f9e16be882c89a8cfeee08e093142001160daa5f53fb888
3
+ size 52428800
MLC32/params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:263727517853bbfd5c9e43bf34ab90a418448e787e9f079e88967cdb0bde4349
3
+ size 39321600
MLC32/params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c41ea2c2ac3878e7dface27a62cd6065f180c05da262012bb9b62823360ef63
3
+ size 26327040
MLC32/params_shard_108.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:612d683124e578c8c3fe659701e8b9b895162315abda77c596f19488aa641dc8
3
+ size 52428800
MLC32/params_shard_109.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:265c7ba4281f4e9970b3ccbd21eeec5a233b539a11ec1ef304bc9cef6814e5e8
3
+ size 52428800
MLC32/params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1145a501247888af1be6e06ee6d014d1900b6a4f50b7f47b912ab48bcd8a89b3
3
+ size 52428800
MLC32/params_shard_110.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d097fe071c19cae9ca64cf15a89971e72904a805948a97f06f9f83f924e414c2
3
+ size 39321600
MLC32/params_shard_111.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d42203e716f570e8db6c063fc290b98b9c42538607cd9cc0c6c730b1cbcac05e
3
+ size 52428800
MLC32/params_shard_112.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c803335f7d08979a7195af0aae96797748c08f99d7d032b3c3bbf579865dda76
3
+ size 52428800
MLC32/params_shard_113.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a52368775787bdb3194f2fb448c9e95febabf511fb4fea224693becbfdd911c7
3
+ size 26296320
MLC32/params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6d9c605defb3b8fdd4692f4e7118f277f613f33bd7e794efc1ca26e2af7d696
3
+ size 39321600
MLC32/params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e243e23ccb8953f87e347c79a8318967b8a9196e8a9872081fd4f6a44cf485ec
3
+ size 52428800
MLC32/params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b41d9fc0ec54bbcc8684e7e89b1ba3c90892a915e0f3328cbb78c6ec4e0c43a
3
+ size 52428800
MLC32/params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:558e7528ba9f294612de4cec28c0bb15367068cf9ccbd49519f0ffddb41279ae
3
+ size 39321600
MLC32/params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c4b1af151d13719784111a5beb91301fef4a6b073cab218721827397a81c3f5
3
+ size 26327040
MLC32/params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c7abc2571b4105ee0fa81b35550b356f226c194ec8cc27825b33c42851318258
3
+ size 52428800
MLC32/params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3beb9e73f09afd50f69d34d8917806824ecc73cdbcb115e11a2e34e932ffb9cb
3
+ size 52428800
MLC32/params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec4d9daa8c27b6e311b45c52569ceb086db9f84a508f29eee7e8f74eba21d500
3
+ size 39321600
MLC32/params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c10dd61f7d12532c4159436b8276817a6493181c49d30fa67a74d4b145220ff1
3
+ size 52428800
MLC32/params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:594fc2bea09c493d601eb4c17b377f360163ea6e490999a7ee98d94b991213bf
3
+ size 52428800
MLC32/params_shard_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07d610fcef6955ed55a85103909738804171addd5bf34a9a7c66b571bb4b7a3a
3
+ size 52428800
MLC32/params_shard_22.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a2c68bf420d558bb51b88d76de347857a8725f7f4ef15ec4cfec0cd93933032
3
+ size 39321600
MLC32/params_shard_23.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7bb2309c6081bd24ed9ed3bad0c91b4ea342ab65d8663a2be9953c5887f31b0d
3
+ size 26327040
MLC32/params_shard_24.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3b0db17945e48d21e560f6aee7b4c69974831f4f8ae33e4cf220185d7fdb124a
3
+ size 52428800
MLC32/params_shard_25.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f14fede593f30000323a284d3f10cb5c51df8fd341435c5fd1035b3f6a46c09
3
+ size 52428800
MLC32/params_shard_26.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f46140cbece76b4cb6145f724409a1395218db99e69ce988ba21b37552ce85c9
3
+ size 39321600
MLC32/params_shard_27.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ba41b73dd3d1744371834222cdd684ca422acc9264be41d7d4ff1689e5cbe6f
3
+ size 52428800
MLC32/params_shard_28.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:84755b852bcbc8fdc3688442ef9f037fd0dc3509af29d90d07d2e77612f3ccd6
3
+ size 52428800
MLC32/params_shard_29.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74cf80a7f7f83c1010ed4950cb17ac82b14a55d729abf427c5e2e229420922d5
3
+ size 39321600
MLC32/params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35fecfee7949f48ad3b4d44f72e9f20ba0fc514ad520fe405026a694973f415a
3
+ size 52428800
MLC32/params_shard_30.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a5c6968189dbfcab92ec00c9a8733b426e978a9fe2d203845b77b80d34c5242
3
+ size 26327040
MLC32/params_shard_31.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9745775d710b439e957111038a6361f919ad121f6243e5cf4f2458061787dca8
3
+ size 52428800
MLC32/params_shard_32.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6697e8da4f413a558b9d4f54da6d513c1f6b4b8bc38a4624a722a716da87c3a6
3
+ size 52428800
MLC32/params_shard_33.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00c53f495ecd99f04e6782e3a16aa65c04fa38b053b112ebf6e1909d98a7243b
3
+ size 39321600
MLC32/params_shard_34.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1aeda857baca9608f206871dfa58d848ca8a3b7b04f5b5061f139f565c1f559b
3
+ size 52428800
MLC32/params_shard_35.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:395a2a3631492821b18c376a30e3081c6361a136dc5e75d66c4caf917c1ce31d
3
+ size 52428800
MLC32/params_shard_36.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9acc5e77352359d45091ed1e63ae267d996180c59c19aeeaea4f824797abe180
3
+ size 39321600