Distilledoreo committed on
Commit
f3e5490
·
verified ·
1 Parent(s): e216e37

Upload GLM-OCR MLC model pack (json+bin shards)

Browse files
GLM-OCR-q4f16_1-MLC/mlc-chat-config.json ADDED
@@ -0,0 +1,152 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "glm_ocr",
4
+ "quantization": "q4f16_1",
5
+ "model_config": {
6
+ "model_type": "glm_ocr",
7
+ "text_config": {
8
+ "model_type": "glm_ocr_text",
9
+ "pad_token_id": 59246,
10
+ "vocab_size": 59392,
11
+ "eos_token_id": [
12
+ 59246,
13
+ 59253
14
+ ],
15
+ "attention_bias": false,
16
+ "attention_dropout": 0.0,
17
+ "head_dim": 128,
18
+ "hidden_act": "silu",
19
+ "hidden_size": 1536,
20
+ "initializer_range": 0.02,
21
+ "intermediate_size": 4608,
22
+ "max_position_embeddings": 131072,
23
+ "num_attention_heads": 16,
24
+ "num_hidden_layers": 16,
25
+ "num_nextn_predict_layers": 1,
26
+ "num_key_value_heads": 8,
27
+ "rms_norm_eps": 1e-05,
28
+ "dtype": "bfloat16",
29
+ "rope_parameters": {
30
+ "rope_type": "default",
31
+ "mrope_section": [
32
+ 16,
33
+ 24,
34
+ 24
35
+ ],
36
+ "partial_rotary_factor": 1.0,
37
+ "rope_theta": 10000
38
+ },
39
+ "tie_word_embeddings": false,
40
+ "use_cache": true
41
+ },
42
+ "vision_config": {
43
+ "model_type": "glm_ocr_vision",
44
+ "hidden_size": 1024,
45
+ "depth": 24,
46
+ "num_heads": 16,
47
+ "attention_bias": true,
48
+ "intermediate_size": 4096,
49
+ "hidden_act": "silu",
50
+ "hidden_dropout_prob": 0.0,
51
+ "initializer_range": 0.02,
52
+ "image_size": 336,
53
+ "patch_size": 14,
54
+ "out_hidden_size": 1536,
55
+ "rms_norm_eps": 1e-05,
56
+ "spatial_merge_size": 2,
57
+ "temporal_patch_size": 2
58
+ },
59
+ "image_start_token_id": 59256,
60
+ "image_end_token_id": 59257,
61
+ "image_token_id": 59280,
62
+ "video_start_token_id": 59258,
63
+ "video_end_token_id": 59259,
64
+ "video_token_id": 59281,
65
+ "tie_word_embeddings": false,
66
+ "vocab_size": 59392,
67
+ "hidden_size": 1536,
68
+ "intermediate_size": 4608,
69
+ "num_attention_heads": 16,
70
+ "num_hidden_layers": 16,
71
+ "num_key_value_heads": 8,
72
+ "rms_norm_eps": 1e-05,
73
+ "rope_theta": 10000,
74
+ "context_window_size": 131072,
75
+ "prefill_chunk_size": 8192,
76
+ "tensor_parallel_shards": 1,
77
+ "head_dim": 128,
78
+ "dtype": "float32",
79
+ "max_batch_size": 128,
80
+ "vision_hidden_size": 1024,
81
+ "vision_intermediate_size": 4096,
82
+ "vision_num_hidden_layers": 24,
83
+ "vision_num_attention_heads": 16,
84
+ "vision_out_hidden_size": 1536,
85
+ "vision_patch_size": 14,
86
+ "vision_temporal_patch_size": 2,
87
+ "vision_spatial_merge_size": 2,
88
+ "vision_rms_norm_eps": 1e-05,
89
+ "vision_hidden_act": "silu",
90
+ "vision_attention_bias": true
91
+ },
92
+ "vocab_size": 59392,
93
+ "context_window_size": 131072,
94
+ "sliding_window_size": -1,
95
+ "prefill_chunk_size": 8192,
96
+ "attention_sink_size": -1,
97
+ "tensor_parallel_shards": 1,
98
+ "pipeline_parallel_stages": 1,
99
+ "active_vocab_size": 59282,
100
+ "temperature": 1.0,
101
+ "presence_penalty": 0.0,
102
+ "frequency_penalty": 0.0,
103
+ "repetition_penalty": 1.0,
104
+ "top_p": 1.0,
105
+ "tokenizer_files": [
106
+ "tokenizer.json",
107
+ "tokenizer_config.json"
108
+ ],
109
+ "tokenizer_info": {
110
+ "token_postproc_method": "byte_level",
111
+ "prepend_space_in_encode": false,
112
+ "strip_space_in_decode": false
113
+ },
114
+ "conv_template": {
115
+ "name": "glm_ocr",
116
+ "system_template": "{system_message}",
117
+ "system_message": "",
118
+ "system_prefix_token_ids": null,
119
+ "add_role_after_system_message": true,
120
+ "roles": {
121
+ "user": "<|user|>",
122
+ "assistant": "<|assistant|>",
123
+ "tool": "<|observation|>"
124
+ },
125
+ "role_templates": {
126
+ "user": "{user_message}",
127
+ "assistant": "{assistant_message}",
128
+ "tool": "{tool_message}"
129
+ },
130
+ "messages": [],
131
+ "seps": [
132
+ "\n"
133
+ ],
134
+ "role_content_sep": "\n",
135
+ "role_empty_sep": "\n",
136
+ "stop_str": [
137
+ "<|endoftext|>"
138
+ ],
139
+ "stop_token_ids": [
140
+ 59246,
141
+ 59253
142
+ ],
143
+ "function_string": "",
144
+ "use_function_calling": false
145
+ },
146
+ "pad_token_id": 59246,
147
+ "bos_token_id": 1,
148
+ "eos_token_id": [
149
+ 59246,
150
+ 59253
151
+ ]
152
+ }
GLM-OCR-q4f16_1-MLC/params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a0ef96799ee581a1f0246af23b76c67188ceb74c9e9b59258e61ea0605d125f
3
+ size 45613056
GLM-OCR-q4f16_1-MLC/params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c88ecb6479a96914920fb2ca267777ef2f1a805017ec629de78c212db0b40d1
3
+ size 45613056
GLM-OCR-q4f16_1-MLC/params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:138f1e8206e551ffc384b2938e75b5911b8354100a0590a6f5a2bba98c663cd4
3
+ size 33444864
GLM-OCR-q4f16_1-MLC/params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1c1bbac106ecde99afa61652be505a9b005aaa8d6b287e514c260ca636b48f70
3
+ size 31858688
GLM-OCR-q4f16_1-MLC/params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2663869b30d044826d7c0f46e13d6138f54ebaebd1eb042d300b3a51c3274df2
3
+ size 33139456
GLM-OCR-q4f16_1-MLC/params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71f15207fca50387de699a003563131dae1e78db2d390d8f680ad8d8370cef9d
3
+ size 33137664
GLM-OCR-q4f16_1-MLC/params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e973cef3720314e708244bb17ca4d9f5eca93858f33866ff6cf476c8f42e33c0
3
+ size 33139456
GLM-OCR-q4f16_1-MLC/params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a5a435bbbfd9d95ffced2882bb48513815a5e0a6bf4b053d0afbeefb1608e9a
3
+ size 33137664
GLM-OCR-q4f16_1-MLC/params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91046021e8932b549fcae430299bebe99ee7376c1b662e83c1293c7f4d6fd69b
3
+ size 33139456
GLM-OCR-q4f16_1-MLC/params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43af9cc2af5d97972947f9d21d37e336b17ac2e9705855225b998ea4e99144b0
3
+ size 30770944
GLM-OCR-q4f16_1-MLC/params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fd1f13a6d73350b3cd732730c807d0eb35f0b0cc3f4a1c1571a331ff07298f3
3
+ size 26546176
GLM-OCR-q4f16_1-MLC/params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec0ef8367e91cb5f66b6c2a4c1036ad42aa935ce8f25c4c4dc9415f9c2c5ac7b
3
+ size 32652288
GLM-OCR-q4f16_1-MLC/params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8bec185ba26f4b3e306bc38e37c492d9a44518845f2dca68ea683851a6f534c
3
+ size 30547968
GLM-OCR-q4f16_1-MLC/params_shard_4.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1e1ce13f99ba9dbfbf648d8a4b63a6cd06d7f8c7bc0c27587fc52c3c3b85e52
3
+ size 33444864
GLM-OCR-q4f16_1-MLC/params_shard_5.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25059825bed8f69e4d5449a2564ef33cd4a1f91a4e621c8e6ec90248ed770284
3
+ size 32956416
GLM-OCR-q4f16_1-MLC/params_shard_6.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:080469492dc87b91cb43c8ede3128b2ba4be7b0e27221fc45270f236764a8e49
3
+ size 32759808
GLM-OCR-q4f16_1-MLC/params_shard_7.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8bc16060280e7430a8478c11be25d2624f446df120e9cab576017c57d41fa16
3
+ size 32750592
GLM-OCR-q4f16_1-MLC/params_shard_8.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53cba8cb26800d90588449fd29cb168730120223fb23210e9fa71fdd06cefe8d
3
+ size 27451392
GLM-OCR-q4f16_1-MLC/params_shard_9.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0840a5c09f75a11978c819529c30771eb7f988d5fe55c27d0bc50b848ecea663
3
+ size 30547968
GLM-OCR-q4f16_1-MLC/tensor-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
GLM-OCR-q4f16_1-MLC/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
GLM-OCR-q4f16_1-MLC/tokenizer_config.json ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "backend": "tokenizers",
3
+ "clean_up_tokenization_spaces": false,
4
+ "eos_token": "<|endoftext|>",
5
+ "extra_special_tokens": [
6
+ "<|endoftext|>",
7
+ "[MASK]",
8
+ "[gMASK]",
9
+ "[sMASK]",
10
+ "<sop>",
11
+ "<eop>",
12
+ "<|system|>",
13
+ "<|user|>",
14
+ "<|assistant|>",
15
+ "<|observation|>",
16
+ "<|begin_of_image|>",
17
+ "<|end_of_image|>",
18
+ "<|begin_of_video|>",
19
+ "<|end_of_video|>",
20
+ "<|begin_of_audio|>",
21
+ "<|end_of_audio|>",
22
+ "<|begin_of_transcription|>",
23
+ "<|end_of_transcription|>",
24
+ "<|code_prefix|>",
25
+ "<|code_middle|>",
26
+ "<|code_suffix|>",
27
+ "<think>",
28
+ "</think>",
29
+ "<tool_call>",
30
+ "</tool_call>",
31
+ "<tool_response>",
32
+ "</tool_response>",
33
+ "<arg_key>",
34
+ "</arg_key>",
35
+ "<arg_value>",
36
+ "</arg_value>",
37
+ "/nothink",
38
+ "<|begin_of_box|>",
39
+ "<|end_of_box|>",
40
+ "<|image|>",
41
+ "<|video|>"
42
+ ],
43
+ "is_local": true,
44
+ "model_max_length": 655380,
45
+ "pad_token": "<|endoftext|>",
46
+ "padding_side": "left",
47
+ "processor_class": "Glm46VProcessor",
48
+ "tokenizer_class": "TokenizersBackend"
49
+ }