Upload GLM-OCR MLC model pack (json+bin shards)
Browse files
- GLM-OCR-q4f16_1-MLC/mlc-chat-config.json +152 -0
- GLM-OCR-q4f16_1-MLC/params_shard_0.bin +3 -0
- GLM-OCR-q4f16_1-MLC/params_shard_1.bin +3 -0
- GLM-OCR-q4f16_1-MLC/params_shard_10.bin +3 -0
- GLM-OCR-q4f16_1-MLC/params_shard_11.bin +3 -0
- GLM-OCR-q4f16_1-MLC/params_shard_12.bin +3 -0
- GLM-OCR-q4f16_1-MLC/params_shard_13.bin +3 -0
- GLM-OCR-q4f16_1-MLC/params_shard_14.bin +3 -0
- GLM-OCR-q4f16_1-MLC/params_shard_15.bin +3 -0
- GLM-OCR-q4f16_1-MLC/params_shard_16.bin +3 -0
- GLM-OCR-q4f16_1-MLC/params_shard_17.bin +3 -0
- GLM-OCR-q4f16_1-MLC/params_shard_18.bin +3 -0
- GLM-OCR-q4f16_1-MLC/params_shard_2.bin +3 -0
- GLM-OCR-q4f16_1-MLC/params_shard_3.bin +3 -0
- GLM-OCR-q4f16_1-MLC/params_shard_4.bin +3 -0
- GLM-OCR-q4f16_1-MLC/params_shard_5.bin +3 -0
- GLM-OCR-q4f16_1-MLC/params_shard_6.bin +3 -0
- GLM-OCR-q4f16_1-MLC/params_shard_7.bin +3 -0
- GLM-OCR-q4f16_1-MLC/params_shard_8.bin +3 -0
- GLM-OCR-q4f16_1-MLC/params_shard_9.bin +3 -0
- GLM-OCR-q4f16_1-MLC/tensor-cache.json +0 -0
- GLM-OCR-q4f16_1-MLC/tokenizer.json +0 -0
- GLM-OCR-q4f16_1-MLC/tokenizer_config.json +49 -0
GLM-OCR-q4f16_1-MLC/mlc-chat-config.json
ADDED
|
@@ -0,0 +1,152 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"version": "0.1.0",
|
| 3 |
+
"model_type": "glm_ocr",
|
| 4 |
+
"quantization": "q4f16_1",
|
| 5 |
+
"model_config": {
|
| 6 |
+
"model_type": "glm_ocr",
|
| 7 |
+
"text_config": {
|
| 8 |
+
"model_type": "glm_ocr_text",
|
| 9 |
+
"pad_token_id": 59246,
|
| 10 |
+
"vocab_size": 59392,
|
| 11 |
+
"eos_token_id": [
|
| 12 |
+
59246,
|
| 13 |
+
59253
|
| 14 |
+
],
|
| 15 |
+
"attention_bias": false,
|
| 16 |
+
"attention_dropout": 0.0,
|
| 17 |
+
"head_dim": 128,
|
| 18 |
+
"hidden_act": "silu",
|
| 19 |
+
"hidden_size": 1536,
|
| 20 |
+
"initializer_range": 0.02,
|
| 21 |
+
"intermediate_size": 4608,
|
| 22 |
+
"max_position_embeddings": 131072,
|
| 23 |
+
"num_attention_heads": 16,
|
| 24 |
+
"num_hidden_layers": 16,
|
| 25 |
+
"num_nextn_predict_layers": 1,
|
| 26 |
+
"num_key_value_heads": 8,
|
| 27 |
+
"rms_norm_eps": 1e-05,
|
| 28 |
+
"dtype": "bfloat16",
|
| 29 |
+
"rope_parameters": {
|
| 30 |
+
"rope_type": "default",
|
| 31 |
+
"mrope_section": [
|
| 32 |
+
16,
|
| 33 |
+
24,
|
| 34 |
+
24
|
| 35 |
+
],
|
| 36 |
+
"partial_rotary_factor": 1.0,
|
| 37 |
+
"rope_theta": 10000
|
| 38 |
+
},
|
| 39 |
+
"tie_word_embeddings": false,
|
| 40 |
+
"use_cache": true
|
| 41 |
+
},
|
| 42 |
+
"vision_config": {
|
| 43 |
+
"model_type": "glm_ocr_vision",
|
| 44 |
+
"hidden_size": 1024,
|
| 45 |
+
"depth": 24,
|
| 46 |
+
"num_heads": 16,
|
| 47 |
+
"attention_bias": true,
|
| 48 |
+
"intermediate_size": 4096,
|
| 49 |
+
"hidden_act": "silu",
|
| 50 |
+
"hidden_dropout_prob": 0.0,
|
| 51 |
+
"initializer_range": 0.02,
|
| 52 |
+
"image_size": 336,
|
| 53 |
+
"patch_size": 14,
|
| 54 |
+
"out_hidden_size": 1536,
|
| 55 |
+
"rms_norm_eps": 1e-05,
|
| 56 |
+
"spatial_merge_size": 2,
|
| 57 |
+
"temporal_patch_size": 2
|
| 58 |
+
},
|
| 59 |
+
"image_start_token_id": 59256,
|
| 60 |
+
"image_end_token_id": 59257,
|
| 61 |
+
"image_token_id": 59280,
|
| 62 |
+
"video_start_token_id": 59258,
|
| 63 |
+
"video_end_token_id": 59259,
|
| 64 |
+
"video_token_id": 59281,
|
| 65 |
+
"tie_word_embeddings": false,
|
| 66 |
+
"vocab_size": 59392,
|
| 67 |
+
"hidden_size": 1536,
|
| 68 |
+
"intermediate_size": 4608,
|
| 69 |
+
"num_attention_heads": 16,
|
| 70 |
+
"num_hidden_layers": 16,
|
| 71 |
+
"num_key_value_heads": 8,
|
| 72 |
+
"rms_norm_eps": 1e-05,
|
| 73 |
+
"rope_theta": 10000,
|
| 74 |
+
"context_window_size": 131072,
|
| 75 |
+
"prefill_chunk_size": 8192,
|
| 76 |
+
"tensor_parallel_shards": 1,
|
| 77 |
+
"head_dim": 128,
|
| 78 |
+
"dtype": "float32",
|
| 79 |
+
"max_batch_size": 128,
|
| 80 |
+
"vision_hidden_size": 1024,
|
| 81 |
+
"vision_intermediate_size": 4096,
|
| 82 |
+
"vision_num_hidden_layers": 24,
|
| 83 |
+
"vision_num_attention_heads": 16,
|
| 84 |
+
"vision_out_hidden_size": 1536,
|
| 85 |
+
"vision_patch_size": 14,
|
| 86 |
+
"vision_temporal_patch_size": 2,
|
| 87 |
+
"vision_spatial_merge_size": 2,
|
| 88 |
+
"vision_rms_norm_eps": 1e-05,
|
| 89 |
+
"vision_hidden_act": "silu",
|
| 90 |
+
"vision_attention_bias": true
|
| 91 |
+
},
|
| 92 |
+
"vocab_size": 59392,
|
| 93 |
+
"context_window_size": 131072,
|
| 94 |
+
"sliding_window_size": -1,
|
| 95 |
+
"prefill_chunk_size": 8192,
|
| 96 |
+
"attention_sink_size": -1,
|
| 97 |
+
"tensor_parallel_shards": 1,
|
| 98 |
+
"pipeline_parallel_stages": 1,
|
| 99 |
+
"active_vocab_size": 59282,
|
| 100 |
+
"temperature": 1.0,
|
| 101 |
+
"presence_penalty": 0.0,
|
| 102 |
+
"frequency_penalty": 0.0,
|
| 103 |
+
"repetition_penalty": 1.0,
|
| 104 |
+
"top_p": 1.0,
|
| 105 |
+
"tokenizer_files": [
|
| 106 |
+
"tokenizer.json",
|
| 107 |
+
"tokenizer_config.json"
|
| 108 |
+
],
|
| 109 |
+
"tokenizer_info": {
|
| 110 |
+
"token_postproc_method": "byte_level",
|
| 111 |
+
"prepend_space_in_encode": false,
|
| 112 |
+
"strip_space_in_decode": false
|
| 113 |
+
},
|
| 114 |
+
"conv_template": {
|
| 115 |
+
"name": "glm_ocr",
|
| 116 |
+
"system_template": "{system_message}",
|
| 117 |
+
"system_message": "",
|
| 118 |
+
"system_prefix_token_ids": null,
|
| 119 |
+
"add_role_after_system_message": true,
|
| 120 |
+
"roles": {
|
| 121 |
+
"user": "<|user|>",
|
| 122 |
+
"assistant": "<|assistant|>",
|
| 123 |
+
"tool": "<|observation|>"
|
| 124 |
+
},
|
| 125 |
+
"role_templates": {
|
| 126 |
+
"user": "{user_message}",
|
| 127 |
+
"assistant": "{assistant_message}",
|
| 128 |
+
"tool": "{tool_message}"
|
| 129 |
+
},
|
| 130 |
+
"messages": [],
|
| 131 |
+
"seps": [
|
| 132 |
+
"\n"
|
| 133 |
+
],
|
| 134 |
+
"role_content_sep": "\n",
|
| 135 |
+
"role_empty_sep": "\n",
|
| 136 |
+
"stop_str": [
|
| 137 |
+
"<|endoftext|>"
|
| 138 |
+
],
|
| 139 |
+
"stop_token_ids": [
|
| 140 |
+
59246,
|
| 141 |
+
59253
|
| 142 |
+
],
|
| 143 |
+
"function_string": "",
|
| 144 |
+
"use_function_calling": false
|
| 145 |
+
},
|
| 146 |
+
"pad_token_id": 59246,
|
| 147 |
+
"bos_token_id": 1,
|
| 148 |
+
"eos_token_id": [
|
| 149 |
+
59246,
|
| 150 |
+
59253
|
| 151 |
+
]
|
| 152 |
+
}
|
GLM-OCR-q4f16_1-MLC/params_shard_0.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a0ef96799ee581a1f0246af23b76c67188ceb74c9e9b59258e61ea0605d125f
|
| 3 |
+
size 45613056
|
GLM-OCR-q4f16_1-MLC/params_shard_1.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1c88ecb6479a96914920fb2ca267777ef2f1a805017ec629de78c212db0b40d1
|
| 3 |
+
size 45613056
|
GLM-OCR-q4f16_1-MLC/params_shard_10.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:138f1e8206e551ffc384b2938e75b5911b8354100a0590a6f5a2bba98c663cd4
|
| 3 |
+
size 33444864
|
GLM-OCR-q4f16_1-MLC/params_shard_11.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1c1bbac106ecde99afa61652be505a9b005aaa8d6b287e514c260ca636b48f70
|
| 3 |
+
size 31858688
|
GLM-OCR-q4f16_1-MLC/params_shard_12.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2663869b30d044826d7c0f46e13d6138f54ebaebd1eb042d300b3a51c3274df2
|
| 3 |
+
size 33139456
|
GLM-OCR-q4f16_1-MLC/params_shard_13.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:71f15207fca50387de699a003563131dae1e78db2d390d8f680ad8d8370cef9d
|
| 3 |
+
size 33137664
|
GLM-OCR-q4f16_1-MLC/params_shard_14.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e973cef3720314e708244bb17ca4d9f5eca93858f33866ff6cf476c8f42e33c0
|
| 3 |
+
size 33139456
|
GLM-OCR-q4f16_1-MLC/params_shard_15.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8a5a435bbbfd9d95ffced2882bb48513815a5e0a6bf4b053d0afbeefb1608e9a
|
| 3 |
+
size 33137664
|
GLM-OCR-q4f16_1-MLC/params_shard_16.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:91046021e8932b549fcae430299bebe99ee7376c1b662e83c1293c7f4d6fd69b
|
| 3 |
+
size 33139456
|
GLM-OCR-q4f16_1-MLC/params_shard_17.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:43af9cc2af5d97972947f9d21d37e336b17ac2e9705855225b998ea4e99144b0
|
| 3 |
+
size 30770944
|
GLM-OCR-q4f16_1-MLC/params_shard_18.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8fd1f13a6d73350b3cd732730c807d0eb35f0b0cc3f4a1c1571a331ff07298f3
|
| 3 |
+
size 26546176
|
GLM-OCR-q4f16_1-MLC/params_shard_2.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ec0ef8367e91cb5f66b6c2a4c1036ad42aa935ce8f25c4c4dc9415f9c2c5ac7b
|
| 3 |
+
size 32652288
|
GLM-OCR-q4f16_1-MLC/params_shard_3.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a8bec185ba26f4b3e306bc38e37c492d9a44518845f2dca68ea683851a6f534c
|
| 3 |
+
size 30547968
|
GLM-OCR-q4f16_1-MLC/params_shard_4.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e1e1ce13f99ba9dbfbf648d8a4b63a6cd06d7f8c7bc0c27587fc52c3c3b85e52
|
| 3 |
+
size 33444864
|
GLM-OCR-q4f16_1-MLC/params_shard_5.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:25059825bed8f69e4d5449a2564ef33cd4a1f91a4e621c8e6ec90248ed770284
|
| 3 |
+
size 32956416
|
GLM-OCR-q4f16_1-MLC/params_shard_6.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:080469492dc87b91cb43c8ede3128b2ba4be7b0e27221fc45270f236764a8e49
|
| 3 |
+
size 32759808
|
GLM-OCR-q4f16_1-MLC/params_shard_7.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d8bc16060280e7430a8478c11be25d2624f446df120e9cab576017c57d41fa16
|
| 3 |
+
size 32750592
|
GLM-OCR-q4f16_1-MLC/params_shard_8.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:53cba8cb26800d90588449fd29cb168730120223fb23210e9fa71fdd06cefe8d
|
| 3 |
+
size 27451392
|
GLM-OCR-q4f16_1-MLC/params_shard_9.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0840a5c09f75a11978c819529c30771eb7f988d5fe55c27d0bc50b848ecea663
|
| 3 |
+
size 30547968
|
GLM-OCR-q4f16_1-MLC/tensor-cache.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
GLM-OCR-q4f16_1-MLC/tokenizer.json
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
GLM-OCR-q4f16_1-MLC/tokenizer_config.json
ADDED
|
@@ -0,0 +1,49 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"backend": "tokenizers",
|
| 3 |
+
"clean_up_tokenization_spaces": false,
|
| 4 |
+
"eos_token": "<|endoftext|>",
|
| 5 |
+
"extra_special_tokens": [
|
| 6 |
+
"<|endoftext|>",
|
| 7 |
+
"[MASK]",
|
| 8 |
+
"[gMASK]",
|
| 9 |
+
"[sMASK]",
|
| 10 |
+
"<sop>",
|
| 11 |
+
"<eop>",
|
| 12 |
+
"<|system|>",
|
| 13 |
+
"<|user|>",
|
| 14 |
+
"<|assistant|>",
|
| 15 |
+
"<|observation|>",
|
| 16 |
+
"<|begin_of_image|>",
|
| 17 |
+
"<|end_of_image|>",
|
| 18 |
+
"<|begin_of_video|>",
|
| 19 |
+
"<|end_of_video|>",
|
| 20 |
+
"<|begin_of_audio|>",
|
| 21 |
+
"<|end_of_audio|>",
|
| 22 |
+
"<|begin_of_transcription|>",
|
| 23 |
+
"<|end_of_transcription|>",
|
| 24 |
+
"<|code_prefix|>",
|
| 25 |
+
"<|code_middle|>",
|
| 26 |
+
"<|code_suffix|>",
|
| 27 |
+
"<think>",
|
| 28 |
+
"</think>",
|
| 29 |
+
"<tool_call>",
|
| 30 |
+
"</tool_call>",
|
| 31 |
+
"<tool_response>",
|
| 32 |
+
"</tool_response>",
|
| 33 |
+
"<arg_key>",
|
| 34 |
+
"</arg_key>",
|
| 35 |
+
"<arg_value>",
|
| 36 |
+
"</arg_value>",
|
| 37 |
+
"/nothink",
|
| 38 |
+
"<|begin_of_box|>",
|
| 39 |
+
"<|end_of_box|>",
|
| 40 |
+
"<|image|>",
|
| 41 |
+
"<|video|>"
|
| 42 |
+
],
|
| 43 |
+
"is_local": true,
|
| 44 |
+
"model_max_length": 655380,
|
| 45 |
+
"pad_token": "<|endoftext|>",
|
| 46 |
+
"padding_side": "left",
|
| 47 |
+
"processor_class": "Glm46VProcessor",
|
| 48 |
+
"tokenizer_class": "TokenizersBackend"
|
| 49 |
+
}
|