diff --git a/.gitattributes b/.gitattributes index 9aaf029aa8349fd3e7185f81e8f93607f17a0f6e..76252070b5b8a1785cf279eddf665a79477bcd06 100644 --- a/.gitattributes +++ b/.gitattributes @@ -56,3 +56,4 @@ llm/GGUF/unsloth/Qwen3-VL-8B-Instruct-GGUF/mmproj-F16.gguf filter=lfs diff=lfs m llm/GGUF/unsloth/Qwen3-VL-8B-Instruct-GGUF/Qwen3-VL-8B-Instruct-UD-Q4_K_XL.gguf filter=lfs diff=lfs merge=lfs -text unet/flux2_dev_Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text TTS/ACE-Step-v1-3.5B/umt5-base/tokenizer.json filter=lfs diff=lfs merge=lfs -text +glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/processor/tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/model_index.json b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/model_index.json new file mode 100644 index 0000000000000000000000000000000000000000..8db189758a4cb6251ac1d36beb98e4b5a58f2921 --- /dev/null +++ b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/model_index.json @@ -0,0 +1,33 @@ +{ + "_class_name": "GlmImagePipeline", + "_diffusers_version": "0.37.0.dev0", + "_name_or_path": "zai-org/GLM-Image", + "processor": [ + "glm_image", + "GlmImageProcessor" + ], + "scheduler": [ + "diffusers", + "FlowMatchEulerDiscreteScheduler" + ], + "text_encoder": [ + "transformers", + "T5EncoderModel" + ], + "tokenizer": [ + "transformers", + "ByT5Tokenizer" + ], + "transformer": [ + "diffusers", + "GlmImageTransformer2DModel" + ], + "vae": [ + "diffusers", + "AutoencoderKL" + ], + "vision_language_encoder": [ + "glm_image", + "GlmImageForConditionalGeneration" + ] +} diff --git a/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/processor/chat_template.jinja b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/processor/chat_template.jinja new file mode 100644 index 0000000000000000000000000000000000000000..637cd237529e862e7db5eaec7e590290178da177 --- /dev/null +++ b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/processor/chat_template.jinja @@ -0,0 +1,13 @@ +{%- for m in messages -%} + {%- if m.content is string -%} + {{ m.content }} + {%- else -%} + {%- for item in m.content -%} + {%- if item.type == 'image' or item.get('image') is not none -%} + <|dit_token_16384|><|image|><|dit_token_16385|> + {%- elif item.type == 'text' -%} + {{ item.text }} + {%- endif -%} + {%- endfor -%} + {%- endif -%} +{%- endfor -%} \ No newline at end of file diff --git a/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/processor/processor_config.json b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/processor/processor_config.json new file mode 100644 index 0000000000000000000000000000000000000000..61a637d9aecc3079542ec2a0ac13011f483204df --- /dev/null +++ b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/processor/processor_config.json @@ -0,0 +1,31 @@ +{ + "image_processor": { + "do_convert_rgb": true, + "do_normalize": true, + "do_rescale": true, + "do_resize": true, + "image_mean": [ + 0.5, + 0.5, + 0.5 + ], + "image_processor_type": "GlmImageImageProcessor", + "image_std": [ + 0.5, + 0.5, + 0.5 + ], + "max_pixels": 4194304, + "merge_size": 1, + "min_pixels": 262144, + "patch_size": 16, + "resample": 3, + "rescale_factor": 0.00392156862745098, + "size": { + "longest_edge": 4194304, + "shortest_edge": 262144 + }, + "temporal_patch_size": 1 + }, + "processor_class": "GlmImageProcessor" +} diff --git a/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/processor/tokenizer.json b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/processor/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..a1a1273a9c1ba778f16df8d78ad82675c65911b8 --- /dev/null +++ b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/processor/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d771c9659fd2c65c0ef8a8daf9d9f9f07b53f89ce164cc832a28137db604d01d +size 23765636 diff --git a/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/processor/tokenizer_config.json b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/processor/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..3fe7f3564eeb6e51c9301b0c72649d622ec90f39 --- /dev/null +++ b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/processor/tokenizer_config.json @@ -0,0 +1,44 @@ +{ + "backend": "tokenizers", + "bos_token": "<|dit_token_16384|>", + "clean_up_tokenization_spaces": false, + "do_lower_case": false, + "eos_token": "<|dit_token_16385|>", + "extra_special_tokens": [ + "<|endoftext|>", + "[MASK]", + "[gMASK]", + "[sMASK]", + "", + "", + "<|system|>", + "<|user|>", + "<|assistant|>", + "<|observation|>", + "<|begin_of_image|>", + "<|end_of_image|>", + "<|begin_of_video|>", + "<|end_of_video|>", + "<|image|>", + "<|video|>" + ], + "grid_bos_token": "", + "grid_eos_token": "", + "image_token": "<|image|>", + "is_local": true, + "model_input_names": [ + "input_ids", + "attention_mask" + ], + "model_max_length": 65536, + "model_specific_special_tokens": { + "grid_bos_token": "", + "grid_eos_token": "", + "image_token": "<|image|>" + }, + "pad_token": "<|dit_token_16385|>", + "padding_side": "left", + "processor_class": "GlmImageProcessor", + "remove_space": false, + "tokenizer_class": "TokenizersBackend" +} diff --git a/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/scheduler/scheduler_config.json b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/scheduler/scheduler_config.json new file mode 100644 index 0000000000000000000000000000000000000000..b7051e28f47b16720b38ef9f2cb58cb090b8516a --- /dev/null +++ b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/scheduler/scheduler_config.json @@ -0,0 +1,18 @@ +{ + "_class_name": "FlowMatchEulerDiscreteScheduler", + "_diffusers_version": "0.37.0.dev0", + "base_image_seq_len": 256, + "base_shift": 0.25, + "invert_sigmas": false, + "max_image_seq_len": 4096, + "max_shift": 0.75, + "num_train_timesteps": 1000, + "shift": 1.0, + "shift_terminal": null, + "stochastic_sampling": false, + "time_shift_type": "linear", + "use_beta_sigmas": false, + "use_dynamic_shifting": true, + "use_exponential_sigmas": false, + "use_karras_sigmas": false +} diff --git a/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/text_encoder/config.json b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/text_encoder/config.json new file mode 100644 index 0000000000000000000000000000000000000000..153318487ae57ede910edeaaca3a84ec5485442c --- /dev/null +++ b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/text_encoder/config.json @@ -0,0 +1,32 @@ +{ + "architectures": [ + "T5EncoderModel" + ], + "classifier_dropout": 0.0, + "d_ff": 3584, + "d_kv": 64, + "d_model": 1472, + "decoder_start_token_id": 0, + "dense_act_fn": "gelu_new", + "dropout_rate": 0.1, + "dtype": "bfloat16", + "eos_token_id": 1, + "feed_forward_proj": "gated-gelu", + "gradient_checkpointing": false, + "initializer_factor": 1.0, + "is_encoder_decoder": false, + "is_gated_act": true, + "layer_norm_epsilon": 1e-06, + "model_type": "t5", + "num_decoder_layers": 4, + "num_heads": 6, + "num_layers": 12, + "pad_token_id": 0, + "relative_attention_max_distance": 128, + "relative_attention_num_buckets": 32, + "scale_decoder_outputs": false, + "tokenizer_class": "ByT5Tokenizer", + "transformers_version": "5.0.0.dev0", + "use_cache": false, + "vocab_size": 384 +} diff --git a/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/text_encoder/model.safetensors b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/text_encoder/model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0cc702d96d93536eafcc67b83fb0f44d82bfbd8e --- /dev/null +++ b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/text_encoder/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bc470014c3782064177d29ca80f9b03da30f0e259f6fa06c256bc5ecdf600d6 +size 561943976 diff --git a/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/tokenizer/added_tokens.json b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/tokenizer/added_tokens.json new file mode 100644 index 0000000000000000000000000000000000000000..93c190b5690dd55aac16723222a9909e2be0faec --- /dev/null +++ b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/tokenizer/added_tokens.json @@ -0,0 +1,127 @@ +{ + "": 259, + "": 359, + "": 360, + "": 361, + "": 362, + "": 363, + "": 364, + "": 365, + "": 366, + "": 367, + "": 368, + "": 269, + "": 369, + "": 370, + "": 371, + "": 372, + "": 373, + "": 374, + "": 375, + "": 376, + "": 377, + "": 378, + "": 270, + "": 379, + "": 380, + "": 381, + "": 382, + "": 383, + "": 271, + "": 272, + "": 273, + "": 274, + "": 275, + "": 276, + "": 277, + "": 278, + "": 260, + "": 279, + "": 280, + "": 281, + "": 282, + "": 283, + "": 284, + "": 285, + "": 286, + "": 287, + "": 288, + "": 261, + "": 289, + "": 290, + "": 291, + "": 292, + "": 293, + "": 294, + "": 295, + "": 296, + "": 297, + "": 298, + "": 262, + "": 299, + "": 300, + "": 301, + "": 302, + "": 303, + "": 304, + "": 305, + "": 306, + "": 307, + "": 308, + "": 263, + "": 309, + "": 310, + "": 311, + "": 312, + "": 313, + "": 314, + "": 315, + "": 316, + "": 317, + "": 318, + "": 264, + "": 319, + "": 320, + "": 321, + "": 322, + "": 323, + "": 324, + "": 325, + "": 326, + "": 327, + "": 328, + "": 265, + "": 329, + "": 330, + "": 331, + "": 332, + "": 333, + "": 334, + "": 335, + "": 336, + "": 337, + "": 338, + "": 266, + "": 339, + "": 340, + "": 341, + "": 342, + "": 343, + "": 344, + "": 345, + "": 346, + "": 347, + "": 348, + "": 267, + "": 349, + "": 350, + "": 351, + "": 352, + "": 353, + "": 354, + "": 355, + "": 356, + "": 357, + "": 358, + "": 268 +} diff --git a/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/tokenizer/tokenizer_config.json b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/tokenizer/tokenizer_config.json new file mode 100644 index 0000000000000000000000000000000000000000..f2a1baf8be1c2fb0578967b194024c0ab61df871 --- /dev/null +++ b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/tokenizer/tokenizer_config.json @@ -0,0 +1,1292 @@ +{ + "added_tokens_decoder": { + "0": { + "content": "", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": true + }, + "1": { + "content": "", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": true + }, + "2": { + "content": "", + "lstrip": false, + "normalized": true, + "rstrip": false, + "single_word": false, + "special": true + }, + "259": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "260": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "261": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "262": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "263": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "264": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "265": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "266": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "267": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "268": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "269": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "270": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "271": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "272": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "273": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "274": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "275": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "276": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "277": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "278": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "279": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "280": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "281": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "282": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "283": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "284": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "285": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "286": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "287": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "288": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "289": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "290": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "291": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "292": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "293": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "294": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "295": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "296": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "297": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "298": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "299": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "300": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "301": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "302": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "303": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "304": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "305": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "306": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "307": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "308": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "309": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "310": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "311": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "312": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "313": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "314": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "315": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "316": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "317": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "318": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "319": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "320": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "321": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "322": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "323": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "324": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "325": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "326": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "327": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "328": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "329": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "330": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "331": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "332": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "333": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "334": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "335": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "336": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "337": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "338": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "339": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "340": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "341": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "342": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "343": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "344": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "345": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "346": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "347": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "348": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "349": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "350": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "351": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "352": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "353": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "354": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "355": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "356": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "357": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "358": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "359": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "360": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "361": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "362": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "363": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "364": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "365": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "366": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "367": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "368": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "369": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "370": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "371": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "372": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "373": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "374": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "375": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "376": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "377": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "378": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "379": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "380": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "381": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "382": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "383": { + "content": "", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + } + }, + "additional_special_tokens": [ + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "" + ], + "backend": "custom", + "clean_up_tokenization_spaces": false, + "eos_token": "", + "extra_ids": 0, + "extra_special_tokens": [ + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "", + "" + ], + "is_local": true, + "model_max_length": 1000000000000000019884624838656, + "model_specific_special_tokens": {}, + "pad_token": "", + "tokenizer_class": "ByT5Tokenizer", + "unk_token": "" +} diff --git a/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/transformer/config.json b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/transformer/config.json new file mode 100644 index 0000000000000000000000000000000000000000..0fe7eafcd1ade4cf7f853604b18fbad3cd1e1c42 --- /dev/null +++ b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/transformer/config.json @@ -0,0 +1,266 @@ +{ + "_class_name": "GlmImageTransformer2DModel", + "_diffusers_version": "0.37.0.dev0", + "_name_or_path": "zai-org/GLM-Image", + "attention_head_dim": 128, + "condition_dim": 256, + "in_channels": 16, + "num_attention_heads": 32, + "num_layers": 30, + "out_channels": 16, + "patch_size": 2, + "prior_vq_quantizer_codebook_size": 16384, + "quantization_config": { + "add_skip_keys": true, + "dequantize_fp32": false, + "dynamic_loss_threshold": 0.01, + "group_size": 0, + "is_integer": true, + "is_training": false, + "modules_dtype_dict": { + "float5_e3m1fn": [ + "transformer_blocks.23.norm1.linear.weight", + "transformer_blocks.24.norm1.linear.weight", + "transformer_blocks.25.norm1.linear.weight" + ], + "int5": [ + "transformer_blocks.0.attn1.to_k.weight", + "transformer_blocks.0.attn1.to_v.weight", + "transformer_blocks.0.ff.net.0.proj.weight", + "transformer_blocks.1.attn1.to_k.weight", + "transformer_blocks.1.attn1.to_q.weight", + "transformer_blocks.1.attn1.to_v.weight", + "transformer_blocks.1.ff.net.0.proj.weight", + "transformer_blocks.10.attn1.to_v.weight", + "transformer_blocks.2.attn1.to_k.weight", + "transformer_blocks.2.attn1.to_q.weight", + "transformer_blocks.2.attn1.to_v.weight", + "transformer_blocks.3.attn1.to_k.weight", + "transformer_blocks.3.attn1.to_q.weight", + "transformer_blocks.3.attn1.to_v.weight", + "transformer_blocks.3.ff.net.0.proj.weight", + "transformer_blocks.4.attn1.to_k.weight", + "transformer_blocks.4.attn1.to_q.weight", + "transformer_blocks.4.attn1.to_v.weight", + "transformer_blocks.5.attn1.to_v.weight", + "transformer_blocks.6.attn1.to_v.weight", + "transformer_blocks.7.attn1.to_v.weight", + "transformer_blocks.8.attn1.to_v.weight", + "transformer_blocks.9.attn1.to_v.weight", + "transformer_blocks.21.norm1.linear.weight", + "transformer_blocks.22.norm1.linear.weight", + "transformer_blocks.25.ff.net.2.weight", + "transformer_blocks.26.attn1.to_v.weight", + "transformer_blocks.26.ff.net.2.weight", + "transformer_blocks.26.norm1.linear.weight", + "transformer_blocks.27.attn1.to_v.weight", + "transformer_blocks.27.norm1.linear.weight", + "transformer_blocks.28.attn1.to_v.weight", + "transformer_blocks.29.attn1.to_v.weight" + ], + "uint4": [ + "transformer_blocks.0.attn1.to_out.0.weight", + "transformer_blocks.0.attn1.to_q.weight", + "transformer_blocks.0.ff.net.2.weight", + "transformer_blocks.1.attn1.to_out.0.weight", + "transformer_blocks.1.ff.net.2.weight", + "transformer_blocks.1.norm1.linear.weight", + "transformer_blocks.10.attn1.to_k.weight", + "transformer_blocks.10.attn1.to_out.0.weight", + "transformer_blocks.10.attn1.to_q.weight", + "transformer_blocks.10.norm1.linear.weight", + "transformer_blocks.2.attn1.to_out.0.weight", + "transformer_blocks.2.ff.net.0.proj.weight", + "transformer_blocks.2.ff.net.2.weight", + "transformer_blocks.2.norm1.linear.weight", + "transformer_blocks.3.attn1.to_out.0.weight", + "transformer_blocks.3.ff.net.2.weight", + "transformer_blocks.3.norm1.linear.weight", + "transformer_blocks.4.attn1.to_out.0.weight", + "transformer_blocks.4.ff.net.0.proj.weight", + "transformer_blocks.4.ff.net.2.weight", + "transformer_blocks.4.norm1.linear.weight", + "transformer_blocks.5.attn1.to_k.weight", + "transformer_blocks.5.attn1.to_out.0.weight", + "transformer_blocks.5.attn1.to_q.weight", + "transformer_blocks.5.ff.net.0.proj.weight", + "transformer_blocks.5.ff.net.2.weight", + "transformer_blocks.5.norm1.linear.weight", + "transformer_blocks.6.attn1.to_k.weight", + "transformer_blocks.6.attn1.to_out.0.weight", + "transformer_blocks.6.attn1.to_q.weight", + "transformer_blocks.6.ff.net.0.proj.weight", + "transformer_blocks.6.ff.net.2.weight", + "transformer_blocks.6.norm1.linear.weight", + "transformer_blocks.7.attn1.to_k.weight", + "transformer_blocks.7.attn1.to_out.0.weight", + "transformer_blocks.7.attn1.to_q.weight", + "transformer_blocks.7.ff.net.0.proj.weight", + "transformer_blocks.7.ff.net.2.weight", + "transformer_blocks.7.norm1.linear.weight", + "transformer_blocks.8.attn1.to_k.weight", + "transformer_blocks.8.attn1.to_out.0.weight", + "transformer_blocks.8.attn1.to_q.weight", + "transformer_blocks.8.ff.net.0.proj.weight", + "transformer_blocks.8.ff.net.2.weight", + "transformer_blocks.8.norm1.linear.weight", + "transformer_blocks.9.attn1.to_k.weight", + "transformer_blocks.9.attn1.to_out.0.weight", + "transformer_blocks.9.attn1.to_q.weight", + "transformer_blocks.9.ff.net.0.proj.weight", + "transformer_blocks.9.ff.net.2.weight", + "transformer_blocks.9.norm1.linear.weight", + "transformer_blocks.10.ff.net.0.proj.weight", + "transformer_blocks.10.ff.net.2.weight", + "transformer_blocks.11.attn1.to_k.weight", + "transformer_blocks.11.attn1.to_out.0.weight", + "transformer_blocks.11.attn1.to_q.weight", + "transformer_blocks.11.attn1.to_v.weight", + "transformer_blocks.11.ff.net.0.proj.weight", + "transformer_blocks.11.ff.net.2.weight", + "transformer_blocks.11.norm1.linear.weight", + "transformer_blocks.12.attn1.to_k.weight", + "transformer_blocks.12.attn1.to_out.0.weight", + "transformer_blocks.12.attn1.to_q.weight", + "transformer_blocks.12.attn1.to_v.weight", + "transformer_blocks.12.ff.net.0.proj.weight", + "transformer_blocks.12.ff.net.2.weight", + "transformer_blocks.12.norm1.linear.weight", + "transformer_blocks.13.attn1.to_k.weight", + "transformer_blocks.13.attn1.to_out.0.weight", + "transformer_blocks.13.attn1.to_q.weight", + "transformer_blocks.13.attn1.to_v.weight", + "transformer_blocks.13.ff.net.0.proj.weight", + "transformer_blocks.13.ff.net.2.weight", + "transformer_blocks.13.norm1.linear.weight", + "transformer_blocks.14.attn1.to_k.weight", + "transformer_blocks.14.attn1.to_out.0.weight", + "transformer_blocks.14.attn1.to_q.weight", + "transformer_blocks.14.attn1.to_v.weight", + "transformer_blocks.14.ff.net.0.proj.weight", + "transformer_blocks.14.ff.net.2.weight", + "transformer_blocks.14.norm1.linear.weight", + "transformer_blocks.15.attn1.to_k.weight", + "transformer_blocks.15.attn1.to_out.0.weight", + "transformer_blocks.15.attn1.to_q.weight", + "transformer_blocks.15.attn1.to_v.weight", + "transformer_blocks.15.ff.net.0.proj.weight", + "transformer_blocks.15.ff.net.2.weight", + "transformer_blocks.15.norm1.linear.weight", + "transformer_blocks.16.attn1.to_k.weight", + "transformer_blocks.16.attn1.to_out.0.weight", + "transformer_blocks.16.attn1.to_q.weight", + "transformer_blocks.16.attn1.to_v.weight", + "transformer_blocks.16.ff.net.0.proj.weight", + "transformer_blocks.16.ff.net.2.weight", + "transformer_blocks.16.norm1.linear.weight", + "transformer_blocks.17.attn1.to_k.weight", + "transformer_blocks.17.attn1.to_out.0.weight", + "transformer_blocks.17.attn1.to_q.weight", + "transformer_blocks.17.attn1.to_v.weight", + "transformer_blocks.17.ff.net.0.proj.weight", + "transformer_blocks.17.ff.net.2.weight", + "transformer_blocks.17.norm1.linear.weight", + "transformer_blocks.18.attn1.to_k.weight", + "transformer_blocks.18.attn1.to_out.0.weight", + "transformer_blocks.18.attn1.to_q.weight", + "transformer_blocks.18.attn1.to_v.weight", + "transformer_blocks.18.ff.net.0.proj.weight", + "transformer_blocks.18.ff.net.2.weight", + "transformer_blocks.18.norm1.linear.weight", + "transformer_blocks.19.attn1.to_k.weight", + "transformer_blocks.19.attn1.to_out.0.weight", + "transformer_blocks.19.attn1.to_q.weight", + "transformer_blocks.19.attn1.to_v.weight", + "transformer_blocks.19.ff.net.0.proj.weight", + "transformer_blocks.19.ff.net.2.weight", + "transformer_blocks.19.norm1.linear.weight", + "transformer_blocks.20.attn1.to_k.weight", + "transformer_blocks.20.attn1.to_out.0.weight", + "transformer_blocks.20.attn1.to_q.weight", + "transformer_blocks.20.attn1.to_v.weight", + "transformer_blocks.20.ff.net.0.proj.weight", + "transformer_blocks.20.ff.net.2.weight", + "transformer_blocks.20.norm1.linear.weight", + "transformer_blocks.21.attn1.to_k.weight", + "transformer_blocks.21.attn1.to_out.0.weight", + "transformer_blocks.21.attn1.to_q.weight", + "transformer_blocks.21.attn1.to_v.weight", + "transformer_blocks.21.ff.net.0.proj.weight", + "transformer_blocks.21.ff.net.2.weight", + "transformer_blocks.22.attn1.to_k.weight", + "transformer_blocks.22.attn1.to_out.0.weight", + "transformer_blocks.22.attn1.to_q.weight", + "transformer_blocks.22.attn1.to_v.weight", + "transformer_blocks.22.ff.net.0.proj.weight", + "transformer_blocks.22.ff.net.2.weight", + "transformer_blocks.23.attn1.to_k.weight", + "transformer_blocks.23.attn1.to_out.0.weight", + "transformer_blocks.23.attn1.to_q.weight", + "transformer_blocks.23.attn1.to_v.weight", + "transformer_blocks.23.ff.net.0.proj.weight", + "transformer_blocks.23.ff.net.2.weight", + "transformer_blocks.24.attn1.to_k.weight", + "transformer_blocks.24.attn1.to_out.0.weight", + "transformer_blocks.24.attn1.to_q.weight", + "transformer_blocks.24.attn1.to_v.weight", + "transformer_blocks.24.ff.net.0.proj.weight", + "transformer_blocks.24.ff.net.2.weight", + "transformer_blocks.25.attn1.to_k.weight", + "transformer_blocks.25.attn1.to_out.0.weight", + "transformer_blocks.25.attn1.to_q.weight", + "transformer_blocks.25.attn1.to_v.weight", + "transformer_blocks.25.ff.net.0.proj.weight", + "transformer_blocks.26.attn1.to_k.weight", + "transformer_blocks.26.attn1.to_out.0.weight", + "transformer_blocks.26.attn1.to_q.weight", + "transformer_blocks.26.ff.net.0.proj.weight", + "transformer_blocks.27.attn1.to_k.weight", + "transformer_blocks.27.attn1.to_out.0.weight", + "transformer_blocks.27.attn1.to_q.weight", + "transformer_blocks.27.ff.net.0.proj.weight", + "transformer_blocks.27.ff.net.2.weight", + "transformer_blocks.28.attn1.to_k.weight", + "transformer_blocks.28.attn1.to_out.0.weight", + "transformer_blocks.28.attn1.to_q.weight", + "transformer_blocks.28.ff.net.0.proj.weight", + "transformer_blocks.28.ff.net.2.weight", + "transformer_blocks.28.norm1.linear.weight", + "transformer_blocks.29.attn1.to_k.weight", + "transformer_blocks.29.attn1.to_out.0.weight", + "transformer_blocks.29.attn1.to_q.weight", + "transformer_blocks.29.ff.net.0.proj.weight", + "transformer_blocks.29.ff.net.2.weight", + "transformer_blocks.29.norm1.linear.weight" + ] + }, + "modules_to_not_convert": [ + "transformer_blocks.0.norm1.linear.weight", + "time_condition_embed", + "image_projector", + "proj_out", + "prior_projector", + "glyph_projector", + "norm_out" + ], + "non_blocking": false, + "quant_conv": false, + "quant_method": "sdnq", + "quantization_device": "cuda", + "quantized_matmul_dtype": null, + "return_device": "cuda", + "sdnq_version": "0.1.4", + "svd_rank": 32, + "svd_steps": 8, + "use_dynamic_quantization": true, + "use_grad_ckpt": true, + "use_quantized_matmul": false, + "use_quantized_matmul_conv": false, + "use_static_quantization": true, + "use_stochastic_rounding": false, + "use_svd": false, + "weights_dtype": "uint4" + }, + "text_embed_dim": 1472, + "time_embed_dim": 512 +} diff --git a/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/transformer/diffusion_pytorch_model.safetensors b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/transformer/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..4f88b98bef791233be4366caa51f1ab729e96890 --- /dev/null +++ b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/transformer/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a228933f18126ec5015f8d216cf5609a9cda9373ce662574abf159bb251843d +size 4193985424 diff --git a/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/vae/config.json b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/vae/config.json new file mode 100644 index 0000000000000000000000000000000000000000..aeb81840be9c02e90cba9263e8991e79979151d3 --- /dev/null +++ b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/vae/config.json @@ -0,0 +1,72 @@ +{ + "_class_name": "AutoencoderKL", + "_diffusers_version": "0.37.0.dev0", + "_name_or_path": "/home/disty/.cache/huggingface/hub/models--zai-org--GLM-Image/snapshots/a32e429538178757f852fd54b52a5e1681da1e35/vae", + "act_fn": "silu", + "block_out_channels": [ + 128, + 512, + 1024, + 1024 + ], + "down_block_types": [ + "DownEncoderBlock2D", + "DownEncoderBlock2D", + "DownEncoderBlock2D", + "DownEncoderBlock2D" + ], + "force_upcast": true, + "in_channels": 3, + "latent_channels": 16, + "latents_mean": [ + -0.2080078125, + 1.875, + -0.470703125, + -1.265625, + -1.421875, + 0.77734375, + -0.3671875, + -0.9453125, + 0.318359375, + 0.7734375, + -0.1884765625, + -0.022216796875, + -0.220703125, + -1.59375, + -0.81640625, + -0.255859375 + ], + "latents_std": [ + 3.0625, + 2.203125, + 2.265625, + 4.84375, + 2.5, + 3.9375, + 2.203125, + 3.03125, + 2.1875, + 2.046875, + 2.71875, + 2.390625, + 2.390625, + 2.453125, + 2.25, + 2.15625 + ], + "layers_per_block": 3, + "mid_block_add_attention": false, + "norm_num_groups": 32, + "out_channels": 3, + "sample_size": 1024, + "scaling_factor": 0.18215, + "shift_factor": null, + "up_block_types": [ + "UpDecoderBlock2D", + "UpDecoderBlock2D", + "UpDecoderBlock2D", + "UpDecoderBlock2D" + ], + "use_post_quant_conv": false, + "use_quant_conv": false +} diff --git a/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/vae/diffusion_pytorch_model.safetensors b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/vae/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..57a49305526ac7470648c6462fb1d1233af3c10b --- /dev/null +++ b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/vae/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a80a129b649cdb6d74d9c2b5bb060f3b882b7826b63a732306a7d3393deedbc0 +size 812234342 diff --git a/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/vision_language_encoder/config.json b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/vision_language_encoder/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bd27d298466d8882519de177a035b6b95a4f934f --- /dev/null +++ b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/vision_language_encoder/config.json @@ -0,0 +1,505 @@ +{ + "architectures": [ + "GlmImageForConditionalGeneration" + ], + "dtype": "bfloat16", + "image_end_token_id": 16385, + "image_start_token_id": 16384, + "image_token_id": 167855, + "model_type": "glm_image", + "quantization_config": { + "add_skip_keys": false, + "dequantize_fp32": false, + "dynamic_loss_threshold": 0.01, + "group_size": 0, + "is_integer": true, + "is_training": false, + "modules_dtype_dict": { + "int5": [ + "model.language_model.layers.28.self_attn.v_proj.weight", + "model.language_model.layers.29.self_attn.v_proj.weight", + "model.language_model.layers.32.self_attn.v_proj.weight", + "model.language_model.layers.33.self_attn.v_proj.weight", + "model.visual.blocks.0.attn.qkv.weight", + "model.visual.blocks.0.mlp.fc2.weight", + "model.visual.blocks.1.attn.qkv.weight", + "model.visual.blocks.1.mlp.fc1.weight", + "model.visual.blocks.1.mlp.fc2.weight", + "model.visual.blocks.2.attn.qkv.weight", + "model.visual.blocks.2.mlp.fc2.weight", + "model.visual.blocks.3.attn.qkv.weight", + "model.visual.blocks.3.mlp.fc2.weight", + "model.visual.blocks.4.mlp.fc2.weight", + "model.visual.blocks.5.mlp.fc2.weight", + "model.visual.blocks.6.mlp.fc2.weight", + "model.visual.blocks.7.mlp.fc2.weight", + "model.visual.blocks.8.mlp.fc2.weight", + "model.visual.blocks.9.mlp.fc2.weight" + ], + "uint4": [ + "model.language_model.layers.0.mlp.down_proj.weight", + "model.language_model.layers.0.mlp.gate_up_proj.weight", + "model.language_model.layers.0.self_attn.k_proj.weight", + "model.language_model.layers.0.self_attn.o_proj.weight", + "model.language_model.layers.0.self_attn.q_proj.weight", + "model.language_model.layers.0.self_attn.v_proj.weight", + "model.language_model.layers.1.mlp.down_proj.weight", + "model.language_model.layers.1.mlp.gate_up_proj.weight", + "model.language_model.layers.1.self_attn.k_proj.weight", + "model.language_model.layers.1.self_attn.o_proj.weight", + "model.language_model.layers.1.self_attn.q_proj.weight", + "model.language_model.layers.1.self_attn.v_proj.weight", + "model.language_model.layers.2.mlp.down_proj.weight", + "model.language_model.layers.2.mlp.gate_up_proj.weight", + "model.language_model.layers.2.self_attn.k_proj.weight", + "model.language_model.layers.2.self_attn.o_proj.weight", + "model.language_model.layers.2.self_attn.q_proj.weight", + "model.language_model.layers.2.self_attn.v_proj.weight", + "model.language_model.layers.3.mlp.down_proj.weight", + "model.language_model.layers.3.mlp.gate_up_proj.weight", + "model.language_model.layers.3.self_attn.k_proj.weight", + "model.language_model.layers.3.self_attn.o_proj.weight", + "model.language_model.layers.3.self_attn.q_proj.weight", + "model.language_model.layers.3.self_attn.v_proj.weight", + "model.language_model.layers.4.mlp.down_proj.weight", + "model.language_model.layers.4.mlp.gate_up_proj.weight", + "model.language_model.layers.4.self_attn.k_proj.weight", + "model.language_model.layers.4.self_attn.o_proj.weight", + "model.language_model.layers.4.self_attn.q_proj.weight", + "model.language_model.layers.4.self_attn.v_proj.weight", + "model.language_model.layers.5.mlp.down_proj.weight", + "model.language_model.layers.5.mlp.gate_up_proj.weight", + "model.language_model.layers.5.self_attn.k_proj.weight", + "model.language_model.layers.5.self_attn.o_proj.weight", + "model.language_model.layers.5.self_attn.q_proj.weight", + "model.language_model.layers.5.self_attn.v_proj.weight", + "model.language_model.layers.6.mlp.down_proj.weight", + "model.language_model.layers.6.mlp.gate_up_proj.weight", + "model.language_model.layers.6.self_attn.k_proj.weight", + "model.language_model.layers.6.self_attn.o_proj.weight", + "model.language_model.layers.6.self_attn.q_proj.weight", + "model.language_model.layers.6.self_attn.v_proj.weight", + "model.language_model.layers.7.mlp.down_proj.weight", + "model.language_model.layers.7.mlp.gate_up_proj.weight", + "model.language_model.layers.7.self_attn.k_proj.weight", + "model.language_model.layers.7.self_attn.o_proj.weight", + "model.language_model.layers.7.self_attn.q_proj.weight", + "model.language_model.layers.7.self_attn.v_proj.weight", + "model.language_model.layers.8.mlp.down_proj.weight", + "model.language_model.layers.8.mlp.gate_up_proj.weight", + "model.language_model.layers.8.self_attn.k_proj.weight", + "model.language_model.layers.8.self_attn.o_proj.weight", + "model.language_model.layers.8.self_attn.q_proj.weight", + "model.language_model.layers.8.self_attn.v_proj.weight", + "model.language_model.layers.9.mlp.down_proj.weight", + "model.language_model.layers.9.mlp.gate_up_proj.weight", + "model.language_model.layers.9.self_attn.k_proj.weight", + "model.language_model.layers.9.self_attn.o_proj.weight", + "model.language_model.layers.9.self_attn.q_proj.weight", + "model.language_model.layers.9.self_attn.v_proj.weight", + "model.language_model.layers.10.mlp.down_proj.weight", + "model.language_model.layers.10.mlp.gate_up_proj.weight", + "model.language_model.layers.10.self_attn.k_proj.weight", + "model.language_model.layers.10.self_attn.o_proj.weight", + "model.language_model.layers.10.self_attn.q_proj.weight", + "model.language_model.layers.10.self_attn.v_proj.weight", + "model.language_model.layers.11.mlp.down_proj.weight", + "model.language_model.layers.11.mlp.gate_up_proj.weight", + "model.language_model.layers.11.self_attn.k_proj.weight", + "model.language_model.layers.11.self_attn.o_proj.weight", + "model.language_model.layers.11.self_attn.q_proj.weight", + "model.language_model.layers.11.self_attn.v_proj.weight", + "model.language_model.layers.12.mlp.down_proj.weight", + "model.language_model.layers.12.mlp.gate_up_proj.weight", + "model.language_model.layers.12.self_attn.k_proj.weight", + "model.language_model.layers.12.self_attn.o_proj.weight", + "model.language_model.layers.12.self_attn.q_proj.weight", + "model.language_model.layers.12.self_attn.v_proj.weight", + "model.language_model.layers.13.mlp.down_proj.weight", + "model.language_model.layers.13.mlp.gate_up_proj.weight", + "model.language_model.layers.13.self_attn.k_proj.weight", + "model.language_model.layers.13.self_attn.o_proj.weight", + "model.language_model.layers.13.self_attn.q_proj.weight", + "model.language_model.layers.13.self_attn.v_proj.weight", + "model.language_model.layers.14.mlp.down_proj.weight", + "model.language_model.layers.14.mlp.gate_up_proj.weight", + "model.language_model.layers.14.self_attn.k_proj.weight", + "model.language_model.layers.14.self_attn.o_proj.weight", + "model.language_model.layers.14.self_attn.q_proj.weight", + "model.language_model.layers.14.self_attn.v_proj.weight", + "model.language_model.layers.15.mlp.down_proj.weight", + "model.language_model.layers.15.mlp.gate_up_proj.weight", + "model.language_model.layers.15.self_attn.k_proj.weight", + "model.language_model.layers.15.self_attn.o_proj.weight", + "model.language_model.layers.15.self_attn.q_proj.weight", + "model.language_model.layers.15.self_attn.v_proj.weight", + "model.language_model.layers.16.mlp.down_proj.weight", + "model.language_model.layers.16.mlp.gate_up_proj.weight", + "model.language_model.layers.16.self_attn.k_proj.weight", + "model.language_model.layers.16.self_attn.o_proj.weight", + "model.language_model.layers.16.self_attn.q_proj.weight", + "model.language_model.layers.16.self_attn.v_proj.weight", + "model.language_model.layers.17.mlp.down_proj.weight", + "model.language_model.layers.17.mlp.gate_up_proj.weight", + "model.language_model.layers.17.self_attn.k_proj.weight", + "model.language_model.layers.17.self_attn.o_proj.weight", + "model.language_model.layers.17.self_attn.q_proj.weight", + "model.language_model.layers.17.self_attn.v_proj.weight", + "model.language_model.layers.18.mlp.down_proj.weight", + "model.language_model.layers.18.mlp.gate_up_proj.weight", + "model.language_model.layers.18.self_attn.k_proj.weight", + "model.language_model.layers.18.self_attn.o_proj.weight", + "model.language_model.layers.18.self_attn.q_proj.weight", + "model.language_model.layers.18.self_attn.v_proj.weight", + "model.language_model.layers.19.mlp.down_proj.weight", + "model.language_model.layers.19.mlp.gate_up_proj.weight", + "model.language_model.layers.19.self_attn.k_proj.weight", + "model.language_model.layers.19.self_attn.o_proj.weight", + "model.language_model.layers.19.self_attn.q_proj.weight", + "model.language_model.layers.19.self_attn.v_proj.weight", + "model.language_model.layers.20.mlp.down_proj.weight", + "model.language_model.layers.20.mlp.gate_up_proj.weight", + "model.language_model.layers.20.self_attn.k_proj.weight", + "model.language_model.layers.20.self_attn.o_proj.weight", + "model.language_model.layers.20.self_attn.q_proj.weight", + "model.language_model.layers.20.self_attn.v_proj.weight", + "model.language_model.layers.21.mlp.down_proj.weight", + "model.language_model.layers.21.mlp.gate_up_proj.weight", + "model.language_model.layers.21.self_attn.k_proj.weight", + "model.language_model.layers.21.self_attn.o_proj.weight", + "model.language_model.layers.21.self_attn.q_proj.weight", + "model.language_model.layers.21.self_attn.v_proj.weight", + "model.language_model.layers.22.mlp.down_proj.weight", + "model.language_model.layers.22.mlp.gate_up_proj.weight", + "model.language_model.layers.22.self_attn.k_proj.weight", + "model.language_model.layers.22.self_attn.o_proj.weight", + "model.language_model.layers.22.self_attn.q_proj.weight", + "model.language_model.layers.22.self_attn.v_proj.weight", + "model.language_model.layers.23.mlp.down_proj.weight", + "model.language_model.layers.23.mlp.gate_up_proj.weight", + "model.language_model.layers.23.self_attn.k_proj.weight", + "model.language_model.layers.23.self_attn.o_proj.weight", + "model.language_model.layers.23.self_attn.q_proj.weight", + "model.language_model.layers.23.self_attn.v_proj.weight", + "model.language_model.layers.24.mlp.down_proj.weight", + "model.language_model.layers.24.mlp.gate_up_proj.weight", + "model.language_model.layers.24.self_attn.k_proj.weight", + "model.language_model.layers.24.self_attn.o_proj.weight", + "model.language_model.layers.24.self_attn.q_proj.weight", + "model.language_model.layers.24.self_attn.v_proj.weight", + "model.language_model.layers.25.mlp.down_proj.weight", + "model.language_model.layers.25.mlp.gate_up_proj.weight", + "model.language_model.layers.25.self_attn.k_proj.weight", + "model.language_model.layers.25.self_attn.o_proj.weight", + "model.language_model.layers.25.self_attn.q_proj.weight", + "model.language_model.layers.25.self_attn.v_proj.weight", + "model.language_model.layers.26.mlp.down_proj.weight", + "model.language_model.layers.26.mlp.gate_up_proj.weight", + "model.language_model.layers.26.self_attn.k_proj.weight", + "model.language_model.layers.26.self_attn.o_proj.weight", + "model.language_model.layers.26.self_attn.q_proj.weight", + "model.language_model.layers.26.self_attn.v_proj.weight", + "model.language_model.layers.27.mlp.down_proj.weight", + "model.language_model.layers.27.mlp.gate_up_proj.weight", + "model.language_model.layers.27.self_attn.k_proj.weight", + "model.language_model.layers.27.self_attn.o_proj.weight", + "model.language_model.layers.27.self_attn.q_proj.weight", + "model.language_model.layers.27.self_attn.v_proj.weight", + "model.language_model.layers.28.mlp.down_proj.weight", + "model.language_model.layers.28.mlp.gate_up_proj.weight", + "model.language_model.layers.28.self_attn.k_proj.weight", + "model.language_model.layers.28.self_attn.o_proj.weight", + "model.language_model.layers.28.self_attn.q_proj.weight", + "model.language_model.layers.29.mlp.down_proj.weight", + "model.language_model.layers.29.mlp.gate_up_proj.weight", + "model.language_model.layers.29.self_attn.k_proj.weight", + "model.language_model.layers.29.self_attn.o_proj.weight", + "model.language_model.layers.29.self_attn.q_proj.weight", + "model.language_model.layers.30.mlp.down_proj.weight", + "model.language_model.layers.30.mlp.gate_up_proj.weight", + "model.language_model.layers.30.self_attn.k_proj.weight", + "model.language_model.layers.30.self_attn.o_proj.weight", + "model.language_model.layers.30.self_attn.q_proj.weight", + "model.language_model.layers.30.self_attn.v_proj.weight", + "model.language_model.layers.31.mlp.down_proj.weight", + "model.language_model.layers.31.mlp.gate_up_proj.weight", + "model.language_model.layers.31.self_attn.k_proj.weight", + "model.language_model.layers.31.self_attn.o_proj.weight", + "model.language_model.layers.31.self_attn.q_proj.weight", + "model.language_model.layers.31.self_attn.v_proj.weight", + "model.language_model.layers.32.mlp.down_proj.weight", + "model.language_model.layers.32.mlp.gate_up_proj.weight", + "model.language_model.layers.32.self_attn.k_proj.weight", + "model.language_model.layers.32.self_attn.o_proj.weight", + "model.language_model.layers.32.self_attn.q_proj.weight", + "model.language_model.layers.33.mlp.down_proj.weight", + "model.language_model.layers.33.mlp.gate_up_proj.weight", + "model.language_model.layers.33.self_attn.k_proj.weight", + "model.language_model.layers.33.self_attn.o_proj.weight", + "model.language_model.layers.33.self_attn.q_proj.weight", + "model.language_model.layers.34.mlp.down_proj.weight", + "model.language_model.layers.34.mlp.gate_up_proj.weight", + "model.language_model.layers.34.self_attn.k_proj.weight", + "model.language_model.layers.34.self_attn.o_proj.weight", + "model.language_model.layers.34.self_attn.q_proj.weight", + "model.language_model.layers.34.self_attn.v_proj.weight", + "model.language_model.layers.35.mlp.down_proj.weight", + "model.language_model.layers.35.mlp.gate_up_proj.weight", + "model.language_model.layers.35.self_attn.k_proj.weight", + "model.language_model.layers.35.self_attn.o_proj.weight", + "model.language_model.layers.35.self_attn.q_proj.weight", + "model.language_model.layers.35.self_attn.v_proj.weight", + "model.language_model.layers.36.mlp.down_proj.weight", + "model.language_model.layers.36.mlp.gate_up_proj.weight", + "model.language_model.layers.36.self_attn.k_proj.weight", + "model.language_model.layers.36.self_attn.o_proj.weight", + "model.language_model.layers.36.self_attn.q_proj.weight", + "model.language_model.layers.36.self_attn.v_proj.weight", + "model.language_model.layers.37.mlp.down_proj.weight", + "model.language_model.layers.37.mlp.gate_up_proj.weight", + "model.language_model.layers.37.self_attn.k_proj.weight", + "model.language_model.layers.37.self_attn.o_proj.weight", + "model.language_model.layers.37.self_attn.q_proj.weight", + "model.language_model.layers.37.self_attn.v_proj.weight", + "model.language_model.layers.38.mlp.down_proj.weight", + "model.language_model.layers.38.mlp.gate_up_proj.weight", + "model.language_model.layers.38.self_attn.k_proj.weight", + "model.language_model.layers.38.self_attn.o_proj.weight", + "model.language_model.layers.38.self_attn.q_proj.weight", + "model.language_model.layers.38.self_attn.v_proj.weight", + "model.language_model.layers.39.mlp.down_proj.weight", + "model.language_model.layers.39.mlp.gate_up_proj.weight", + "model.language_model.layers.39.self_attn.k_proj.weight", + "model.language_model.layers.39.self_attn.o_proj.weight", + "model.language_model.layers.39.self_attn.q_proj.weight", + "model.language_model.layers.39.self_attn.v_proj.weight", + "model.visual.blocks.0.attn.proj.weight", + "model.visual.blocks.0.mlp.fc1.weight", + "model.visual.blocks.1.attn.proj.weight", + "model.visual.blocks.2.attn.proj.weight", + "model.visual.blocks.2.mlp.fc1.weight", + "model.visual.blocks.3.attn.proj.weight", + "model.visual.blocks.3.mlp.fc1.weight", + "model.visual.blocks.4.attn.proj.weight", + "model.visual.blocks.4.attn.qkv.weight", + "model.visual.blocks.4.mlp.fc1.weight", + "model.visual.blocks.5.attn.proj.weight", + "model.visual.blocks.5.attn.qkv.weight", + "model.visual.blocks.5.mlp.fc1.weight", + "model.visual.blocks.6.attn.proj.weight", + "model.visual.blocks.6.attn.qkv.weight", + "model.visual.blocks.6.mlp.fc1.weight", + "model.visual.blocks.7.attn.proj.weight", + "model.visual.blocks.7.attn.qkv.weight", + "model.visual.blocks.7.mlp.fc1.weight", + "model.visual.blocks.8.attn.proj.weight", + "model.visual.blocks.8.attn.qkv.weight", + "model.visual.blocks.8.mlp.fc1.weight", + "model.visual.blocks.9.attn.proj.weight", + "model.visual.blocks.9.attn.qkv.weight", + "model.visual.blocks.9.mlp.fc1.weight", + "model.visual.blocks.10.attn.proj.weight", + "model.visual.blocks.10.attn.qkv.weight", + "model.visual.blocks.10.mlp.fc1.weight", + "model.visual.blocks.10.mlp.fc2.weight", + "model.visual.blocks.11.attn.proj.weight", + "model.visual.blocks.11.attn.qkv.weight", + "model.visual.blocks.11.mlp.fc1.weight", + "model.visual.blocks.11.mlp.fc2.weight", + "model.visual.blocks.12.attn.proj.weight", + "model.visual.blocks.12.attn.qkv.weight", + "model.visual.blocks.12.mlp.fc1.weight", + "model.visual.blocks.12.mlp.fc2.weight", + "model.visual.blocks.13.attn.proj.weight", + "model.visual.blocks.13.attn.qkv.weight", + "model.visual.blocks.13.mlp.fc1.weight", + "model.visual.blocks.13.mlp.fc2.weight", + "model.visual.blocks.14.attn.proj.weight", + "model.visual.blocks.14.attn.qkv.weight", + "model.visual.blocks.14.mlp.fc1.weight", + "model.visual.blocks.14.mlp.fc2.weight", + "model.visual.blocks.15.attn.proj.weight", + "model.visual.blocks.15.attn.qkv.weight", + "model.visual.blocks.15.mlp.fc1.weight", + "model.visual.blocks.15.mlp.fc2.weight", + "model.visual.blocks.16.attn.proj.weight", + "model.visual.blocks.16.attn.qkv.weight", + "model.visual.blocks.16.mlp.fc1.weight", + "model.visual.blocks.16.mlp.fc2.weight", + "model.visual.blocks.17.attn.proj.weight", + "model.visual.blocks.17.attn.qkv.weight", + "model.visual.blocks.17.mlp.fc1.weight", + "model.visual.blocks.17.mlp.fc2.weight", + "model.visual.blocks.18.attn.proj.weight", + "model.visual.blocks.18.attn.qkv.weight", + "model.visual.blocks.18.mlp.fc1.weight", + "model.visual.blocks.18.mlp.fc2.weight", + "model.visual.blocks.19.attn.proj.weight", + "model.visual.blocks.19.attn.qkv.weight", + "model.visual.blocks.19.mlp.fc1.weight", + "model.visual.blocks.19.mlp.fc2.weight", + "model.visual.blocks.20.attn.proj.weight", + "model.visual.blocks.20.attn.qkv.weight", + "model.visual.blocks.20.mlp.fc1.weight", + "model.visual.blocks.20.mlp.fc2.weight", + "model.visual.blocks.21.attn.proj.weight", + "model.visual.blocks.21.attn.qkv.weight", + "model.visual.blocks.21.mlp.fc1.weight", + "model.visual.blocks.21.mlp.fc2.weight", + "model.visual.blocks.22.attn.proj.weight", + "model.visual.blocks.22.attn.qkv.weight", + "model.visual.blocks.22.mlp.fc1.weight", + "model.visual.blocks.22.mlp.fc2.weight", + "model.visual.blocks.23.attn.proj.weight", + "model.visual.blocks.23.attn.qkv.weight", + "model.visual.blocks.23.mlp.fc1.weight", + "model.visual.blocks.23.mlp.fc2.weight", + "model.visual.blocks.24.attn.proj.weight", + "model.visual.blocks.24.attn.qkv.weight", + "model.visual.blocks.24.mlp.fc1.weight", + "model.visual.blocks.24.mlp.fc2.weight", + "model.visual.blocks.25.attn.proj.weight", + "model.visual.blocks.25.attn.qkv.weight", + "model.visual.blocks.25.mlp.fc1.weight", + "model.visual.blocks.25.mlp.fc2.weight", + "model.visual.blocks.26.attn.proj.weight", + "model.visual.blocks.26.attn.qkv.weight", + "model.visual.blocks.26.mlp.fc1.weight", + "model.visual.blocks.26.mlp.fc2.weight", + "model.visual.blocks.27.attn.proj.weight", + "model.visual.blocks.27.attn.qkv.weight", + "model.visual.blocks.27.mlp.fc1.weight", + "model.visual.blocks.27.mlp.fc2.weight", + "model.visual.blocks.28.attn.proj.weight", + "model.visual.blocks.28.attn.qkv.weight", + "model.visual.blocks.28.mlp.fc1.weight", + "model.visual.blocks.28.mlp.fc2.weight", + "model.visual.blocks.29.attn.proj.weight", + "model.visual.blocks.29.attn.qkv.weight", + "model.visual.blocks.29.mlp.fc1.weight", + "model.visual.blocks.29.mlp.fc2.weight", + "model.visual.blocks.30.attn.proj.weight", + "model.visual.blocks.30.attn.qkv.weight", + "model.visual.blocks.30.mlp.fc1.weight", + "model.visual.blocks.30.mlp.fc2.weight", + "model.visual.blocks.31.attn.proj.weight", + "model.visual.blocks.31.attn.qkv.weight", + "model.visual.blocks.31.mlp.fc1.weight", + "model.visual.blocks.31.mlp.fc2.weight", + "model.visual.blocks.32.attn.proj.weight", + "model.visual.blocks.32.attn.qkv.weight", + "model.visual.blocks.32.mlp.fc1.weight", + "model.visual.blocks.32.mlp.fc2.weight", + "model.visual.blocks.33.attn.proj.weight", + "model.visual.blocks.33.attn.qkv.weight", + "model.visual.blocks.33.mlp.fc1.weight", + "model.visual.blocks.33.mlp.fc2.weight", + "model.visual.blocks.34.attn.proj.weight", + "model.visual.blocks.34.attn.qkv.weight", + "model.visual.blocks.34.mlp.fc1.weight", + "model.visual.blocks.34.mlp.fc2.weight", + "model.visual.blocks.35.attn.proj.weight", + "model.visual.blocks.35.attn.qkv.weight", + "model.visual.blocks.35.mlp.fc1.weight", + "model.visual.blocks.35.mlp.fc2.weight", + "model.visual.blocks.36.attn.proj.weight", + "model.visual.blocks.36.attn.qkv.weight", + "model.visual.blocks.36.mlp.fc1.weight", + "model.visual.blocks.36.mlp.fc2.weight", + "model.visual.blocks.37.attn.proj.weight", + "model.visual.blocks.37.attn.qkv.weight", + "model.visual.blocks.37.mlp.fc1.weight", + "model.visual.blocks.37.mlp.fc2.weight", + "model.visual.blocks.38.attn.proj.weight", + "model.visual.blocks.38.attn.qkv.weight", + "model.visual.blocks.38.mlp.fc1.weight", + "model.visual.blocks.38.mlp.fc2.weight", + "model.visual.blocks.39.attn.proj.weight", + "model.visual.blocks.39.attn.qkv.weight", + "model.visual.blocks.39.mlp.fc1.weight", + "model.visual.blocks.39.mlp.fc2.weight" + ] + }, + "modules_to_not_convert": [ + "vqmodel", + "lm_head", + "embeddings", + "embed_tokens", + "patch_embed" + ], + "non_blocking": false, + "quant_conv": false, + "quant_method": "sdnq", + "quantization_device": null, + "quantized_matmul_dtype": null, + "return_device": null, + "sdnq_version": "0.1.4", + "svd_rank": 32, + "svd_steps": 8, + "use_dynamic_quantization": true, + "use_grad_ckpt": true, + "use_quantized_matmul": false, + "use_quantized_matmul_conv": false, + "use_static_quantization": true, + "use_stochastic_rounding": false, + "use_svd": false, + "weights_dtype": "uint4" + }, + "text_config": { + "attention_bias": true, + "attention_dropout": 0.0, + "dtype": "bfloat16", + "eos_token_id": 16385, + "hidden_act": "silu", + "hidden_size": 4096, + "initializer_range": 0.02, + "intermediate_size": 13696, + "max_position_embeddings": 131072, + "model_type": "glm_image_text", + "num_attention_heads": 32, + "num_hidden_layers": 40, + "num_key_value_heads": 2, + "pad_token_id": 167841, + "rms_norm_eps": 1e-05, + "rope_parameters": { + "mrope_section": [ + 8, + 12, + 12 + ], + "partial_rotary_factor": 0.5, + "rope_theta": 10000, + "rope_type": "default" + }, + "use_cache": true, + "vision_vocab_size": 16512, + "vocab_size": 168064 + }, + "transformers_version": "5.0.0.dev0", + "vision_config": { + "attention_bias": true, + "attention_dropout": 0.0, + "depth": 40, + "dtype": "bfloat16", + "hidden_act": "gelu", + "hidden_size": 1536, + "image_size": 2048, + "in_channels": 3, + "initializer_range": 0.02, + "intermediate_size": 6144, + "layer_norm_eps": 1e-06, + "model_type": "glm_image_vision", + "num_heads": 16, + "patch_size": 16, + "spatial_merge_size": 1 + }, + "vq_config": { + "dtype": "bfloat16", + "embed_dim": 2048, + "in_channels": 3, + "initializer_range": 0.02, + "latent_channels": 1536, + "model_type": "glm_image_vqmodel", + "num_embeddings": 16384 + } +} diff --git a/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/vision_language_encoder/model-00001-of-00002.safetensors b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/vision_language_encoder/model-00001-of-00002.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ead558964e74f376925f7140800623d2edc28963 --- /dev/null +++ b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/vision_language_encoder/model-00001-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77a666a690adf0c16670b9613707f331bc2a9a4ecf4484a63c0c1dd6399defae +size 4990261848 diff --git a/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/vision_language_encoder/model-00002-of-00002.safetensors b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/vision_language_encoder/model-00002-of-00002.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bfb2398b7ee1e0e1f12eb213195c0dce296517e3 --- /dev/null +++ b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/vision_language_encoder/model-00002-of-00002.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b1d6be8219eab4d13bb7c8a38f4d247400cb34bf11831ae482b10bebbc9fe54 +size 1894171528 diff --git a/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/vision_language_encoder/model.safetensors.index.json b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/vision_language_encoder/model.safetensors.index.json new file mode 100644 index 0000000000000000000000000000000000000000..aebfff2a0d3109b29a60afaf1c091da607bea9aa --- /dev/null +++ b/glm-image/GLM-Image-SDNQ-4bit-dynamic/snapshots/0a8f8b4885f706bdc7ca08c623b959a61bb5aec8/vision_language_encoder/model.safetensors.index.json @@ -0,0 +1,1800 @@ +{ + "metadata": { + "total_parameters": 5773222912, + "total_size": 6884214784 + }, + "weight_map": { + "lm_head.weight": "model-00001-of-00002.safetensors", + "model.language_model.embed_tokens.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.0.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.1.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.10.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.11.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.12.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.13.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.14.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.15.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.16.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.17.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.18.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.19.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.2.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.20.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.21.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.22.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.23.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.24.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.25.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.26.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.27.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.28.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.29.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.3.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.30.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.30.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.30.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.30.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.30.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.30.mlp.gate_up_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.30.mlp.gate_up_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.30.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.30.post_mlp_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.30.post_self_attn_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.30.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.30.self_attn.k_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.30.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.30.self_attn.k_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.30.self_attn.o_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.30.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.30.self_attn.o_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.30.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.30.self_attn.q_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.30.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.30.self_attn.q_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.30.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.30.self_attn.v_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.30.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.30.self_attn.v_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.mlp.down_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.mlp.down_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.mlp.gate_up_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.mlp.gate_up_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.mlp.gate_up_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.post_mlp_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.post_self_attn_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.self_attn.k_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.self_attn.k_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.self_attn.o_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.self_attn.o_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.self_attn.q_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.self_attn.q_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.self_attn.v_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.31.self_attn.v_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.mlp.down_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.mlp.down_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.mlp.gate_up_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.mlp.gate_up_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.mlp.gate_up_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.post_mlp_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.post_self_attn_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.self_attn.k_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.self_attn.k_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.self_attn.o_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.self_attn.o_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.self_attn.q_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.self_attn.q_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.self_attn.v_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.32.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.mlp.down_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.mlp.down_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.mlp.gate_up_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.mlp.gate_up_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.mlp.gate_up_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.post_mlp_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.post_self_attn_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.self_attn.k_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.self_attn.k_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.self_attn.o_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.self_attn.o_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.self_attn.q_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.self_attn.q_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.self_attn.v_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.33.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.mlp.down_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.mlp.down_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.mlp.gate_up_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.mlp.gate_up_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.mlp.gate_up_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.post_mlp_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.post_self_attn_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.self_attn.k_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.self_attn.k_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.self_attn.o_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.self_attn.o_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.self_attn.q_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.self_attn.q_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.self_attn.v_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.34.self_attn.v_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.mlp.down_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.mlp.down_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.mlp.gate_up_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.mlp.gate_up_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.mlp.gate_up_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.post_mlp_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.post_self_attn_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.self_attn.k_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.self_attn.k_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.self_attn.o_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.self_attn.o_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.self_attn.q_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.self_attn.q_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.self_attn.v_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.35.self_attn.v_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.mlp.down_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.mlp.down_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.mlp.gate_up_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.mlp.gate_up_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.mlp.gate_up_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.post_mlp_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.post_self_attn_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.self_attn.k_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.self_attn.k_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.self_attn.o_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.self_attn.o_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.self_attn.q_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.self_attn.q_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.self_attn.v_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.36.self_attn.v_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.mlp.down_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.mlp.down_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.mlp.gate_up_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.mlp.gate_up_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.mlp.gate_up_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.post_mlp_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.post_self_attn_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.self_attn.k_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.self_attn.k_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.self_attn.o_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.self_attn.o_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.self_attn.q_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.self_attn.q_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.self_attn.v_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.37.self_attn.v_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.mlp.down_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.mlp.down_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.mlp.gate_up_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.mlp.gate_up_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.mlp.gate_up_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.post_mlp_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.post_self_attn_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.self_attn.k_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.self_attn.k_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.self_attn.o_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.self_attn.o_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.self_attn.q_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.self_attn.q_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.self_attn.v_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.38.self_attn.v_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.input_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.mlp.down_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.mlp.down_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.mlp.down_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.mlp.gate_up_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.mlp.gate_up_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.mlp.gate_up_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.post_attention_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.post_mlp_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.post_self_attn_layernorm.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.self_attn.k_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.self_attn.k_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.self_attn.k_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.self_attn.k_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.self_attn.o_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.self_attn.o_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.self_attn.o_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.self_attn.q_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.self_attn.q_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.self_attn.q_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.self_attn.q_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.self_attn.v_proj.bias": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.self_attn.v_proj.scale": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.self_attn.v_proj.weight": "model-00002-of-00002.safetensors", + "model.language_model.layers.39.self_attn.v_proj.zero_point": "model-00002-of-00002.safetensors", + "model.language_model.layers.4.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.4.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.5.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.6.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.7.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.8.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.input_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.mlp.down_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.mlp.down_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.mlp.down_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.mlp.gate_up_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.mlp.gate_up_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.mlp.gate_up_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.post_attention_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.post_mlp_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.post_self_attn_layernorm.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.self_attn.k_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.self_attn.k_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.self_attn.k_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.self_attn.k_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.self_attn.o_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.self_attn.o_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.self_attn.o_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.self_attn.q_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.self_attn.q_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.self_attn.q_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.self_attn.q_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.self_attn.v_proj.bias": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.self_attn.v_proj.scale": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.self_attn.v_proj.weight": "model-00001-of-00002.safetensors", + "model.language_model.layers.9.self_attn.v_proj.zero_point": "model-00001-of-00002.safetensors", + "model.language_model.norm.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.0.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.0.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.0.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.0.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.0.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.0.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.0.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.0.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.0.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.0.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.0.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.0.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.0.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.0.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.0.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.0.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.0.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.0.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.1.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.1.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.1.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.1.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.1.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.1.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.1.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.1.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.1.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.1.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.1.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.1.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.1.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.1.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.1.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.1.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.1.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.10.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.10.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.10.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.10.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.10.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.10.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.10.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.10.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.10.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.10.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.10.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.10.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.10.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.10.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.10.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.10.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.10.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.10.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.10.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.10.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.11.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.11.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.11.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.11.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.11.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.11.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.11.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.11.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.11.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.11.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.11.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.11.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.11.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.11.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.11.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.11.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.11.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.11.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.11.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.11.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.12.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.12.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.12.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.12.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.12.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.12.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.12.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.12.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.12.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.12.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.12.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.12.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.12.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.12.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.12.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.12.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.12.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.12.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.12.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.12.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.13.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.13.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.13.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.13.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.13.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.13.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.13.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.13.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.13.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.13.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.13.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.13.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.13.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.13.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.13.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.13.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.13.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.13.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.13.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.13.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.14.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.14.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.14.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.14.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.14.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.14.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.14.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.14.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.14.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.14.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.14.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.14.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.14.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.14.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.14.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.14.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.14.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.14.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.14.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.14.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.15.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.15.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.15.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.15.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.15.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.15.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.15.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.15.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.15.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.15.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.15.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.15.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.15.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.15.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.15.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.15.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.15.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.15.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.15.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.15.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.16.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.16.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.16.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.16.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.16.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.16.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.16.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.16.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.16.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.16.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.16.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.16.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.16.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.16.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.16.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.16.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.16.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.16.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.16.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.16.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.17.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.17.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.17.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.17.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.17.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.17.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.17.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.17.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.17.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.17.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.17.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.17.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.17.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.17.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.17.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.17.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.17.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.17.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.17.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.17.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.18.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.18.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.18.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.18.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.18.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.18.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.18.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.18.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.18.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.18.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.18.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.18.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.18.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.18.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.18.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.18.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.18.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.18.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.18.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.18.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.19.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.19.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.19.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.19.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.19.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.19.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.19.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.19.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.19.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.19.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.19.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.19.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.19.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.19.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.19.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.19.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.19.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.19.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.19.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.19.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.2.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.2.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.2.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.2.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.2.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.2.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.2.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.2.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.2.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.2.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.2.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.2.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.2.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.2.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.2.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.2.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.2.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.2.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.20.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.20.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.20.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.20.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.20.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.20.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.20.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.20.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.20.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.20.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.20.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.20.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.20.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.20.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.20.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.20.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.20.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.20.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.20.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.20.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.21.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.21.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.21.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.21.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.21.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.21.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.21.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.21.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.21.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.21.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.21.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.21.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.21.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.21.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.21.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.21.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.21.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.21.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.21.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.21.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.22.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.22.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.22.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.22.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.22.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.22.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.22.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.22.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.22.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.22.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.22.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.22.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.22.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.22.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.22.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.22.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.22.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.22.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.22.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.22.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.23.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.23.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.23.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.23.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.23.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.23.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.23.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.23.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.23.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.23.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.23.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.23.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.23.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.23.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.23.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.23.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.23.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.23.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.23.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.23.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.24.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.24.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.24.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.24.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.24.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.24.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.24.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.24.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.24.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.24.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.24.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.24.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.24.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.24.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.24.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.24.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.24.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.24.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.24.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.24.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.25.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.25.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.25.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.25.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.25.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.25.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.25.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.25.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.25.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.25.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.25.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.25.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.25.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.25.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.25.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.25.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.25.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.25.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.25.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.25.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.26.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.26.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.26.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.26.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.26.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.26.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.26.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.26.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.26.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.26.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.26.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.26.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.26.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.26.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.26.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.26.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.26.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.26.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.26.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.26.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.27.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.27.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.27.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.27.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.27.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.27.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.27.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.27.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.27.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.27.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.27.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.27.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.27.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.27.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.27.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.27.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.27.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.27.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.27.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.27.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.28.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.28.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.28.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.28.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.28.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.28.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.28.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.28.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.28.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.28.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.28.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.28.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.28.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.28.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.28.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.28.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.28.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.28.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.28.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.28.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.29.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.29.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.29.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.29.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.29.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.29.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.29.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.29.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.29.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.29.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.29.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.29.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.29.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.29.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.29.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.29.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.29.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.29.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.29.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.29.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.3.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.3.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.3.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.3.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.3.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.3.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.3.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.3.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.3.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.3.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.3.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.3.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.3.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.3.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.3.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.3.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.3.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.3.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.30.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.30.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.30.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.30.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.30.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.30.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.30.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.30.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.30.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.30.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.30.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.30.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.30.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.30.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.30.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.30.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.30.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.30.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.30.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.30.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.31.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.31.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.31.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.31.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.31.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.31.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.31.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.31.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.31.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.31.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.31.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.31.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.31.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.31.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.31.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.31.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.31.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.31.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.31.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.31.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.32.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.32.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.32.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.32.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.32.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.32.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.32.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.32.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.32.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.32.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.32.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.32.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.32.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.32.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.32.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.32.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.32.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.32.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.32.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.32.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.33.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.33.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.33.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.33.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.33.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.33.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.33.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.33.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.33.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.33.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.33.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.33.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.33.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.33.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.33.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.33.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.33.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.33.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.33.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.33.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.34.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.34.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.34.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.34.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.34.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.34.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.34.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.34.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.34.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.34.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.34.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.34.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.34.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.34.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.34.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.34.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.34.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.34.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.34.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.34.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.35.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.35.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.35.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.35.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.35.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.35.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.35.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.35.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.35.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.35.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.35.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.35.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.35.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.35.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.35.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.35.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.35.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.35.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.35.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.35.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.36.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.36.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.36.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.36.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.36.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.36.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.36.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.36.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.36.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.36.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.36.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.36.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.36.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.36.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.36.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.36.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.36.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.36.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.36.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.36.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.37.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.37.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.37.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.37.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.37.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.37.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.37.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.37.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.37.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.37.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.37.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.37.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.37.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.37.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.37.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.37.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.37.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.37.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.37.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.37.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.38.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.38.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.38.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.38.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.38.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.38.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.38.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.38.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.38.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.38.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.38.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.38.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.38.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.38.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.38.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.38.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.38.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.38.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.38.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.38.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.39.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.39.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.39.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.39.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.39.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.39.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.39.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.39.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.39.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.39.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.39.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.39.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.39.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.39.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.39.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.39.mlp.fc2.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.39.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.39.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.39.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.39.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.4.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.4.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.4.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.4.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.4.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.4.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.4.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.4.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.4.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.4.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.4.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.4.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.4.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.4.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.4.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.4.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.4.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.4.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.4.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.5.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.5.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.5.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.5.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.5.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.5.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.5.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.5.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.5.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.5.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.5.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.5.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.5.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.5.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.5.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.5.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.5.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.5.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.5.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.6.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.6.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.6.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.6.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.6.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.6.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.6.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.6.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.6.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.6.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.6.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.6.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.6.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.6.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.6.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.6.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.6.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.6.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.6.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.7.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.7.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.7.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.7.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.7.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.7.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.7.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.7.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.7.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.7.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.7.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.7.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.7.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.7.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.7.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.7.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.7.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.7.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.7.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.8.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.8.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.8.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.8.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.8.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.8.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.8.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.8.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.8.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.8.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.8.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.8.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.8.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.8.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.8.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.8.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.8.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.8.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.8.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.9.attn.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.9.attn.proj.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.9.attn.proj.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.9.attn.proj.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.9.attn.qkv.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.9.attn.qkv.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.9.attn.qkv.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.9.attn.qkv.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.9.mlp.fc1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.9.mlp.fc1.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.9.mlp.fc1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.9.mlp.fc1.zero_point": "model-00002-of-00002.safetensors", + "model.visual.blocks.9.mlp.fc2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.9.mlp.fc2.scale": "model-00002-of-00002.safetensors", + "model.visual.blocks.9.mlp.fc2.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.9.norm1.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.9.norm1.weight": "model-00002-of-00002.safetensors", + "model.visual.blocks.9.norm2.bias": "model-00002-of-00002.safetensors", + "model.visual.blocks.9.norm2.weight": "model-00002-of-00002.safetensors", + "model.visual.embeddings.position_embedding.weight": "model-00002-of-00002.safetensors", + "model.visual.patch_embed.proj.bias": "model-00002-of-00002.safetensors", + "model.visual.patch_embed.proj.weight": "model-00002-of-00002.safetensors", + "model.vqmodel.post_quant_conv.bias": "model-00002-of-00002.safetensors", + "model.vqmodel.post_quant_conv.weight": "model-00002-of-00002.safetensors", + "model.vqmodel.quant_conv.bias": "model-00002-of-00002.safetensors", + "model.vqmodel.quant_conv.weight": "model-00002-of-00002.safetensors", + "model.vqmodel.quantize.embedding.weight": "model-00002-of-00002.safetensors" + } +}