{
    "model_type": "chatglm",
    "model_class": "FineTuneVisualGLMModel",
    "tokenizer_type": "THUDM/chatglm-6b",
    "num_layers": 28,
    "hidden_size": 4096,
    "num_attention_heads": 32,
    "vocab_size": 130528,
    "layernorm_order": "post",
    "model_parallel_size": 1,
    "max_sequence_length": 2048,
    "pre_seq_len": 4,
    "lora_rank": 32,
    "use_ptuning": false,
    "use_lora": true,
    "use_qlora": false,
    "layer_range": [],
    "image_length": 32,
    "eva_args": {
        "num_layers": 39,
        "hidden_size": 1408,
        "num_attention_heads": 16,
        "vocab_size": 1,
        "layernorm_order": "pre",
        "model_parallel_size": 1,
        "max_sequence_length": 257,
        "inner_hidden_size": 6144,
        "use_final_layernorm": false,
        "layernorm_epsilon": 1e-06,
        "image_size": [224, 224],
        "pre_len": 1,
        "post_len": 0,
        "in_channels": 3,
        "num_classes": 0,
        "patch_size": 14
    },
    "qformer_args": {
        "num_layers": 12,
        "hidden_size": 768,
        "num_attention_heads": 12,
        "vocab_size": 32,
        "layernorm_order": "post",
        "model_parallel_size": 1,
        "max_sequence_length": 0,
        "is_decoder": [true, false, true, false, true, false, true, false, true, false, true, false],
        "cross_attn_hidden_size": 1408,
        "layernorm_epsilon": 1e-12
    },
    "bos_token_id": 130004,
    "mask_token_id": 130000,
    "gmask_token_id": 130001,
    "pad_token_id": 3,
    "image_size": [224, 224],
    "pre_len": 1,
    "post_len": 0,
    "in_channels": 3,
    "patch_size": 14
}
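As a minimal sketch of how such a config might be consumed, the snippet below loads the JSON and reports which parameter-efficient tuning flag is active. The filename `model_config.json` and the interpretation of an empty `layer_range` are assumptions for illustration, not confirmed behavior of the training code:

```python
import json

# Minimal sketch: load the config above (assumed saved as
# "model_config.json") and summarize the tuning setup.
with open("model_config.json", "r", encoding="utf-8") as f:
    cfg = json.load(f)

# At most one of the tuning flags is expected to be enabled;
# this particular config sets use_lora=true with lora_rank=32.
active = [k for k in ("use_ptuning", "use_lora", "use_qlora") if cfg[k]]
print(f"model_type={cfg['model_type']}, active tuning: {active}")

# Assumption: an empty layer_range is read here as "apply LoRA to
# all num_layers transformer layers"; the real training script may
# interpret it differently.
layers = cfg["layer_range"] or list(range(cfg["num_layers"]))
print(f"LoRA rank {cfg['lora_rank']} over {len(layers)} layers")
```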
|
|