Rihong's picture
Update config.json
0cb2c4c verified
{
"add_second_msg": true,
"architectures": [
"VideoChat2_it_hd_mistral"
],
"auto_map": {
"AutoConfig": "configuration_videochat2.Config",
"AutoModel": "videochat2_it_hd_mistral.VideoChat2_it_hd_mistral"
},
"dynamic_config": {
"add_global": true,
"hd_num": 6,
"local_size": 224,
"padding": false
},
"end_token": "</Video>",
"extra_num_query_token": 64,
"freeze_qformer": false,
"freeze_vit": false,
"img_end_token": "</Image>",
"img_start_token": "<Image>",
"lora_alpha": 32,
"lora_dropout": 0.1,
"lora_r": 16,
"low_resource": false,
"max_txt_len": 512,
"mistral_model_path": "mistralai/Mistral-7B-Instruct-v0.2",
"model_cls": "VideoChat2_it_hd_mistral",
"num_query_token": 32,
"qformer_attention_probs_dropout_prob": 0.1,
"qformer_drop_path_rate": 0.2,
"qformer_hidden_dropout_prob": 0.1,
"qformer_text_input": true,
"random_shuffle": true,
"return_question_instruction": false,
"start_token": "<Video>",
"system": "",
"torch_dtype": "float32",
"transformers_version": "4.49.0",
"use_flash_attention": false,
"use_lora": false,
"videochat2_model_path": "",
"vision_encoder": {
"checkpoint_num": 18,
"ckpt_num_frame": 4,
"d_model": 1024,
"drop_path_rate": 0.0,
"encoder_depth": 24,
"encoder_embed_dim": 1024,
"encoder_num_heads": 16,
"img_size": 224,
"name": "vit_l14",
"num_frames": 4,
"patch_size": 16,
"pretrained": "",
"return_index": -2,
"tubelet_size": 1,
"use_checkpoint": true,
"vit_add_ln": true
},
"vit_blip_model_path": ""
}