MedPLIB-7b-2e / generation_config.json
Huangxs's picture
Upload 8 files
ca935d3 verified
{
"auto_resume": true,
"batch_size": 4,
"bce_loss_weight": 1.0,
"beta1": 0.9,
"beta2": 0.95,
"bos_token_id": 1,
"capacity_factor": 2.0,
"ce_loss_weight": 2.0,
"conv_type": "llava_v1",
"data_path": "/root/paddlejob/workspace/env_run/data/huangxiaoshuang/jsons/seg/0301_CombinedAll_7.5w_train1_chatlm_img_coord2_rand5k_seg_cat_origin.json",
"dice_loss_weight": 1.0,
"eos_token_id": 2,
"ep_size": 1,
"epochs": 1,
"eval_capacity_factor": 2,
"eval_only": true,
"exclude_val": false,
"exp_name": "",
"expert_pretrained_path": "/root/paddlejob/workspace/env_run/output/huangxiaoshuang/BiRD2/runs/medplib-7b-stage3/hf,/root/paddlejob/workspace/env_run/output/huangxiaoshuang/BiRD2/runs/medplib-7b-stage2/hf",
"explanatory": 0.1,
"finetune_moe": false,
"focal_loss_weight": 1.0,
"grad_accumulation_steps": 8,
"gradient_checkpointing": true,
"image_aspect_ratio": "pad",
"image_folder": "/tmp/v2_mnt/HCG/huangxiaoshuang/SAMed2D_v1",
"iou_loss_weight": 2.0,
"is_multimodal": true,
"local_rank": 0,
"log_base_dir": "./runs",
"log_dir": "./runs/",
"lora_alpha": 16,
"lora_dropout": 0.05,
"lora_r": 8,
"lora_target_modules": "gate_proj,up_proj,down_proj,q_proj,v_proj",
"lr": 2e-05,
"max_length": 4096,
"max_sample_point": 512,
"min_capacity": 0,
"model_max_length": 1024,
"moe_enable": true,
"moe_layers_idx": null,
"moe_mode": "dense",
"no_eval": false,
"num_classes_per_sample": 3,
"num_experts": [
2
],
"out_dim": 256,
"pad_token_id": 0,
"precision": "bf16",
"pretrain_mm_mlp_adapter": null,
"print_freq": 1,
"region_fea_adapter": true,
"region_geo_sampler": false,
"resume": "",
"router_aux_loss_coef": 0.0,
"sam_img_size": 256,
"sampler_pooler_mode": "max",
"save_path": "/root/paddlejob/workspace/env_run/output/huangxiaoshuang/BiRD2/runs/lisa-7b-bird-0514_1/hf",
"save_steps": 200,
"seg_token_idx": 32000,
"sft_modules": "wg,lm_head,embed_tokens,mask_decoder,text_hidden_fcs,region_fea_adapter",
"start_epoch": 0,
"top_k_experts": 1,
"train_mask_decoder": true,
"transformers_version": "4.31.0",
"use_mm_start_end": true,
"use_residual": false,
"val_batch_size": 1,
"val_data_path": "/root/paddlejob/workspace/env_run/data/huangxiaoshuang/jsons/seg/0301_CombinedAll_7.5w_train1_chatlm_img_coord2_rand5k_seg.json",
"version": "/root/paddlejob/workspace/env_run/output/huangxiaoshuang/BiRD2/runs/lisa-7b-bird-0504/hf",
"vis_save_path": "./vis_output",
"vision_pretrained": "/root/paddlejob/workspace/env_run/output/huangxiaoshuang/huggingface_models/sam-med2d_b.pth",
"vision_tower": "/root/paddlejob/workspace/env_run/output/huangxiaoshuang/huggingface_models/clip-vit-large-patch14-336",
"weight": "/root/paddlejob/workspace/env_run/output/huangxiaoshuang/BiRD2/runs/lisa-7b-bird-0514_1/pytorch_model.bin",
"workers": 8
}