| { | |
| "auto_resume": true, | |
| "batch_size": 4, | |
| "bce_loss_weight": 1.0, | |
| "beta1": 0.9, | |
| "beta2": 0.95, | |
| "bos_token_id": 1, | |
| "capacity_factor": 2.0, | |
| "ce_loss_weight": 2.0, | |
| "conv_type": "llava_v1", | |
| "data_path": "/root/paddlejob/workspace/env_run/data/huangxiaoshuang/jsons/seg/0301_CombinedAll_7.5w_train1_chatlm_img_coord2_rand5k_seg_cat_origin.json", | |
| "dice_loss_weight": 1.0, | |
| "eos_token_id": 2, | |
| "ep_size": 1, | |
| "epochs": 1, | |
| "eval_capacity_factor": 2, | |
| "eval_only": true, | |
| "exclude_val": false, | |
| "exp_name": "", | |
| "expert_pretrained_path": "/root/paddlejob/workspace/env_run/output/huangxiaoshuang/BiRD2/runs/medplib-7b-stage3/hf,/root/paddlejob/workspace/env_run/output/huangxiaoshuang/BiRD2/runs/medplib-7b-stage2/hf", | |
| "explanatory": 0.1, | |
| "finetune_moe": false, | |
| "focal_loss_weight": 1.0, | |
| "grad_accumulation_steps": 8, | |
| "gradient_checkpointing": true, | |
| "image_aspect_ratio": "pad", | |
| "image_folder": "/tmp/v2_mnt/HCG/huangxiaoshuang/SAMed2D_v1", | |
| "iou_loss_weight": 2.0, | |
| "is_multimodal": true, | |
| "local_rank": 0, | |
| "log_base_dir": "./runs", | |
| "log_dir": "./runs/", | |
| "lora_alpha": 16, | |
| "lora_dropout": 0.05, | |
| "lora_r": 8, | |
| "lora_target_modules": "gate_proj,up_proj,down_proj,q_proj,v_proj", | |
| "lr": 2e-05, | |
| "max_length": 4096, | |
| "max_sample_point": 512, | |
| "min_capacity": 0, | |
| "model_max_length": 1024, | |
| "moe_enable": true, | |
| "moe_layers_idx": null, | |
| "moe_mode": "dense", | |
| "no_eval": false, | |
| "num_classes_per_sample": 3, | |
| "num_experts": [ | |
| 2 | |
| ], | |
| "out_dim": 256, | |
| "pad_token_id": 0, | |
| "precision": "bf16", | |
| "pretrain_mm_mlp_adapter": null, | |
| "print_freq": 1, | |
| "region_fea_adapter": true, | |
| "region_geo_sampler": false, | |
| "resume": "", | |
| "router_aux_loss_coef": 0.0, | |
| "sam_img_size": 256, | |
| "sampler_pooler_mode": "max", | |
| "save_path": "/root/paddlejob/workspace/env_run/output/huangxiaoshuang/BiRD2/runs/lisa-7b-bird-0514_1/hf", | |
| "save_steps": 200, | |
| "seg_token_idx": 32000, | |
| "sft_modules": "wg,lm_head,embed_tokens,mask_decoder,text_hidden_fcs,region_fea_adapter", | |
| "start_epoch": 0, | |
| "top_k_experts": 1, | |
| "train_mask_decoder": true, | |
| "transformers_version": "4.31.0", | |
| "use_mm_start_end": true, | |
| "use_residual": false, | |
| "val_batch_size": 1, | |
| "val_data_path": "/root/paddlejob/workspace/env_run/data/huangxiaoshuang/jsons/seg/0301_CombinedAll_7.5w_train1_chatlm_img_coord2_rand5k_seg.json", | |
| "version": "/root/paddlejob/workspace/env_run/output/huangxiaoshuang/BiRD2/runs/lisa-7b-bird-0504/hf", | |
| "vis_save_path": "./vis_output", | |
| "vision_pretrained": "/root/paddlejob/workspace/env_run/output/huangxiaoshuang/huggingface_models/sam-med2d_b.pth", | |
| "vision_tower": "/root/paddlejob/workspace/env_run/output/huangxiaoshuang/huggingface_models/clip-vit-large-patch14-336", | |
| "weight": "/root/paddlejob/workspace/env_run/output/huangxiaoshuang/BiRD2/runs/lisa-7b-bird-0514_1/pytorch_model.bin", | |
| "workers": 8 | |
| } | |