|
|
|
|
|
from mmengine.dataset import DefaultSampler |
|
|
from mmengine.hooks import (CheckpointHook, DistSamplerSeedHook, IterTimerHook, |
|
|
LoggerHook, ParamSchedulerHook) |
|
|
|
|
|
from vlm.engine.runner.loops import AnnoLoop |
|
|
from xtuner.dataset import ConcatDataset |
|
|
|
|
|
from projects.mllm_labeling.models import MLLM_Annotor |
|
|
from projects.mllm_labeling.datasets.demo_dataset import DemoImageCap |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
llm_name_or_path = './pretrained/internvl/InternVL2-Llama3-76B-AWQ/' |
|
|
save_folder = './1215_demos/mllm_object_cap/' |
|
|
|
|
|
model = dict( |
|
|
type=MLLM_Annotor, |
|
|
model=llm_name_or_path, |
|
|
save_folder=save_folder, |
|
|
) |
|
|
|
|
|
test_dataset = [dict( |
|
|
type=DemoImageCap, |
|
|
image_folder='./1215_demos/mask_outs/out/', |
|
|
bs=8, |
|
|
)] |
|
|
|
|
|
test_dataloader = dict( |
|
|
batch_size=1, |
|
|
num_workers=1, |
|
|
drop_last=False, |
|
|
sampler=dict(type=DefaultSampler, shuffle=False), |
|
|
dataset=dict(type=ConcatDataset, datasets=test_dataset), |
|
|
) |
|
|
|
|
|
test_evaluator = dict() |
|
|
test_cfg = dict(type=AnnoLoop, select_metric='first') |
|
|
|
|
|
custom_hooks = [] |
|
|
|
|
|
|
|
|
default_hooks = dict( |
|
|
|
|
|
timer=dict(type=IterTimerHook), |
|
|
|
|
|
logger=dict(type=LoggerHook, log_metric_by_epoch=False, interval=10), |
|
|
|
|
|
param_scheduler=dict(type=ParamSchedulerHook), |
|
|
|
|
|
sampler_seed=dict(type=DistSamplerSeedHook), |
|
|
) |
|
|
|
|
|
|
|
|
env_cfg = dict( |
|
|
|
|
|
cudnn_benchmark=False, |
|
|
|
|
|
mp_cfg=dict(mp_start_method='fork', opencv_num_threads=0), |
|
|
|
|
|
dist_cfg=dict(backend='nccl'), |
|
|
) |
|
|
|
|
|
|
|
|
visualizer = None |
|
|
|
|
|
|
|
|
log_level = 'INFO' |
|
|
|
|
|
|
|
|
load_from = None |
|
|
|
|
|
|
|
|
resume = False |
|
|
|
|
|
|
|
|
randomness = dict(seed=None, deterministic=False) |
|
|
|
|
|
|
|
|
log_processor = dict(by_epoch=False) |
|
|
|