# vlm_clone_2 / VILA /scripts /v1_5 /eval /chartqa.sh
# tuandunghcmut's picture
# Add files using upload-large-folder tool
# c7702b8 verified
#!/bin/bash
#
# Run the ChartQA evaluation for one checkpoint on both test splits
# (test_human and test_augmented).
#
# Usage: chartqa.sh MODEL_PATH CKPT [CONV_MODE]
#   MODEL_PATH  forwarded to llava/eval/evaluate_vqa.py as --model-path
#   CKPT        name used to build the output path
#               runs/eval/CKPT/chartqa/answersN/merge.jsonl
#   CONV_MODE   forwarded as --conv-mode (default: vicuna_v1)
#
# For each split the script launches llava/eval/evaluate_vqa.py through
# torchrun with 8 processes per node, then passes the same answers file to
# llava.eval.evaluate_vqa_score with --metric relaxed_accuracy.
# Paths are relative, so the script must be started from the directory that
# contains llava/ and playground/.

# Fail fast: without this a failed generation step would still be "scored"
# against a missing or stale merge.jsonl from a previous run.
set -euo pipefail

if [[ "$#" -lt 2 || -z "$1" || -z "$2" ]]; then
  printf 'Usage: %s MODEL_PATH CKPT [CONV_MODE]\n' "${0##*/}" >&2
  exit 2
fi

MODEL_PATH=$1
CKPT=$2
# An omitted or empty third argument falls back to the default template.
CONV_MODE=${3:-vicuna_v1}

#######################################
# Generate answers for one ChartQA split and score them.
# Globals:   MODEL_PATH, CKPT, CONV_MODE (read)
# Arguments: $1 - split name (e.g. test_human); selects both the --dataset
#                 name chartqa_<split> and the data file <split>.jsonl
#            $2 - answers subdirectory under runs/eval/CKPT/chartqa
# Returns:   non-zero if either the generation or the scoring command fails
#######################################
run_split() {
  local split=$1
  local answers_dir=$2
  local answers_file="runs/eval/${CKPT}/chartqa/${answers_dir}/merge.jsonl"

  torchrun --nproc-per-node=8 \
    llava/eval/evaluate_vqa.py \
    --model-path "$MODEL_PATH" \
    --conv-mode "$CONV_MODE" \
    --generation-config '{"max_new_tokens": 100}' \
    --dataset "chartqa_${split}" \
    --image-folder ./playground/data/eval/chartqa \
    --data-path "./playground/data/eval/chartqa/${split}.jsonl" \
    --answers-file "$answers_file"

  python -m llava.eval.evaluate_vqa_score \
    --answers-file "$answers_file" \
    --metric relaxed_accuracy
}

run_split test_human answers1
run_split test_augmented answers2