lmt-arr / scripts /eval_multi.sh
sleepyhead111's picture
Upload folder using huggingface_hub
746b7a6 verified
raw
history blame
1.76 kB
#!/bin/bash
#
# Collect source / reference / hypothesis files for zh<->X translation in both
# directions and pass them to src/mt_scoring.py in a single invocation.
#
# Usage:
#   eval_multi.sh <decode_dir>
#
# Arguments:
#   decode_dir  Directory holding the hypotheses, laid out as
#               <decode_dir>/<src>2<tgt>/hypo.<src>2<tgt>.txt
#
# Inputs read relative to the repository root (two levels above this script):
#   data/flores200/zh-<lang>/test.zh-<lang>.<lang|zh>   source / reference text
#   model_card/wmt22-comet-da/checkpoints/model.ckpt    COMET-22 checkpoint
#   model_card/XCOMET-XXL/checkpoints/model.ckpt        XCOMET-XXL checkpoint
#
# NOTE: HF_HOME, HF_DATASETS_CACHE and the --record_file value are relative
# paths, so they resolve against the directory the script is launched from.
set -euxo pipefail

# Repository root = parent of the directory containing this script.
ROOT_DIR=$(dirname "$(dirname "$(readlink -f "$0")")")

# Hugging Face caches; datasets/evaluate are forced into offline mode.
export HF_HOME="./cache/"
export HF_DATASETS_CACHE="./cache/huggingface_cache/datasets"
export HF_EVALUATE_OFFLINE=1
export HF_DATASETS_OFFLINE=1

decode_dir=${1:-}
if [[ -z "$decode_dir" ]]; then
  # Kept non-fatal for backward compatibility: an empty decode_dir was accepted
  # before, but it makes every hypothesis path start at "/".
  printf 'warning: no decode_dir given; hypothesis paths will be rooted at "/"\n' >&2
fi

comet_model="$ROOT_DIR/model_card/wmt22-comet-da/checkpoints/model.ckpt"
xcomet_model="$ROOT_DIR/model_card/XCOMET-XXL/checkpoints/model.ckpt"

# Join all arguments into one comma-separated string (no trailing newline).
join_by_comma() {
  local IFS=,
  printf '%s' "$*"
}

src_files=()
ref_files=()
hypo_files=()
lang_pairs=()

for lang in en de ru bn hi th jv sw si km; do
  # Two directions per language, in this order: lang->zh, then zh->lang.
  for src in "$lang" zh; do
    if [[ "$src" == "zh" ]]; then # zh -> lang
      src_lang=zh
      tgt_lang=$lang
    else # lang -> zh
      src_lang=$lang
      tgt_lang=zh
    fi
    lp="${src_lang}2${tgt_lang}"

    # Alternative hypothesis layouts used by other decoders (enable one only):
    # hypo_file="$decode_dir/${lp}.txt"
    # hypo_file="$decode_dir/hypo.${lp}.txt"
    # hypo_file="$decode_dir/niu.${lp}.txt"
    # hypo_file="$decode_dir/hypo.${lp}.$tgt_lang"
    # hypo_file="$decode_dir/hypo_${lp}.txt"
    hypo_file="$decode_dir/$lp/hypo.${lp}.txt"

    # The data directory is always named zh-<lang>, whatever the direction;
    # only the file extension selects the source or reference side.
    src_file="$ROOT_DIR/data/flores200/zh-${lang}/test.zh-${lang}.${src_lang}"
    ref_file="$ROOT_DIR/data/flores200/zh-${lang}/test.zh-${lang}.${tgt_lang}"

    src_files+=("$src_file")
    ref_files+=("$ref_file")
    hypo_files+=("$hypo_file")
    lang_pairs+=("$lp")
  done
done

# The scorer is handed one comma-separated list per option; entries at the
# same position across the four lists belong to the same language pair.
src_file_strs=$(join_by_comma "${src_files[@]}")
ref_file_strs=$(join_by_comma "${ref_files[@]}")
hypo_file_strs=$(join_by_comma "${hypo_files[@]}")
lang_pair_strs=$(join_by_comma "${lang_pairs[@]}")

# metric="bleu,comet_22,xcomet_xxl"
metric="bleu,comet_22"

python "$ROOT_DIR/src/mt_scoring.py" \
  --metric "$metric" \
  --comet_22_path "$comet_model" \
  --xcomet_xxl_path "$xcomet_model" \
  --lang_pair "$lang_pair_strs" \
  --src_file "$src_file_strs" \
  --ref_file "$ref_file_strs" \
  --hypo_file "$hypo_file_strs" \
  --record_file "result_mt.xlsx"