2024-10-29 16:56:11 +08:00

38 lines
930 B
Bash

# Run the FlagEmbedding MIRACL evaluation (`--eval_name miracl`, `--splits dev`)
# with BAAI/bge-m3 as embedder and BAAI/bge-reranker-v2-m3 as reranker.
#
# Requires bash (arrays, printf -v).
#
# Environment:
#   HF_HUB_CACHE  Forwarded as both --cache_path and --cache_dir. When unset
#                 or empty it defaults to $HOME/.cache/huggingface/hub and is
#                 exported.
#
# The command line is assembled as an array and executed directly rather than
# being flattened into a string and passed through `eval`. That way a cache
# path containing spaces, globs or shell metacharacters reaches python as
# exactly one, uninterpreted argument.

if [[ -z "${HF_HUB_CACHE:-}" ]]; then
  export HF_HUB_CACHE="$HOME/.cache/huggingface/hub"
fi

# Values forwarded to --dataset_names, one array element per name.
dataset_names=(bn hi sw te th yo)

#######################################
# Build the full evaluation command line.
# Globals:   HF_HUB_CACHE (read), dataset_names (read), cmd (written, array)
# Arguments: none
# Outputs:   nothing; the result is stored in the global array `cmd`
#######################################
build_miracl_cmd() {
  local -a eval_args model_args

  eval_args=(
    --eval_name miracl
    --dataset_dir ./miracl/data
    --dataset_names "${dataset_names[@]}"
    --splits dev
    --corpus_embd_save_dir ./miracl/corpus_embd
    --output_dir ./miracl/search_results
    --search_top_k 1000 --rerank_top_k 100
    --cache_path "$HF_HUB_CACHE"
    --overwrite False
    --k_values 10 100
    --eval_output_method markdown
    --eval_output_path ./miracl/miracl_eval_results.md
    --eval_metrics ndcg_at_10 recall_at_100
  )

  model_args=(
    --embedder_name_or_path BAAI/bge-m3
    --reranker_name_or_path BAAI/bge-reranker-v2-m3
    --devices cuda:0 cuda:1
    --cache_dir "$HF_HUB_CACHE"
    --reranker_max_length 1024
  )

  cmd=(
    python -m FlagEmbedding.evaluation.miracl
    "${eval_args[@]}"
    "${model_args[@]}"
  )
}

build_miracl_cmd

# Log the command on one line. %q shell-quotes each argument, so the line can
# be pasted back into a shell even when an argument contains spaces; for
# ordinary values the output is the plain space-separated command.
printf -v cmd_display '%q ' "${cmd[@]}"
printf '%s\n' "${cmd_display% }"

# Keep this as the last command so the script exits with python's status.
"${cmd[@]}"