#!/usr/bin/env bash
#
# Runs `python -m FlagEmbedding.evaluation.bright` once per entry in
# split_list, using the hanhainebula/reason-embed-basic-qwen3-4b-0928 embedder
# and the "short" task type. Inputs and outputs live under ./bright_short/.
#
# Environment:
#   HF_HUB_CACHE  Passed to the evaluator as both --cache_dir and
#                 --cache_path. Defaults to "$HOME/.cache/huggingface/hub"
#                 when unset or empty.
#
# Exit status: 0 when every split's evaluation command succeeded, otherwise
# the status of the last command that failed.
#
# NOTE: `set -e` is deliberately not enabled. A failing split must not prevent
# the remaining splits from running; failures surface via the exit status.

if [[ -z "${HF_HUB_CACHE:-}" ]]; then
  export HF_HUB_CACHE="$HOME/.cache/huggingface/hub"
fi

# Values forwarded after --dataset_names, one argument per name.
dataset_names=(
  biology
  earth_science
  economics
  psychology
  robotics
  stackoverflow
  sustainable_living
  leetcode
  pony
  aops
  theoremqa_questions
  theoremqa_theorems
)

# Embedder options shared by every split. Kept as an array so each value
# stays exactly one argument, whatever characters it contains.
model_args=(
  --embedder_name_or_path hanhainebula/reason-embed-basic-qwen3-4b-0928
  --embedder_model_class decoder-only-base
  # Single-quoted on purpose: the program receives a literal backslash
  # followed by "n", not a newline character.
  --query_instruction_format_for_retrieval 'Instruct: {}\nQuery: {}'
  --pooling_method last_token
  --devices cuda:0 cuda:1 cuda:2 cuda:3 cuda:4 cuda:5 cuda:6 cuda:7
  --cache_dir "$HF_HUB_CACHE"
  --embedder_batch_size 8
  --embedder_query_max_length 8192
  --embedder_passage_max_length 8192
)

split_list=("examples")

#######################################
# Build, log and execute the evaluation command for one split.
# Globals:   dataset_names, model_args, HF_HUB_CACHE (all read)
# Arguments: $1 - split name; used for --splits and embedded in the
#                 --output_dir and --eval_output_path values
# Outputs:   the shell-quoted command line on stdout, followed by whatever
#            the evaluation command itself prints
# Returns:   exit status of the evaluation command
#######################################
run_split() {
  local split=$1

  local -a eval_args=(
    --task_type short
    --use_special_instructions True
    --eval_name bright_short
    --dataset_dir ./bright_short/data
    --dataset_names "${dataset_names[@]}"
    --splits "$split"
    --corpus_embd_save_dir ./bright_short/corpus_embd
    --output_dir "./bright_short/search_results/$split"
    --search_top_k 2000
    --cache_path "$HF_HUB_CACHE"
    --overwrite False
    --k_values 1 10 100
    --eval_output_method markdown
    --eval_output_path "./bright_short/eval_results_$split.md"
    --eval_metrics ndcg_at_10 recall_at_10 recall_at_100
  )

  local -a cmd=(
    python -m FlagEmbedding.evaluation.bright
    "${eval_args[@]}"
    "${model_args[@]}"
  )

  # %q emits each argument shell-quoted, so the logged line can be pasted
  # back into a shell and reproduce the exact same invocation.
  printf '%q ' "${cmd[@]}"
  printf '\n'

  # Execute the array directly instead of eval-ing a string: no second round
  # of parsing, so paths with spaces or metacharacters are passed through
  # unchanged.
  "${cmd[@]}"
}

#######################################
# Run the evaluation for every split in split_list.
# Globals:   split_list (read)
# Arguments: none
# Returns:   0 if all splits succeeded, else the status of the last failure
#######################################
main() {
  local split
  local status=0

  for split in "${split_list[@]}"; do
    # Remember the failure but keep going with the remaining splits.
    run_split "$split" || status=$?
  done

  return "$status"
}

main "$@"