-
Notifications
You must be signed in to change notification settings - Fork 6
/
Copy pathrun.sh
32 lines (27 loc) · 3.24 KB
/
run.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
#!/bin/bash
#
# End-to-end pipeline driver: installs Python dependencies, prepares the
# dataset, runs pre-retrieval, then reranks every task in two passes
# (intermediate -> final) and finishes with post-processing.
#
# Every path below is relative, so run this from the directory that holds
# requirements.txt and the Python scripts.
#
# Strict mode: abort on a failing command, an unset variable, or a failing
# pipeline stage, so a broken step never feeds stale data to the next one.
set -euo pipefail

# Reranker models referenced by the passes below.
readonly JINA_MODEL='jinaai/jina-reranker-v2-base-multilingual'
readonly BGE_MODEL='BAAI/bge-reranker-v2-m3'
readonly GTE_MODEL='Alibaba-NLP/gte-multilingual-reranker-base'

# Directories shared between the passes.
readonly DATASET_DIR='./dataset'
readonly INTERMEDIATE_DIR='./results/intermediate'
readonly RESULTS_DIR='./results'

# Tasks, in the order the intermediate pass processes them.
TASKS=(FinanceBench FinQABench FinDER ConvFinQA FinQA TATQA MultiHiertt)
readonly TASKS

#######################################
# Intermediate pass for one task: rerank merge.json from the dataset
# directory with the Jina model and save into the intermediate directory
# with --save_top_k 200.
# Arguments: $1 - task name passed to rerank.py --task
# Returns:   exit status of rerank.py
#######################################
intermediate_retrieve() {
  local task=$1
  python rerank.py --task "$task" --model "$JINA_MODEL" \
    --top_k 99999 --batch_size 128 \
    --dataset_dir "$DATASET_DIR" --dataset_filename merge.json \
    --save_dir "$INTERMEDIATE_DIR" --save_top_k 200
}

#######################################
# Final pass for one task: rerank the intermediate results.json with a
# task-specific model and batch size, saving into the results directory.
# Arguments: $1 - task name passed to rerank.py --task
#            $2 - model identifier passed to --model
#            $3 - value passed to --batch_size
# Returns:   exit status of rerank.py
#######################################
final_retrieve() {
  local task=$1
  local model=$2
  local batch_size=$3
  python rerank.py --task "$task" --model "$model" \
    --top_k 200 --batch_size "$batch_size" \
    --dataset_dir "$INTERMEDIATE_DIR" --dataset_filename results.json \
    --save_dir "$RESULTS_DIR"
}

main() {
  local task

  # Install packages
  # pip uninstall -y transformer-engine # Use this if flash-attn is not installed
  pip install -r requirements.txt
  # MAX_JOBS is read by the flash-attn build (see its README) to limit
  # parallel compile jobs.
  MAX_JOBS=4 pip install flash-attn --no-build-isolation

  # Download dataset from kaggle
  python prepare_dataset.py

  # Pre-retrieval
  python pre_retrieval.py

  # Intermediate Retrieve: same model and settings for every task.
  for task in "${TASKS[@]}"; do
    intermediate_retrieve "$task"
  done

  # Final Retrieve: model and batch size are chosen per task.
  final_retrieve FinanceBench "$JINA_MODEL" 128
  final_retrieve FinQABench "$JINA_MODEL" 128
  final_retrieve FinDER "$BGE_MODEL" 4
  final_retrieve ConvFinQA "$BGE_MODEL" 4
  final_retrieve FinQA "$GTE_MODEL" 4
  final_retrieve TATQA "$BGE_MODEL" 4
  final_retrieve MultiHiertt "$JINA_MODEL" 128

  # Post-process the final results.
  python rerank.py --save_dir "$RESULTS_DIR" --dataset_dir "$DATASET_DIR" --do_post_process
}

main "$@"