-
Notifications
You must be signed in to change notification settings - Fork 35
/
bbh.sh
32 lines (26 loc) · 844 Bytes
/
bbh.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
# Prepare the BBH dataset under data/eval/bbh, downloading it on first run.
# Abort on the first failing command or unset variable so that a broken
# download never falls through to an evaluation run against missing data.
set -eu

# Restrict CUDA to devices 0 and 1 for everything launched by this script.
export CUDA_VISIBLE_DEVICES=0,1

DATA_DIR=data/eval/bbh
DOWNLOAD_DIR=data/downloads

# Creates data/ and data/eval/ (the parent of DATA_DIR) in one step; the
# dataset directory itself is created by the mv below.
mkdir -p "${DATA_DIR%/*}"

if [ ! -d "$DATA_DIR" ]; then
  echo "Downloading BBH data..."
  mkdir -p "$DOWNLOAD_DIR"
  wget -O "$DOWNLOAD_DIR/bbh_data.zip" https://github.com/suzgunmirac/BIG-Bench-Hard/archive/refs/heads/main.zip
  # -o: overwrite without prompting, so a rerun after a half-finished
  # extraction does not block waiting for interactive confirmation.
  unzip -o "$DOWNLOAD_DIR/bbh_data.zip" -d "$DOWNLOAD_DIR/bbh"
  # The archive is expected to unpack into a single BIG-Bench-Hard-main/
  # directory, which becomes the dataset directory.
  mv "$DOWNLOAD_DIR/bbh/BIG-Bench-Hard-main" "$DATA_DIR"
  # Only reached when the move succeeded (set -e), matching the original
  # "mv ... && rm -rf" cleanup of the staging area.
  rm -rf "$DOWNLOAD_DIR"
fi
# Run the BBH evaluation module on the configured model.
# MODEL_DIR is passed as both --model and --tokenizer.
MODEL_DIR=codellama/CodeLlama-7b-Instruct-hf
# NOTE(review): the directory is named llama-2-7b-hf although MODEL_DIR points
# at CodeLlama-7b-Instruct. The path is kept unchanged so anything that reads
# existing results keeps working; confirm whether this is a copy-paste leftover.
OUTPUT_DIR=results/bbh/llama-2-7b-hf

# DATA_DIR is set earlier in this script; the fallback is the same path the
# command used when it was hard-coded here. Expansions are quoted so paths
# containing spaces or glob characters are passed as single arguments.
python -m xchat.eval.bbh.run_eval \
  --data_dir "${DATA_DIR:-data/eval/bbh}/" \
  --save_dir "$OUTPUT_DIR" \
  --model "$MODEL_DIR" \
  --tokenizer "$MODEL_DIR" \
  --eval_batch_size 20 \
  --load_in_8bit \
  --no_cot \
  --chat_format codellama-instruct