-
Notifications
You must be signed in to change notification settings - Fork 67
/
run_mtbench.sh
35 lines (32 loc) · 1.19 KB
/
run_mtbench.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
# Download the MT-Bench question set (pinned to FastChat v0.2.31) and store it
# as mtbench.jsonl in the current directory.
# wget -O creates/truncates the output file before the transfer starts, so a
# failed download would leave an empty or partial mtbench.jsonl behind. Remove
# it and abort rather than letting the following steps run against bad data.
if ! wget "https://raw.githubusercontent.com/lm-sys/FastChat/v0.2.31/fastchat/llm_judge/data/mt_bench/question.jsonl" -O mtbench.jsonl; then
  echo "error: failed to download MT-Bench questions to mtbench.jsonl" >&2
  rm -f -- mtbench.jsonl
  exit 1
fi
# Run 1: eval_mtbench.py with USE_LADE=0 and level/window/guess all 0
# (presumably the baseline without lookahead decoding -- confirm against
# eval_mtbench.py). CUDA selects the visible GPU(s) for this run.
# The settings are exported, so they stay set for later commands as well.
export CUDA=0
export LADE=0
export LEVEL=0
export WIN=0
export GUESS=0
export FLASH=0
export PP=0
# The "pp" suffix of the model id records $PP (the value given to --use-pp),
# not the CUDA device list, so the id describes the configuration rather than
# which GPU happened to run it. All expansions are quoted to avoid
# word-splitting/globbing if a value is ever changed (e.g. CUDA="0,1").
CUDA_VISIBLE_DEVICES="${CUDA}" USE_LADE="${LADE}" python eval_mtbench.py \
  --model-path meta-llama/Llama-2-7b-chat-hf \
  --model-id "llama-2-7b-level-${LEVEL}-win-${WIN}-guess-${GUESS}-f${FLASH}-pp${PP}" \
  --level "${LEVEL}" --window "${WIN}" --guess "${GUESS}" \
  --use-flash "${FLASH}" --use-pp "${PP}"
# Run 2: eval_mtbench.py with USE_LADE=1, level 5, window 15 and guess 15
# (presumably lookahead decoding enabled -- confirm against eval_mtbench.py).
# CUDA selects the visible GPU(s) for this run.
# The settings are exported, so they stay set for later commands as well.
export CUDA=0
export LADE=1
export LEVEL=5
export WIN=15
export GUESS=15
export FLASH=0
export PP=0
# The "pp" suffix of the model id records $PP (the value given to --use-pp),
# not the CUDA device list, so the id describes the configuration rather than
# which GPU happened to run it. All expansions are quoted to avoid
# word-splitting/globbing if a value is ever changed (e.g. CUDA="0,1").
CUDA_VISIBLE_DEVICES="${CUDA}" USE_LADE="${LADE}" python eval_mtbench.py \
  --model-path meta-llama/Llama-2-7b-chat-hf \
  --model-id "llama-2-7b-level-${LEVEL}-win-${WIN}-guess-${GUESS}-f${FLASH}-pp${PP}" \
  --level "${LEVEL}" --window "${WIN}" --guess "${GUESS}" \
  --use-flash "${FLASH}" --use-pp "${PP}"
# Run 3: start eval_mtbench.py through the deepspeed launcher on $GPUS GPU(s)
# with --use-tp-ds 1; level, window and guess are all 0 for this run.
# The model id carries a "ds<GPUS>" suffix so this run's id differs from the
# "pp" runs above.
export GPUS=1 LEVEL=0 WIN=0 GUESS=0 FLASH=0
deepspeed --num_gpus "${GPUS}" eval_mtbench.py \
  --model-path meta-llama/Llama-2-7b-chat-hf \
  --model-id "llama-2-7b-level-${LEVEL}-win-${WIN}-guess-${GUESS}-f${FLASH}-ds${GPUS}" \
  --level "${LEVEL}" --window "${WIN}" --guess "${GUESS}" \
  --use-flash "${FLASH}" --use-tp-ds 1