-
Notifications
You must be signed in to change notification settings - Fork 826
/
eval_TruthfulQA.sh
25 lines (25 loc) · 1.64 KB
/
eval_TruthfulQA.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
cd model
python ChatGPT.py --api_key your_api_key --dataset TruthfulQA
python Claude.py --api_key your_api_key --dataset TruthfulQA
python davinci-003.py --api_key your_api_key --dataset TruthfulQA
python davinci-002.py --api_key your_api_key --dataset TruthfulQA
python Vicuna.py --dataset TruthfulQA --device 0 --model-path lmsys/vicuna-7b-delta-v1.1
python Alpaca.py --dataset TruthfulQA --device 0 --model-path chainyo/alpaca-lora-7b
python ChatGLM.py --dataset TruthfulQA --device 0 --model-path THUDM/chatglm-6b
python LLaMA.py --dataset TruthfulQA --device 0 --model-path decapoda-research/llama-7b-hf
python Falcon.py --dataset TruthfulQA --device 0 --model-path tiiuae/falcon-7b-instruct
python Pythia.py --dataset TruthfulQA --device 0 --model-path EleutherAI/pythia-6.9b --save_path Pythia-7b
python Pythia.py --dataset TruthfulQA --device 0 --model-path EleutherAI/pythia-12b --save_path Pythia-12b
cd ../metric
python eval_truthfulqa.py --api_key your_api_key --model gpt-3.5-turbo
python eval_truthfulqa.py --api_key your_api_key --model Claude
python eval_truthfulqa.py --api_key your_api_key --model davinci-003
python eval_truthfulqa.py --api_key your_api_key --model davinci-002
python eval_truthfulqa.py --api_key your_api_key --model Vicuna
python eval_truthfulqa.py --api_key your_api_key --model Alpaca
python eval_truthfulqa.py --api_key your_api_key --model ChatGLM
python eval_truthfulqa.py --api_key your_api_key --model Falcon
python eval_truthfulqa.py --api_key your_api_key --model LlaMA
python eval_truthfulqa.py --api_key your_api_key --model Pythia-7b
python eval_truthfulqa.py --api_key your_api_key --model Pythia-12b
python cal_truth_res.py