-
Notifications
You must be signed in to change notification settings - Fork 15
/
Copy pathtune_proofstep.sh
33 lines (30 loc) · 1.01 KB
/
tune_proofstep.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
# Fine-tune ${MODEL} on the proof-step train/validation JSONL files by
# launching tune.py through the DeepSpeed launcher.
#
# All paths are resolved relative to BASE_DIR, which is the current working
# directory, so run this script from the directory that contains tune.py,
# deepspeed_config.json and data/.
BASE_DIR=.
TRAIN_FILE="${BASE_DIR}/data/leandojo_benchmark_4/processed/proofstep-train.jsonl"
VALID_FILE="${BASE_DIR}/data/leandojo_benchmark_4/processed/proofstep-val.jsonl"
MODEL="EleutherAI/pythia-2.8b-deduped"
CONFIG="${BASE_DIR}/deepspeed_config.json"
# MODEL contains a slash, so checkpoints and logs end up in a nested
# directory: ./model/EleutherAI/pythia-2.8b-deduped
OUTDIR="./model/${MODEL}"

# Every expansion below is double-quoted so a path containing whitespace or
# glob characters is passed to tune.py as a single, literal argument.
#
# --include lists eight local device indices (0-7); together with a
# per-device batch of 4 and 2 accumulation steps that is presumably
# 8 * 4 * 2 = 64 samples per optimizer step -- TODO confirm against tune.py.
#
# Evaluation and checkpointing both happen every 500 steps, and only one
# checkpoint is retained (--save_total_limit 1) while
# --load_best_model_at_end is enabled.
# NOTE(review): assumes tune.py forwards these flags to the Hugging Face
# Trainer, which requires matching save/eval schedules for
# load_best_model_at_end -- confirm.
#
# TensorBoard event files are written into OUTDIR next to the checkpoints.
deepspeed --include localhost:0,1,2,3,4,5,6,7 "${BASE_DIR}/tune.py" \
  --deepspeed "${CONFIG}" \
  --model_name_or_path "${MODEL}" \
  --train_data_path "${TRAIN_FILE}" \
  --valid_data_path "${VALID_FILE}" \
  --fp16 \
  --output_dir "${OUTDIR}" \
  --num_train_epochs 10 \
  --per_device_train_batch_size 4 \
  --per_device_eval_batch_size 4 \
  --gradient_accumulation_steps 2 \
  --evaluation_strategy "steps" \
  --eval_steps 500 \
  --save_strategy "steps" \
  --save_steps 500 \
  --save_total_limit 1 \
  --learning_rate 1e-5 \
  --load_best_model_at_end 1 \
  --weight_decay 0. \
  --warmup_ratio 0.03 \
  --lr_scheduler_type "cosine" \
  --logging_steps 10 \
  --logging_dir "${OUTDIR}" \
  --report_to="tensorboard"