# AbrahamicSolver / solver_train.sh
# Gatsby767's picture
# Upload 5 files
# da64666 verified
# Solver training pipeline. In order, it:
#   1. generates questions via question_generate/question_generate.bash,
#   2. evaluates them via question_evaluate/evaluate.sh,
#   3. runs question_evaluate/upload.py with a 0.3-0.8 score window,
#   4. trains with verl.trainer.main,
#   5. merges one saved checkpoint with scripts/model_merger.py,
#   6. evaluates the merged model via evaluation/eval_math.bash.
#
# Usage:
#   bash solver_train.sh <solver_model_path> <questioner_model_path> <experiment_name>
#
# Required environment:
#   STORAGE_PATH     checkpoints are written under
#                    $STORAGE_PATH/models/<experiment_name>/
#   HUGGINGFACENAME  prefix of the training data reference
#                    ($HUGGINGFACENAME/<experiment_name>@train)
#
# All helper paths are relative, so this presumably has to be launched from
# the repository root -- TODO confirm.

if [ "$#" -lt 3 ]; then
  echo "usage: $0 <solver_model_path> <questioner_model_path> <experiment_name>" >&2
  exit 2
fi

solver_model_path=$1
questioner_model_path=$2
experiment_name=$3

# Fail early instead of silently building paths like "/models/<name>/".
: "${STORAGE_PATH:?STORAGE_PATH must be set}"
: "${HUGGINGFACENAME:?HUGGINGFACENAME must be set}"

# Checkpoint that gets merged and evaluated after training.
# NOTE(review): step 15 is hard-coded while trainer.max_steps is 20; this
# assumes the trainer config saves a checkpoint at step 15 -- confirm against
# examples/config.yaml.
checkpoint_step=15
checkpoint_root="${STORAGE_PATH}/models/${experiment_name}"
actor_dir="${checkpoint_root}/global_step_${checkpoint_step}/actor"

echo "$STORAGE_PATH"
echo "start train solver $experiment_name $solver_model_path $questioner_model_path"

export VLLM_DISABLE_COMPILE_CACHE=1

echo 'start generate question'
bash question_generate/question_generate.bash "$questioner_model_path" 1000 "$experiment_name"

echo 'start evaluate generated question'
bash question_evaluate/evaluate.sh "$solver_model_path" "$experiment_name"

echo 'start upload'
python question_evaluate/upload.py \
  --repo_name "${experiment_name}" \
  --max_score 0.8 \
  --min_score 0.3 \
  --experiment_name "${experiment_name}"

echo 'start train'
# The last argument line must NOT end with a backslash: a trailing
# continuation would join the next command onto the trainer's argument list.
python3 -m verl.trainer.main \
  config=examples/config.yaml \
  data.max_response_length=4096 \
  worker.actor.model.model_path="$solver_model_path" \
  trainer.experiment_name="${experiment_name}" \
  trainer.save_checkpoint_path="${checkpoint_root}/" \
  data.train_files="${HUGGINGFACENAME}/${experiment_name}@train" \
  trainer.total_epochs=100 \
  trainer.max_steps=20 \
  data.format_prompt=./examples/format_prompt/solver.jinja \
  trainer.val_freq=4 \
  worker.actor.micro_batch_size_per_device_for_update=1 \
  worker.actor.micro_batch_size_per_device_for_experience=1

echo "merging model"
python scripts/model_merger.py --local_dir "$actor_dir"

# Pause before evaluation (kept from the original; reason not documented).
sleep 10

echo "solver training finished"
bash evaluation/eval_math.bash "${actor_dir}/huggingface"