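# (Hosting-page status banner "Spaces: Running Running" was captured here by the page extraction; it is not part of the script.)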
# Solver training pipeline for one experiment.
#
# Usage:
#   bash <this-script> <solver_model_path> <questioner_model_path> <experiment_name>
#
# Required environment variables:
#   STORAGE_PATH     root directory; checkpoints go to
#                    ${STORAGE_PATH}/models/<experiment_name>/
#   HUGGINGFACENAME  prefix of the training data reference
#                    ${HUGGINGFACENAME}/<experiment_name>@train
#
# Steps, in order: generate questions, evaluate them with the solver, upload
# the filtered set, train the solver, merge the checkpoint, run the math eval.

if [ "$#" -lt 3 ]; then
    echo "usage: $0 <solver_model_path> <questioner_model_path> <experiment_name>" >&2
    exit 2
fi

# Fail before any long-running step if a path component would expand to empty
# (an empty STORAGE_PATH would otherwise write checkpoints under /models/...).
: "${STORAGE_PATH:?STORAGE_PATH must be set}"
: "${HUGGINGFACENAME:?HUGGINGFACENAME must be set}"

solver_model_path=$1
questioner_model_path=$2
experiment_name=$3

# Checkpoint that is merged and evaluated after training.
# NOTE(review): step 15 is hard-coded while trainer.max_steps=20; whether a
# checkpoint exists at step 15 depends on the save frequency in
# examples/config.yaml, which is not visible here -- confirm.
checkpoint_actor_dir="${STORAGE_PATH}/models/${experiment_name}/global_step_15/actor"

echo "$STORAGE_PATH"
echo "start train solver $experiment_name $solver_model_path $questioner_model_path"

export VLLM_DISABLE_COMPILE_CACHE=1

echo 'start generate question'
# The literal 1000 is passed through unchanged; presumably the number of
# questions to generate -- confirm against question_generate.bash.
bash question_generate/question_generate.bash "$questioner_model_path" 1000 "$experiment_name"

echo 'start evaluate generated question'
bash question_evaluate/evaluate.sh "$solver_model_path" "$experiment_name"

echo 'start upload'
python question_evaluate/upload.py \
    --repo_name "${experiment_name}" \
    --max_score 0.8 \
    --min_score 0.3 \
    --experiment_name "${experiment_name}"

echo 'start train'
# The final argument line must NOT end with a backslash: a trailing
# continuation would append the following echo statement to this command.
python3 -m verl.trainer.main \
    config=examples/config.yaml \
    data.max_response_length=4096 \
    "worker.actor.model.model_path=${solver_model_path}" \
    "trainer.experiment_name=${experiment_name}" \
    "trainer.save_checkpoint_path=${STORAGE_PATH}/models/${experiment_name}/" \
    "data.train_files=${HUGGINGFACENAME}/${experiment_name}@train" \
    trainer.total_epochs=100 \
    trainer.max_steps=20 \
    data.format_prompt=./examples/format_prompt/solver.jinja \
    trainer.val_freq=4 \
    worker.actor.micro_batch_size_per_device_for_update=1 \
    worker.actor.micro_batch_size_per_device_for_experience=1

echo "merging model"
python scripts/model_merger.py --local_dir "${checkpoint_actor_dir}"

# Pause kept from the original; its purpose is not evident from this file.
sleep 10

echo "solver training finished"
# Evaluates the huggingface/ subdirectory of the actor checkpoint (presumably
# written by model_merger.py -- confirm).
bash evaluation/eval_math.bash "${checkpoint_actor_dir}/huggingface"