@@ -8,6 +8,12 @@ MODEL_PATH=${MODEL_PATH:-${HOME}/models/${MODEL_ID}}
88
# Environment-overridable settings. Each uses ${VAR:-default}, so the default
# applies when the variable is unset OR set to the empty string. Defaults must
# not contain stray whitespace: the values are spliced verbatim into
# key=value overrides on the trainer command line below.

# Training / validation parquet files (defaults live under ${HOME}/data/gsm8k).
TRAIN_FILES=${TRAIN_FILES:-${HOME}/data/gsm8k/train.parquet}
VAL_FILES=${VAL_FILES:-${HOME}/data/gsm8k/test.parquet}

# Forwarded to trainer.val_before_train.
VAL_BEFORE_TRAIN=${VAL_BEFORE_TRAIN:-False}

# Forwarded to trainer.n_gpus_per_node.
NUM_GPUS=${NUM_GPUS:-8}

# Forwarded to actor_rollout_ref.actor.veomni.data_parallel_size,
# .ulysses_parallel_size and .expert_parallel_size respectively.
# NOTE(review): presumably these sizes must be consistent with NUM_GPUS;
# this script does not check that -- confirm against the trainer's rules.
FSDP_SIZE=${FSDP_SIZE:-4}
SP_SIZE=${SP_SIZE:-2}
EP_SIZE=${EP_SIZE:-2}

# Forwarded to trainer.experiment_name.
VERL_EXP_NAME=${VERL_EXP_NAME:-qwen2.5-0.5b-function-reward-minimal-fsdp-size8}
1117
1218python3 -m verl.trainer.main_ppo --config-path=config\
1319 --config-name=" ppo_veomni_trainer.yaml" \
@@ -33,8 +39,9 @@ python3 -m verl.trainer.main_ppo --config-path=config\
3339 actor_rollout_ref.actor.kl_loss_type=low_var_kl \
3440 actor_rollout_ref.actor.entropy_coeff=0 \
3541 actor_rollout_ref.actor.use_torch_compile=False \
36- actor_rollout_ref.actor.veomni.data_parallel_size=4 \
37- actor_rollout_ref.actor.veomni.ulysses_parallel_size=2 \
42+ actor_rollout_ref.actor.veomni.data_parallel_size=" ${FSDP_SIZE} " \
43+ actor_rollout_ref.actor.veomni.ulysses_parallel_size=" ${SP_SIZE} " \
44+ actor_rollout_ref.actor.veomni.expert_parallel_size=" ${EP_SIZE} " \
3845 actor_rollout_ref.ref.log_prob_micro_batch_size_per_gpu=1 \
3946 actor_rollout_ref.ref.veomni.param_offload=True \
4047 actor_rollout_ref.ref.use_torch_compile=False \
@@ -54,8 +61,9 @@ python3 -m verl.trainer.main_ppo --config-path=config\
5461 trainer.critic_warmup=0 \
5562 trainer.logger=console \
5663 trainer.project_name=' verl_grpo_example_gsm8k' \
57- trainer.experiment_name=' qwen25_05b_function_rm' \
58- trainer.n_gpus_per_node=8 \
64+ trainer.experiment_name=" ${VERL_EXP_NAME} " \
65+ trainer.n_gpus_per_node=" ${NUM_GPUS} " \
66+ trainer.val_before_train=" ${VAL_BEFORE_TRAIN} " \
5967 trainer.nnodes=1 \
6068 trainer.save_freq=-1 \
6169 trainer.test_freq=-1 \
0 commit comments