@@ -166,7 +166,7 @@ actor_rollout_ref:
166166 use_torch_compile : ${oc.select:actor_rollout_ref.actor.use_torch_compile,true}
167167 log_prob_micro_batch_size : null
168168 log_prob_micro_batch_size_per_gpu : null
169- log_prob_use_dynamic_bsz : ${oc.select:actor_rollout_ref.actor.use_dynamic_bsz,false}
169+ log_prob_use_dynamic_bsz : true
170170 log_prob_max_token_len_per_gpu : ${oc.select:actor_rollout_ref.actor.ppo_max_token_len_per_gpu,16384}
171171 profiler :
172172 _target_ : verl.utils.profiler.ProfilerConfig
@@ -248,7 +248,7 @@ actor_rollout_ref:
248248 dtype : bfloat16
249249 gpu_memory_utilization : 0.80
250250 ignore_eos : false
251- enforce_eager : false
251+ enforce_eager : true
252252 cudagraph_capture_sizes : null
253253 free_cache_engine : true
254254 tensor_model_parallel_size : 1
@@ -265,7 +265,7 @@ actor_rollout_ref:
265265 load_format : dummy
266266 log_prob_micro_batch_size : null
267267 log_prob_micro_batch_size_per_gpu : 1
268- log_prob_use_dynamic_bsz : ${oc.select:actor_rollout_ref.actor.use_dynamic_bsz,false}
268+ log_prob_use_dynamic_bsz : true
269269 log_prob_max_token_len_per_gpu : ${oc.select:actor_rollout_ref.actor.ppo_max_token_len_per_gpu,16384}
270270 disable_log_stats : true
271271 do_sample : true
@@ -508,7 +508,7 @@ critic:
508508 ppo_mini_batch_size : ${oc.select:actor_rollout_ref.actor.ppo_mini_batch_size,256}
509509 ppo_micro_batch_size : null
510510 ppo_micro_batch_size_per_gpu : ${oc.select:.ppo_micro_batch_size,null}
511- use_dynamic_bsz : ${oc.select:actor_rollout_ref.actor.use_dynamic_bsz,false}
511+ use_dynamic_bsz : true
512512 ppo_max_token_len_per_gpu : 32768
513513 forward_max_token_len_per_gpu : ${.ppo_max_token_len_per_gpu}
514514 ppo_epochs : ${oc.select:actor_rollout_ref.actor.ppo_epochs,1}
0 commit comments