Require model.optim.overlap_grad_sync to be True for this checkpoint

Signed-off-by: Terry Kong <terryk@nvidia.com>
NVIDIA · Nov 22, 2024 · 7f75e47 · 7f75e47
1 parent 79eed88
commit 7f75e47
Showing 1 changed file with 1 addition and 1 deletion.
diff --git a/tests/functional/ppo.sh b/tests/functional/ppo.sh
@@ -82,7 +82,7 @@ python -u ${GPFS}/examples/nlp/gpt/serve_ppo_critic.py \
     ++model.global_batch_size=1 \
     ++model.tensor_model_parallel_size=1 \
     ++model.optim.bucket_cap_mb=200 \
-    ++model.optim.overlap_grad_sync=False \
+    ++model.optim.overlap_grad_sync=True \
     ++model.optim.contiguous_grad_buffer=True \
     ++trainer.ppo.pad_sequence_length_to_multiple=32 \
     model.reward_standardization.enable=True \