diff --git a/tests/test_tipc/dygraph/hybrid_parallelism/llama2/auto_config_llama2_70b/pretrain-llama2_70b-auto_tuner.json b/tests/test_tipc/dygraph/hybrid_parallelism/llama2/auto_config_llama2_70b/pretrain-llama2_70b-auto_tuner.json index 2f36b770b806..2c3d5a57622e 100644 --- a/tests/test_tipc/dygraph/hybrid_parallelism/llama2/auto_config_llama2_70b/pretrain-llama2_70b-auto_tuner.json +++ b/tests/test_tipc/dygraph/hybrid_parallelism/llama2/auto_config_llama2_70b/pretrain-llama2_70b-auto_tuner.json @@ -11,7 +11,7 @@ "sharding": "stage1", "sharding_parallel_config": "split_param enable_stage1_overlap", "tensor_parallel_config": "enable_delay_scale_loss enable_mp_async_allreduce enable_mp_skip_c_identity enable_mp_fused_linear_param_grad_add", - "pipeline_parallel_config": "enable_delay_scale_loss enable_release_grads disable_partial_send_recv", + "pipeline_parallel_config": "enable_delay_scale_loss enable_release_grads disable_partial_send_recv enable_overlap_p2p_comm", "virtual_pp_degree": 5, "sequence_parallel": 1, "use_flash_attention": true,