Skip to content

Commit

Permalink
Fix nemo2 interface for ucc
Browse files (browse the repository at this point in the history)
Signed-off-by: Guyue Huang <guyueh@login-preos01.a51.clusters.nvidia.com>
  • Loading branch information
Guyue Huang committed Jan 4, 2025
1 parent af35a8c commit 90a99d3
Show file tree
Hide file tree
Showing 2 changed files with 2 additions and 1 deletion.
2 changes: 1 addition & 1 deletion nemo/lightning/_strategy_lib.py
Original file line number Diff line number Diff line change
Expand Up @@ -82,7 +82,7 @@ def init_parallel_ranks(
tensor_model_parallel_size=parallel_config.tensor_model_parallel_size,
expert_model_parallel_size=parallel_config.expert_model_parallel_size,
pipeline_model_parallel_size=parallel_config.pipeline_model_parallel_size,
- pipeline_model_parallel_comm_backend=parallel_config.get('pipeline_model_parallel_comm_backend', 'nccl'),
+ pipeline_model_parallel_comm_backend=parallel_config.pipeline_model_parallel_comm_backend,
virtual_pipeline_model_parallel_size=parallel_config.virtual_pipeline_model_parallel_size,
context_parallel_size=parallel_config.context_parallel_size,
encoder_tensor_model_parallel_size=getattr(parallel_config, "encoder_tensor_model_parallel_size", 0),
Expand Down
1 change: 1 addition & 0 deletions nemo/lightning/pytorch/strategies/megatron_strategy.py
Original file line number Diff line number Diff line change
Expand Up @@ -905,6 +905,7 @@ def parallelism(self) -> ParallelismConfig:
return ParallelismConfig(
tensor_model_parallel_size=self.tensor_model_parallel_size,
pipeline_model_parallel_size=self.pipeline_model_parallel_size,
+ pipeline_model_parallel_comm_backend=self.pipeline_model_parallel_comm_backend,
virtual_pipeline_model_parallel_size=self.virtual_pipeline_model_parallel_size,
microbatch_group_size_per_vp_stage=self.microbatch_group_size_per_vp_stage,
context_parallel_size=self.context_parallel_size,
Expand Down

0 comments on commit 90a99d3

Please sign in to comment.