Loading megatron/training.py +1 −1 Original line number Diff line number Diff line Loading @@ -311,7 +311,7 @@ def setup_model_and_optimizer(model_provider_func): # We only support local DDP with multiple micro-batches. if get_num_microbatches() > 1: assert args.DDP_impl == 'local' if len(model) == 1: if len(model) > 1: assert args.DDP_impl == 'local' if mpu.get_pipeline_model_parallel_world_size() > 1: assert args.DDP_impl == 'local' Loading Loading
megatron/training.py +1 −1 Original line number Diff line number Diff line Loading @@ -311,7 +311,7 @@ def setup_model_and_optimizer(model_provider_func): # We only support local DDP with multiple micro-batches. if get_num_microbatches() > 1: assert args.DDP_impl == 'local' if len(model) == 1: if len(model) > 1: assert args.DDP_impl == 'local' if mpu.get_pipeline_model_parallel_world_size() > 1: assert args.DDP_impl == 'local' Loading