diff --git a/accelerator/mps_accelerator.py b/accelerator/mps_accelerator.py index 1083ba14d27e..aa8e86ef1ce0 100644 --- a/accelerator/mps_accelerator.py +++ b/accelerator/mps_accelerator.py @@ -26,7 +26,8 @@ def is_synchronized_device(self): return False def use_host_timers(self): - return self.is_synchronized_device() + # Event timers are not supported on MPS + return True def resolves_data_dependency(self): return self.is_synchronized_device() diff --git a/deepspeed/runtime/engine.py b/deepspeed/runtime/engine.py index a1bcf3d9943a..01468d87e42a 100755 --- a/deepspeed/runtime/engine.py +++ b/deepspeed/runtime/engine.py @@ -457,6 +457,9 @@ def __init__(self, self._is_compiled_autograd_enabled = False self._compile_kwargs = {} + if self.dist_backend is None: + self.enable_backward_allreduce = False + def _optimized_linear_offload_setup(self): self.optimized_linear_base_weight_sharding = False self.optimized_linear_lora_enabled = False @@ -1309,6 +1312,8 @@ def _do_sanity_check(self): f'Client Optimizer (type = {type(self.client_optimizer)} is not instantiated but Client LR Scheduler is instantiated' def _broadcast_model(self): + if self.dist_backend is None: + return def is_replicated(p): if hasattr(p, "ds_status") and p.ds_status is not ZeroParamStatus.AVAILABLE: