Skip to content

Commit 27ed776

Browse files
Authored by rezaqorbani (Reza Qorbani) and co-authors
Fix hf_device_map device comparison in prepare_model (#3895)
Co-authored-by: Reza Qorbani <[email protected]>
1 parent 4bf9964 commit 27ed776

File tree

2 files changed: +27 −1 lines changed

src/accelerate/accelerator.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1811,10 +1811,11 @@ def prepare_model(
18111811
else:
18121812
current_device_index = current_device
18131813

1814+
current_device_index = int(current_device_index) if current_device_index is not None else None
18141815
if self.device.type == "cpu" and is_bitsandbytes_multi_backend_available():
18151816
# bnb with multi-backend supports CPU which don't need to check index.
18161817
pass
1817-
elif torch.device(current_device_index) != self.device:
1818+
elif torch.device(self.device.type, current_device_index) != self.device:
18181819
# if on the first device (GPU 0) we don't care
18191820
if (self.device.index is not None) or (current_device_index != 0):
18201821
raise ValueError(

tests/test_accelerator.py

Lines changed: 25 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -44,6 +44,7 @@
4444
)
4545
from accelerate.test_utils.testing import (
4646
AccelerateTestCase,
47+
assert_exception,
4748
require_cuda,
4849
require_non_torch_xla,
4950
require_torchdata_stateful_dataloader,
@@ -861,3 +862,27 @@ def forward(self, x):
861862
# weight is on the meta device, we need a `value` to put in on 0
862863
x = torch.randn(1, 2)
863864
my_model(x)
865+
866+
@require_non_torch_xla
867+
def test_prepare_model_8bit_cpu_offload_raises_valueerror_not_typeerror(self):
868+
class ModelForTest(torch.nn.Module):
869+
def __init__(self):
870+
super().__init__()
871+
self.l = torch.nn.Linear(2, 2)
872+
873+
def forward(self, x):
874+
return self.l(x)
875+
876+
accelerator = Accelerator()
877+
model = ModelForTest()
878+
879+
# Trigger the 8-bit/4-bit + hf_device_map code path.
880+
model.is_loaded_in_8bit = True
881+
model.hf_device_map = {"": "cpu"}
882+
883+
with (
884+
patch("accelerate.accelerator.is_bitsandbytes_multi_backend_available", return_value=False),
885+
patch("accelerate.accelerator.is_xpu_available", return_value=False),
886+
):
887+
with assert_exception(ValueError, "CPU or disk offload"):
888+
accelerator.prepare_model(model)

0 commit comments

Comments (0)