huggingface
diff --git a/scripts/convert_cogview3_to_diffusers.py b/scripts/convert_cogview3_to_diffusers.py
Lines changed: 1 addition & 1 deletion
diff --git a/scripts/convert_flux_to_diffusers.py b/scripts/convert_flux_to_diffusers.py
Lines changed: 1 addition & 1 deletion
diff --git a/scripts/convert_mochi_to_diffusers.py b/scripts/convert_mochi_to_diffusers.py
Lines changed: 1 addition & 1 deletion
diff --git a/scripts/convert_sd3_to_diffusers.py b/scripts/convert_sd3_to_diffusers.py
Lines changed: 1 addition & 1 deletion
diff --git a/src/diffusers/models/autoencoders/autoencoder_kl_mochi.py b/src/diffusers/models/autoencoders/autoencoder_kl_mochi.py
Lines changed: 3 additions & 2 deletions
diff --git a/tests/single_file/single_file_testing_utils.py b/tests/single_file/single_file_testing_utils.py
Lines changed: 2 additions & 2 deletions
diff --git a/tests/single_file/test_model_controlnet_single_file.py b/tests/single_file/test_model_controlnet_single_file.py
Lines changed: 6 additions & 4 deletions
diff --git a/tests/single_file/test_model_sd_cascade_unet_single_file.py b/tests/single_file/test_model_sd_cascade_unet_single_file.py
Lines changed: 6 additions & 4 deletions
diff --git a/tests/single_file/test_model_vae_single_file.py b/tests/single_file/test_model_vae_single_file.py
Lines changed: 5 additions & 4 deletions
diff --git a/tests/single_file/test_stable_diffusion_controlnet_img2img_single_file.py b/tests/single_file/test_stable_diffusion_controlnet_img2img_single_file.py
Lines changed: 5 additions & 4 deletions
@@ -36,7 +36,7 @@
 from diffusers.utils.import_utils import is_accelerate_available
 
 
-CTX = init_empty_weights if is_accelerate_available else nullcontext
+CTX = init_empty_weights if is_accelerate_available() else nullcontext
 
 TOKENIZER_MAX_LENGTH = 224
 
 
@@ -31,7 +31,7 @@
 --vae
 """
 
-CTX = init_empty_weights if is_accelerate_available else nullcontext
+CTX = init_empty_weights if is_accelerate_available() else nullcontext
 
 parser = argparse.ArgumentParser()
 parser.add_argument("--original_state_dict_repo_id", default=None, type=str)
 
@@ -10,7 +10,7 @@
 from diffusers.utils.import_utils import is_accelerate_available
 
 
-CTX = init_empty_weights if is_accelerate_available else nullcontext
+CTX = init_empty_weights if is_accelerate_available() else nullcontext
 
 TOKENIZER_MAX_LENGTH = 256
 
 
@@ -11,7 +11,7 @@
 from diffusers.utils.import_utils import is_accelerate_available
 
 
-CTX = init_empty_weights if is_accelerate_available else nullcontext
+CTX = init_empty_weights if is_accelerate_available() else nullcontext
 
 parser = argparse.ArgumentParser()
 parser.add_argument("--checkpoint_path", type=str)
 
@@ -437,7 +437,8 @@ def __init__(self, start: int = 6, stop: int = 8, step: int = 1):
 
     def forward(self, inputs: torch.Tensor) -> torch.Tensor:
         r"""Forward method of the `FourierFeatures` class."""
-
+        original_dtype = inputs.dtype
+        inputs = inputs.to(torch.float32)
         num_channels = inputs.shape[1]
         num_freqs = (self.stop - self.start) // self.step
 
@@ -450,7 +451,7 @@ def forward(self, inputs: torch.Tensor) -> torch.Tensor:
         # Scale channels by frequency.
         h = w * h
 
-        return torch.cat([inputs, torch.sin(h), torch.cos(h)], dim=1)
+        return torch.cat([inputs, torch.sin(h), torch.cos(h)], dim=1).to(original_dtype)
 
 
 class MochiEncoder3D(nn.Module):
 
@@ -156,14 +156,14 @@ def test_single_file_components_with_original_config_local_files_only(
     def test_single_file_format_inference_is_same_as_pretrained(self, expected_max_diff=1e-4):
         sf_pipe = self.pipeline_class.from_single_file(self.ckpt_path, safety_checker=None)
         sf_pipe.unet.set_attn_processor(AttnProcessor())
-        sf_pipe.enable_model_cpu_offload()
+        sf_pipe.enable_model_cpu_offload(device=torch_device)
 
         inputs = self.get_inputs(torch_device)
         image_single_file = sf_pipe(**inputs).images[0]
 
         pipe = self.pipeline_class.from_pretrained(self.repo_id, safety_checker=None)
         pipe.unet.set_attn_processor(AttnProcessor())
-        pipe.enable_model_cpu_offload()
+        pipe.enable_model_cpu_offload(device=torch_device)
 
         inputs = self.get_inputs(torch_device)
         image = pipe(**inputs).images[0]
 
@@ -22,17 +22,19 @@
     ControlNetModel,
 )
 from diffusers.utils.testing_utils import (
+    backend_empty_cache,
     enable_full_determinism,
-    require_torch_gpu,
+    require_torch_accelerator,
     slow,
+    torch_device,
 )
 
 
 enable_full_determinism()
 
 
 @slow
-@require_torch_gpu
+@require_torch_accelerator
 class ControlNetModelSingleFileTests(unittest.TestCase):
     model_class = ControlNetModel
     ckpt_path = "https://huggingface.co/lllyasviel/ControlNet-v1-1/blob/main/control_v11p_sd15_canny.pth"
@@ -41,12 +43,12 @@ class ControlNetModelSingleFileTests(unittest.TestCase):
     def setUp(self):
         super().setUp()
         gc.collect()
-        torch.cuda.empty_cache()
+        backend_empty_cache(torch_device)
 
     def tearDown(self):
         super().tearDown()
         gc.collect()
-        torch.cuda.empty_cache()
+        backend_empty_cache(torch_device)
 
     def test_single_file_components(self):
         model = self.model_class.from_pretrained(self.repo_id)
 
@@ -21,9 +21,11 @@
 from diffusers import StableCascadeUNet
 from diffusers.utils import logging
 from diffusers.utils.testing_utils import (
+    backend_empty_cache,
     enable_full_determinism,
-    require_torch_gpu,
+    require_torch_accelerator,
     slow,
+    torch_device,
 )
 
 
@@ -33,17 +35,17 @@
 
 
 @slow
-@require_torch_gpu
+@require_torch_accelerator
 class StableCascadeUNetSingleFileTest(unittest.TestCase):
     def setUp(self):
         super().setUp()
         gc.collect()
-        torch.cuda.empty_cache()
+        backend_empty_cache(torch_device)
 
     def tearDown(self):
         super().tearDown()
         gc.collect()
-        torch.cuda.empty_cache()
+        backend_empty_cache(torch_device)
 
     def test_single_file_components_stage_b(self):
         model_single_file = StableCascadeUNet.from_single_file(
 
@@ -22,10 +22,11 @@
     AutoencoderKL,
 )
 from diffusers.utils.testing_utils import (
+    backend_empty_cache,
     enable_full_determinism,
     load_hf_numpy,
     numpy_cosine_similarity_distance,
-    require_torch_gpu,
+    require_torch_accelerator,
     slow,
     torch_device,
 )
@@ -35,7 +36,7 @@
 
 
 @slow
-@require_torch_gpu
+@require_torch_accelerator
 class AutoencoderKLSingleFileTests(unittest.TestCase):
     model_class = AutoencoderKL
     ckpt_path = (
@@ -48,12 +49,12 @@ class AutoencoderKLSingleFileTests(unittest.TestCase):
     def setUp(self):
         super().setUp()
         gc.collect()
-        torch.cuda.empty_cache()
+        backend_empty_cache(torch_device)
 
     def tearDown(self):
         super().tearDown()
         gc.collect()
-        torch.cuda.empty_cache()
+        backend_empty_cache(torch_device)
 
     def get_file_format(self, seed, shape):
         return f"gaussian_noise_s={seed}_shape={'_'.join([str(s) for s in shape])}.npy"
 
@@ -8,9 +8,10 @@
 from diffusers.loaders.single_file_utils import _extract_repo_id_and_weights_name
 from diffusers.utils import load_image
 from diffusers.utils.testing_utils import (
+    backend_empty_cache,
     enable_full_determinism,
     numpy_cosine_similarity_distance,
-    require_torch_gpu,
+    require_torch_accelerator,
     slow,
     torch_device,
 )
@@ -27,7 +28,7 @@
 
 
 @slow
-@require_torch_gpu
+@require_torch_accelerator
 class StableDiffusionControlNetPipelineSingleFileSlowTests(unittest.TestCase, SDSingleFileTesterMixin):
     pipeline_class = StableDiffusionControlNetPipeline
     ckpt_path = (
@@ -41,12 +42,12 @@ class StableDiffusionControlNetPipelineSingleFileSlowTests(unittest.TestCase, SD
     def setUp(self):
         super().setUp()
         gc.collect()
-        torch.cuda.empty_cache()
+        backend_empty_cache(torch_device)
 
     def tearDown(self):
         super().tearDown()
         gc.collect()
-        torch.cuda.empty_cache()
+        backend_empty_cache(torch_device)
 
     def get_inputs(self, device, generator_device="cpu", dtype=torch.float32, seed=0):
         generator = torch.Generator(device=generator_device).manual_seed(seed)