From 3eea0b822a39dc46ab8883a4dabe72776870dbd3 Mon Sep 17 00:00:00 2001 From: Alireza Farashah Date: Wed, 22 Oct 2025 17:53:01 -0400 Subject: [PATCH 1/2] Fix small inconsistency in output dimension of t5 embeds when text_encoder_3 is None --- .../pipelines/stable_diffusion_3/pipeline_stable_diffusion_3.py | 2 +- .../stable_diffusion_3/pipeline_stable_diffusion_3_img2img.py | 2 +- .../stable_diffusion_3/pipeline_stable_diffusion_3_inpaint.py | 2 +- 3 files changed, 3 insertions(+), 3 deletions(-) diff --git a/src/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3.py b/src/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3.py index 1618f89a49e3..3b7b26dc636c 100644 --- a/src/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3.py +++ b/src/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3.py @@ -248,7 +248,7 @@ def _get_t5_prompt_embeds( return torch.zeros( ( batch_size * num_images_per_prompt, - self.tokenizer_max_length, + max_sequence_length, self.transformer.config.joint_attention_dim, ), device=device, diff --git a/src/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_img2img.py b/src/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_img2img.py index 7e97909f42ca..db047f19924d 100644 --- a/src/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_img2img.py +++ b/src/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_img2img.py @@ -272,7 +272,7 @@ def _get_t5_prompt_embeds( return torch.zeros( ( batch_size * num_images_per_prompt, - self.tokenizer_max_length, + max_sequence_length, self.transformer.config.joint_attention_dim, ), device=device, diff --git a/src/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_inpaint.py b/src/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_inpaint.py index 5b2cca0378cd..c95fa530c8d7 100644 --- 
a/src/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_inpaint.py +++ b/src/diffusers/pipelines/stable_diffusion_3/pipeline_stable_diffusion_3_inpaint.py @@ -278,7 +278,7 @@ def _get_t5_prompt_embeds( return torch.zeros( ( batch_size * num_images_per_prompt, - self.tokenizer_max_length, + max_sequence_length, self.transformer.config.joint_attention_dim, ), device=device, From 5dd8a107086cef5cf730c042587625b4a9e65d87 Mon Sep 17 00:00:00 2001 From: Alireza Farashah Date: Fri, 24 Oct 2025 17:35:05 -0400 Subject: [PATCH 2/2] Use max_sequence_length for zero T5 embeds in SD3 ControlNet and PAG pipelines --- .../controlnet_sd3/pipeline_stable_diffusion_3_controlnet.py | 2 +- .../pipeline_stable_diffusion_3_controlnet_inpainting.py | 2 +- src/diffusers/pipelines/pag/pipeline_pag_sd_3.py | 2 +- src/diffusers/pipelines/pag/pipeline_pag_sd_3_img2img.py | 2 +- 4 files changed, 4 insertions(+), 4 deletions(-) diff --git a/src/diffusers/pipelines/controlnet_sd3/pipeline_stable_diffusion_3_controlnet.py b/src/diffusers/pipelines/controlnet_sd3/pipeline_stable_diffusion_3_controlnet.py index c763411ab5f7..f67a0e211281 100644 --- a/src/diffusers/pipelines/controlnet_sd3/pipeline_stable_diffusion_3_controlnet.py +++ b/src/diffusers/pipelines/controlnet_sd3/pipeline_stable_diffusion_3_controlnet.py @@ -266,7 +266,7 @@ def _get_t5_prompt_embeds( return torch.zeros( ( batch_size * num_images_per_prompt, - self.tokenizer_max_length, + max_sequence_length, self.transformer.config.joint_attention_dim, ), device=device, diff --git a/src/diffusers/pipelines/controlnet_sd3/pipeline_stable_diffusion_3_controlnet_inpainting.py b/src/diffusers/pipelines/controlnet_sd3/pipeline_stable_diffusion_3_controlnet_inpainting.py index c33cf979c6d8..68984da4dc40 100644 --- a/src/diffusers/pipelines/controlnet_sd3/pipeline_stable_diffusion_3_controlnet_inpainting.py +++ b/src/diffusers/pipelines/controlnet_sd3/pipeline_stable_diffusion_3_controlnet_inpainting.py @@ -284,7 +284,7 @@ def _get_t5_prompt_embeds( return torch.zeros( ( batch_size * 
num_images_per_prompt, - self.tokenizer_max_length, + max_sequence_length, self.transformer.config.joint_attention_dim, ), device=device, diff --git a/src/diffusers/pipelines/pag/pipeline_pag_sd_3.py b/src/diffusers/pipelines/pag/pipeline_pag_sd_3.py index acb4e52340a6..bc281428e257 100644 --- a/src/diffusers/pipelines/pag/pipeline_pag_sd_3.py +++ b/src/diffusers/pipelines/pag/pipeline_pag_sd_3.py @@ -237,7 +237,7 @@ def _get_t5_prompt_embeds( return torch.zeros( ( batch_size * num_images_per_prompt, - self.tokenizer_max_length, + max_sequence_length, self.transformer.config.joint_attention_dim, ), device=device, diff --git a/src/diffusers/pipelines/pag/pipeline_pag_sd_3_img2img.py b/src/diffusers/pipelines/pag/pipeline_pag_sd_3_img2img.py index e1819a79fb30..22a8dac238f5 100644 --- a/src/diffusers/pipelines/pag/pipeline_pag_sd_3_img2img.py +++ b/src/diffusers/pipelines/pag/pipeline_pag_sd_3_img2img.py @@ -253,7 +253,7 @@ def _get_t5_prompt_embeds( return torch.zeros( ( batch_size * num_images_per_prompt, - self.tokenizer_max_length, + max_sequence_length, self.transformer.config.joint_attention_dim, ), device=device,