Skip to content

Commit 8b1e3ec

Browse files
yiyixuxu and sayakpaul authored
[hunyuan-dit] refactor HunyuanCombinedTimestepTextSizeStyleEmbedding (#8761)
up Co-authored-by: Sayak Paul <[email protected]>
1 parent 4e57aef commit 8b1e3ec

File tree

1 file changed

+3
-1
lines changed

1 file changed

+3
-1
lines changed

src/diffusers/models/embeddings.py

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -730,6 +730,8 @@ def __init__(
730730
self.time_proj = Timesteps(num_channels=256, flip_sin_to_cos=True, downscale_freq_shift=0)
731731
self.timestep_embedder = TimestepEmbedding(in_channels=256, time_embed_dim=embedding_dim)
732732

733+
self.size_proj = Timesteps(num_channels=256, flip_sin_to_cos=True, downscale_freq_shift=0)
734+
733735
self.pooler = HunyuanDiTAttentionPool(
734736
seq_len, cross_attention_dim, num_heads=8, output_dim=pooled_projection_dim
735737
)
@@ -758,7 +760,7 @@ def forward(self, timestep, encoder_hidden_states, image_meta_size, style, hidde
758760

759761
if self.use_style_cond_and_image_meta_size:
760762
# extra condition2: image meta size embedding
761-
image_meta_size = get_timestep_embedding(image_meta_size.view(-1), 256, True, 0)
763+
image_meta_size = self.size_proj(image_meta_size.view(-1))
762764
image_meta_size = image_meta_size.to(dtype=hidden_dtype)
763765
image_meta_size = image_meta_size.view(-1, 6 * 256) # (N, 1536)
764766

0 commit comments

Comments
 (0)