Skip to content

Commit 8aa458e

Browse files
copies
1 parent 5029dbf commit 8aa458e

File tree

3 files changed

+66
-6
lines changed

3 files changed

+66
-6
lines changed

src/diffusers/pipelines/hunyuan_video1_5/pipeline_hunyuan_video1_5_image2video.py

Lines changed: 6 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -92,7 +92,7 @@ def format_text_input(prompt: List[str], system_message: str) -> List[Dict[str,
9292
return template
9393

9494

95-
# Copied from diffusers.pipelines.hunyuan_image.pipeline_hunyuanimage.extract_glyph_text
95+
# Copied from diffusers.pipelines.hunyuan_video1_5.pipeline_hunyuan_video1_5.extract_glyph_texts
9696
def extract_glyph_texts(prompt: str) -> List[str]:
9797
"""
9898
Extract glyph texts from prompt using regex pattern.
@@ -281,7 +281,7 @@ def _get_mllm_prompt_embeds(
281281
text_encoder: Qwen2_5_VLTextModel,
282282
tokenizer: Qwen2Tokenizer,
283283
prompt: Union[str, List[str]],
284-
device: Optional[torch.device] = None,
284+
device: torch.device,
285285
tokenizer_max_length: int = 1000,
286286
num_hidden_layers_to_skip: int = 2,
287287
# fmt: off
@@ -494,10 +494,10 @@ def encode_prompt(
494494
prompt_embeds_mask_2 = prompt_embeds_mask_2.repeat(1, num_videos_per_prompt, 1)
495495
prompt_embeds_mask_2 = prompt_embeds_mask_2.view(batch_size * num_videos_per_prompt, seq_len_2)
496496

497-
prompt_embeds = prompt_embeds.to(device=device, dtype=dtype)
498-
prompt_embeds_mask = prompt_embeds_mask.to(device=device, dtype=dtype)
499-
prompt_embeds_2 = prompt_embeds_2.to(device=device, dtype=dtype)
500-
prompt_embeds_mask_2 = prompt_embeds_mask_2.to(device=device, dtype=dtype)
497+
prompt_embeds = prompt_embeds.to(dtype=dtype, device=device)
498+
prompt_embeds_mask = prompt_embeds_mask.to(dtype=dtype, device=device)
499+
prompt_embeds_2 = prompt_embeds_2.to(dtype=dtype, device=device)
500+
prompt_embeds_mask_2 = prompt_embeds_mask_2.to(dtype=dtype, device=device)
501501

502502
return prompt_embeds, prompt_embeds_mask, prompt_embeds_2, prompt_embeds_mask_2
503503

src/diffusers/utils/dummy_pt_objects.py

Lines changed: 30 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -468,6 +468,21 @@ def from_pretrained(cls, *args, **kwargs):
468468
requires_backends(cls, ["torch"])
469469

470470

471+
class AutoencoderKLHunyuanVideo15(metaclass=DummyObject):
472+
_backends = ["torch"]
473+
474+
def __init__(self, *args, **kwargs):
475+
requires_backends(self, ["torch"])
476+
477+
@classmethod
478+
def from_config(cls, *args, **kwargs):
479+
requires_backends(cls, ["torch"])
480+
481+
@classmethod
482+
def from_pretrained(cls, *args, **kwargs):
483+
requires_backends(cls, ["torch"])
484+
485+
471 486
class AutoencoderKLLTXVideo(metaclass=DummyObject):
472 487
_backends = ["torch"]
473 488

@@ -993,6 +1008,21 @@ def from_pretrained(cls, *args, **kwargs):
993 1008
requires_backends(cls, ["torch"])
994 1009

995 1010

1011+
class HunyuanVideo15Transformer3DModel(metaclass=DummyObject):
1012+
_backends = ["torch"]
1013+
1014+
def __init__(self, *args, **kwargs):
1015+
requires_backends(self, ["torch"])
1016+
1017+
@classmethod
1018+
def from_config(cls, *args, **kwargs):
1019+
requires_backends(cls, ["torch"])
1020+
1021+
@classmethod
1022+
def from_pretrained(cls, *args, **kwargs):
1023+
requires_backends(cls, ["torch"])
1024+
1025+
996 1026
class HunyuanVideoFramepackTransformer3DModel(metaclass=DummyObject):
997 1027
_backends = ["torch"]
998 1028

src/diffusers/utils/dummy_torch_and_transformers_objects.py

Lines changed: 30 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1142,6 +1142,36 @@ def from_pretrained(cls, *args, **kwargs):
11421142
requires_backends(cls, ["torch", "transformers"])
11431143

11441144

1145+
class HunyuanVideo15ImageToVideoPipeline(metaclass=DummyObject):
1146+
_backends = ["torch", "transformers"]
1147+
1148+
def __init__(self, *args, **kwargs):
1149+
requires_backends(self, ["torch", "transformers"])
1150+
1151+
@classmethod
1152+
def from_config(cls, *args, **kwargs):
1153+
requires_backends(cls, ["torch", "transformers"])
1154+
1155+
@classmethod
1156+
def from_pretrained(cls, *args, **kwargs):
1157+
requires_backends(cls, ["torch", "transformers"])
1158+
1159+
1160+
class HunyuanVideo15Pipeline(metaclass=DummyObject):
1161+
_backends = ["torch", "transformers"]
1162+
1163+
def __init__(self, *args, **kwargs):
1164+
requires_backends(self, ["torch", "transformers"])
1165+
1166+
@classmethod
1167+
def from_config(cls, *args, **kwargs):
1168+
requires_backends(cls, ["torch", "transformers"])
1169+
1170+
@classmethod
1171+
def from_pretrained(cls, *args, **kwargs):
1172+
requires_backends(cls, ["torch", "transformers"])
1173+
1174+
1145 1175
class HunyuanVideoFramepackPipeline(metaclass=DummyObject):
1146 1176
_backends = ["torch", "transformers"]
1147 1177

0 commit comments

Comments
 (0)