Skip to content

Commit 9ed54c1

Browse files
committed
fix bugs
1 parent e3f8a57 commit 9ed54c1

File tree

4 files changed

+7
-39
lines changed

4 files changed

+7
-39
lines changed

diffsynth/pipelines/sd_video.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -257,10 +257,10 @@ def __call__(
                 progress_bar_st.progress(progress_id / len(self.scheduler.timesteps))
 
         # Decode image
-        image = self.decode_video(latents, **tiler_kwargs)
+        output_frames = self.decode_video(latents, **tiler_kwargs)
 
         # Post-process
         if smoother is not None and (num_inference_steps in smoother_progress_ids or -1 in smoother_progress_ids):
             output_frames = smoother(output_frames, original_frames=input_frames)
 
-        return image
+        return output_frames

diffsynth/pipelines/sdxl_video.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -214,10 +214,10 @@ def __call__(
                 progress_bar_st.progress(progress_id / len(self.scheduler.timesteps))
 
         # Decode image
-        image = self.decode_video(latents, **tiler_kwargs)
+        output_frames = self.decode_video(latents, **tiler_kwargs)
 
         # Post-process
         if smoother is not None and (num_inference_steps in smoother_progress_ids or -1 in smoother_progress_ids):
             output_frames = smoother(output_frames, original_frames=input_frames)
 
-        return image
+        return output_frames

examples/ExVideo/ExVideo_svd_train.py

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@
 from einops import rearrange, repeat
 import lightning as pl
 from diffsynth import ModelManager, SVDImageEncoder, SVDUNet, SVDVAEEncoder, ContinuousODEScheduler, load_state_dict
-from diffsynth.pipelines.stable_video_diffusion import SVDCLIPImageProcessor
+from diffsynth.pipelines.svd_video import SVDCLIPImageProcessor
 from diffsynth.models.svd_unet import TemporalAttentionBlock
 
 
@@ -131,14 +131,14 @@ def __init__(self, learning_rate=1e-5, svd_ckpt_path=None, add_positional_conv=1
         self.image_encoder.requires_grad_(False)
 
         self.unet = SVDUNet(add_positional_conv=add_positional_conv).to(dtype=torch.float16, device=self.device)
-        self.unet.load_state_dict(SVDUNet.state_dict_converter().from_civitai(state_dict), strict=False)
+        self.unet.load_state_dict(SVDUNet.state_dict_converter().from_civitai(state_dict, add_positional_conv=add_positional_conv), strict=False)
         self.unet.train()
         self.unet.requires_grad_(False)
         for block in self.unet.blocks:
             if isinstance(block, TemporalAttentionBlock):
                 block.requires_grad_(True)
 
-        self.vae_encoder = SVDVAEEncoder.to(dtype=torch.float16, device=self.device)
+        self.vae_encoder = SVDVAEEncoder().to(dtype=torch.float16, device=self.device)
         self.vae_encoder.load_state_dict(SVDVAEEncoder.state_dict_converter().from_civitai(state_dict))
         self.vae_encoder.eval()
         self.vae_encoder.requires_grad_(False)

examples/image_synthesis/sd3_text_to_image_textual_inversion.py

Lines changed: 0 additions & 32 deletions
This file was deleted.

0 commit comments

Comments
 (0)