File tree Expand file tree Collapse file tree 3 files changed +8
-11
lines changed Expand file tree Collapse file tree 3 files changed +8
-11
lines changed Original file line number Diff line number Diff line change 2323 params :
2424 time_embed_dim : 512
2525 elementwise_affine : True
26- num_frames : 81
26+ num_frames : 81 # 81 for 5 seconds, 161 for 10 seconds
2727 time_compressed_rate : 4
2828 latent_width : 300
2929 latent_height : 300
Original file line number Diff line number Diff line change @@ -25,11 +25,10 @@ model:
2525 network_config :
2626 target : dit_video_concat.DiffusionTransformer
2727 params :
28- # space_interpolation: 1.875
2928 ofs_embed_dim : 512
3029 time_embed_dim : 512
3130 elementwise_affine : True
32- num_frames : 81
31+ num_frames : 81 # 81 for 5 seconds, 161 for 10 seconds
3332 time_compressed_rate : 4
3433 latent_width : 300
3534 latent_height : 300
Original file line number Diff line number Diff line change 11args :
2- image2video : False # True for image2video, False for text2video
2+ # image2video: True # True for image2video, False for text2video
33 latent_channels : 16
44 mode : inference
55 load : " {your CogVideoX SAT folder}/transformer" # This is for Full model without lora adapter
6- # load: "{your lora folder} such as zRzRzRzRzRzRzR/lora-disney-08-20-13-28" # This is for the model with a LoRA adapter
76 batch_size : 1
87 input_type : txt
98 input_file : configs/test.txt
10- sampling_image_size : [480, 720]
11- sampling_num_frames : 13 # Must be 13, 11 or 9
12- sampling_fps : 8
13- # fp16: True # For CogVideoX-2B
14- bf16 : True # For CogVideoX-5B and CogVideoX-5B-I2V
15- output_dir : outputs/
9+ sampling_image_size : [768, 1360] # remove this for I2V
10+ sampling_num_frames : 22 # 42 for 10 seconds and 22 for 5 seconds
11+ sampling_fps : 16
12+ bf16 : True
13+ output_dir : outputs
1614 force_inference : True
You can’t perform that action at this time.
0 commit comments