Merge version 1.5.15

AustinMroz · web-flow · commit ab96cf260896 · 2025-04-02T11:47:31.000-05:00
diff --git a/pyproject.toml b/pyproject.toml
@@ -1,7 +1,7 @@
 [project]
 name = "comfyui-videohelpersuite"
 description = "Nodes related to video workflows"
-version = "1.5.14"
+version = "1.5.15"
 license = { file = "LICENSE" }
 dependencies = ["opencv-python", "imageio-ffmpeg"]
 
diff --git a/video_formats/ProRes.json b/video_formats/ProRes.json
@@ -3,9 +3,9 @@
     [
         "-n", "-c:v", "prores_ks",
         "-profile:v", ["profile",["1","2","3","4"], {"default": "3"}],
-        "-colorspace", "1", "-color_primaries", "1", "-color_trc", "1"
-
+        "-vf", "scale=out_color_matrix=bt709"
     ],
+    "fake_trc": "bt709",
     "audio_pass": ["-c:a", "pcm_s16le"],
     "extension": "mov"
 }
diff --git a/video_formats/av1-webm.json b/video_formats/av1-webm.json
@@ -4,9 +4,9 @@
         "-n", "-c:v", "libsvtav1",
         "-pix_fmt", ["pix_fmt", ["yuv420p10le", "yuv420p"]],
         "-crf", ["crf","INT", {"default": 23, "min": 0, "max": 100, "step": 1}],
-        "-vf", "colorspace=all=bt709:iall=bt601-6-625:fast=1",
-        "-colorspace", "1", "-color_primaries", "1", "-color_trc", "1"
+        "-vf", "scale=out_color_matrix=bt709"
     ],
+    "fake_trc": "bt709",
     "audio_pass": ["-c:a", "libopus"],
     "input_color_depth": ["input_color_depth", ["8bit", "16bit"]],
     "save_metadata": ["save_metadata", "BOOLEAN", {"default": true}],
diff --git a/video_formats/gifski.json b/video_formats/gifski.json
@@ -1,7 +1,8 @@
 {
     "main_pass":
     [
-        "-pix_fmt", "yuv420p"
+        "-pix_fmt", "yuv420p",
+        "-vf", "scale=out_color_matrix=bt709"
     ],
     "extension": "gif",
     "gifski_pass": [
diff --git a/video_formats/h264-mp4.json b/video_formats/h264-mp4.json
@@ -4,9 +4,9 @@
         "-n", "-c:v", "libx264",
         "-pix_fmt", ["pix_fmt", ["yuv420p", "yuv420p10le"]],
         "-crf", ["crf","INT", {"default": 19, "min": 0, "max": 100, "step": 1}],
-        "-vf", "colorspace=all=bt709:iall=bt601-6-625:fast=1",
-        "-colorspace", "1", "-color_primaries", "1", "-color_trc", "1"
+        "-vf", "scale=out_color_matrix=bt709"
     ],
+    "fake_trc": "bt709",
     "audio_pass": ["-c:a", "aac"],
     "save_metadata": ["save_metadata", "BOOLEAN", {"default": true}],
     "trim_to_audio": ["trim_to_audio", "BOOLEAN", {"default": false}],
diff --git a/video_formats/h265-mp4.json b/video_formats/h265-mp4.json
@@ -6,10 +6,10 @@
         "-pix_fmt", ["pix_fmt", ["yuv420p10le", "yuv420p"]],
         "-crf", ["crf","INT", {"default": 22, "min": 0, "max": 100, "step": 1}],
         "-preset", "medium",
-        "-vf", "colorspace=all=bt709:iall=bt601-6-625:fast=1",
-        "-colorspace", "1", "-color_primaries", "1", "-color_trc", "1",
+        "-vf", "scale=out_color_matrix=bt709",
         "-x265-params", "log-level=quiet"
     ],
+    "fake_trc": "bt709",
     "audio_pass": ["-c:a", "aac"],
     "save_metadata": ["save_metadata", "BOOLEAN", {"default": true}],
     "extension": "mp4"
diff --git a/video_formats/nvenc_h264-mp4.json b/video_formats/nvenc_h264-mp4.json
@@ -2,8 +2,10 @@
     "main_pass":
     [
         "-n", "-c:v", "h264_nvenc",
-        "-pix_fmt", ["pix_fmt", ["yuv420p", "yuv420p10le", "rgba"]]
+        "-pix_fmt", ["pix_fmt", ["yuv420p", "yuv420p10le"]],
+        "-vf", "scale=out_color_matrix=bt709"
     ],
+    "fake_trc": "bt709",
     "audio_pass": ["-c:a", "aac"],
     "bitrate": ["bitrate","INT", {"default": 10, "min": 1, "max": 999, "step": 1 }],
     "megabit": ["megabit","BOOLEAN", {"default": true}],
diff --git a/video_formats/nvenc_hevc-mp4.json b/video_formats/nvenc_hevc-mp4.json
@@ -3,8 +3,10 @@
     [
         "-n", "-c:v", "hevc_nvenc",
         "-vtag", "hvc1",
-        "-pix_fmt", ["pix_fmt", ["yuv420p", "yuv420p10le", "rgba"]]
+        "-pix_fmt", ["pix_fmt", ["yuv420p", "yuv420p10le"]],
+        "-vf", "scale=out_color_matrix=bt709"
     ],
+    "fake_trc": "bt709",
     "audio_pass": ["-c:a", "aac"],
     "bitrate": ["bitrate","INT", {"default": 10, "min": 1, "max": 999, "step": 1 }],
     "megabit": ["megabit","BOOLEAN", {"default": true}],
diff --git a/video_formats/webm.json b/video_formats/webm.json
@@ -5,8 +5,9 @@
         "-pix_fmt", ["pix_fmt",["yuv420p","yuva420p"]],
         "-crf", ["crf","INT", {"default": 20, "min": 0, "max": 100, "step": 1}],
         "-b:v", "0",
-        "-colorspace", "1", "-color_primaries", "1", "-color_trc", "1"
+        "-vf", "scale=out_color_matrix=bt709"
     ],
+    "fake_trc": "bt709",
     "audio_pass": ["-c:a", "libvorbis"],
     "save_metadata": ["save_metadata", "BOOLEAN", {"default": true}],
     "trim_to_audio": ["trim_to_audio", "BOOLEAN", {"default": false}],
diff --git a/videohelpersuite/nodes.py b/videohelpersuite/nodes.py
@@ -165,12 +165,13 @@ def ffmpeg_process(args, video_format, video_metadata, file_path, env):
     if len(res) > 0:
         print(res.decode(*ENCODE_ARGS), end="", file=sys.stderr)
 
-def gifski_process(args, video_format, file_path, env):
+def gifski_process(args, dimensions, video_format, file_path, env):
     frame_data = yield
     with subprocess.Popen(args + video_format['main_pass'] + ['-f', 'yuv4mpegpipe', '-'],
                           stderr=subprocess.PIPE, stdin=subprocess.PIPE,
                           stdout=subprocess.PIPE, env=env) as procff:
         with subprocess.Popen([gifski_path] + video_format['gifski_pass']
+                              + ['-W', f'{dimensions[0]}', '-H', f'{dimensions[1]}']
                               + ['-q', '-o', file_path, '-'], stderr=subprocess.PIPE,
                               stdin=procff.stdout, stdout=subprocess.PIPE,
                               env=env) as procgs:
@@ -417,12 +418,11 @@ def pad(image):
                     padded = padfunc(image.to(dtype=torch.float32))
                     return padded.permute((1,2,0))
                 images = map(pad, images)
-                new_dims = (-first_image.shape[1] % dim_alignment + first_image.shape[1],
-                            -first_image.shape[0] % dim_alignment + first_image.shape[0])
-                dimensions = f"{new_dims[0]}x{new_dims[1]}"
+                dimensions = (-first_image.shape[1] % dim_alignment + first_image.shape[1],
+                              -first_image.shape[0] % dim_alignment + first_image.shape[0])
                 logger.warn("Output images were not of valid resolution and have had padding applied")
             else:
-                dimensions = f"{first_image.shape[1]}x{first_image.shape[0]}"
+                dimensions = (first_image.shape[1], first_image.shape[0])
             if loop_count > 0:
                 loop_args = ["-vf", "loop=loop=" + str(loop_count)+":size=" + str(num_frames)]
             else:
@@ -450,7 +450,18 @@ def pad(image):
             if bitrate is not None:
                 bitrate_arg = ["-b:v", str(bitrate) + "M" if video_format.get('megabit') == 'True' else str(bitrate) + "K"]
             args = [ffmpeg_path, "-v", "error", "-f", "rawvideo", "-pix_fmt", i_pix_fmt,
-                    "-s", dimensions, "-r", str(frame_rate), "-i", "-"] \
+                    # The image data is in an undefined generic RGB color space, which in practice means sRGB.
+                    # sRGB has the same primaries and matrix as BT.709, but a different transfer function (gamma),
+                    # known by the name of the sRGB standard, IEC 61966-2-1. However, video hosting platforms like YouTube
+                    # standardize on full BT.709 and will convert the colors accordingly. This last-minute change
+                    # in colors can be confusing to users. We can counter it by lying about the transfer function
+                    # on a per format basis, i.e. for video we will lie to FFmpeg that it is already BT.709. Also,
+                    # because the input data is in RGB (not YUV) it is more efficient (fewer scale filter invocations)
+                    # to specify the input color space as RGB and then later, if the format actually wants YUV,
+                    # to convert it to BT.709 YUV via FFmpeg's -vf "scale=out_color_matrix=bt709".
+                    "-color_range", "full", "-colorspace", "rgb", "-color_primaries", "bt709",
+                    "-color_trc", video_format.get("fake_trc", "iec61966-2-1"),
+                    "-s", f"{dimensions[0]}x{dimensions[1]}", "-r", str(frame_rate), "-i", "-"] \
                     + loop_args
 
             images = map(lambda x: x.tobytes(), images)
@@ -479,8 +490,9 @@ def pad(image):
                 args = args[:13] + video_format['inputs_main_pass'] + args[13:]
 
             if output_process is None:
+                format = 'image/gif'
                 if 'gifski_pass' in video_format:
-                    output_process = gifski_process(args, video_format, file_path, env)
+                    output_process = gifski_process(args, dimensions, video_format, file_path, env)
                 else:
                     args += video_format['main_pass'] + bitrate_arg
                     merge_filter_args(args)

Original file line number	Diff line number	Diff line change
`@@ -3,9 +3,9 @@`
`3`	`3`	`[`
`4`	`4`	`"-n", "-c:v", "prores_ks",`
`5`	`5`	`"-profile:v", ["profile",["1","2","3","4"], {"default": "3"}],`
`6`		`- "-colorspace", "1", "-color_primaries", "1", "-color_trc", "1"`
`7`		`-`
	`6`	`+ "-vf", "scale=out_color_matrix=bt709"`
`8`	`7`	`],`
	`8`	`+ "fake_trc": "bt709",`
`9`	`9`	`"audio_pass": ["-c:a", "pcm_s16le"],`
`10`	`10`	`"extension": "mov"`
`11`	`11`	`}`
Original file line number	Diff line number	Diff line change
`@@ -1,7 +1,8 @@`
`1`	`1`	`{`
`2`	`2`	`"main_pass":`
`3`	`3`	`[`
`4`		`- "-pix_fmt", "yuv420p"`
	`4`	`+ "-pix_fmt", "yuv420p",`
	`5`	`+ "-vf", "scale=out_color_matrix=bt709"`
`5`	`6`	`],`
`6`	`7`	`"extension": "gif",`
`7`	`8`	`"gifski_pass": [`