Rename _to_poseinterface. Add video conversion bits

sfmig · sfmig · commit dc09c573e90c · 2026-03-27T13:02:04.000Z
diff --git a/examples/SWC-plusmaze_to_benchmark.py b/examples/SWC-plusmaze_to_benchmark.py
@@ -13,7 +13,7 @@
 import shutil
 from pathlib import Path
 
-from poseinterface.io import annotations_to_coco
+from poseinterface.io import annotations_to_poseinterface
 
 # %%
 # Background
@@ -102,7 +102,7 @@
 # Here we use the :func:`annotations_to_coco` function from `poseinterface.io`
 # which wraps around `sleap_io` functionality to perform the conversion.
 
-annotations_to_coco(
+annotations_to_poseinterface(
     input_path=source_annotations_path,
     output_json_path=target_annotations_path,
     sub_id=subject_id,
diff --git a/poseinterface/io.py b/poseinterface/io.py
@@ -1,11 +1,14 @@
 import copy
 import json
+import logging
 import re
+import shutil
 from pathlib import Path
 from typing import Literal
 
 import sleap_io as sio
 from sleap_io.io import coco
+from sleap_io.io.cli import _get_video_encoding_info, _is_ffmpeg_available
 from sleap_io.io.dlc import is_dlc_file
 
 _EMPTY_LABELS_ERROR_MSG = {
@@ -24,8 +27,21 @@
 
 POSEINTERFACE_FRAME_REGEXP = r"frame-(\d+)"
 
+# We support sleap's MediaVideo files
+EXPECTED_SUFFIX = ".mp4"
+EXPECTED_ENCODING = {
+    "pixelformat": "yuv420p",
+    "codec": "h264",  # codec name
+}
+REENCODING_PARAMS = {
+    **EXPECTED_ENCODING,
+    "codec": "libx264",  # overwrite with encoder to use
+    "crf": 25,
+    "preset": "superfast",
+}
 
-def annotations_to_coco(
+
+def annotations_to_poseinterface(
     input_path: Path,
     output_json_path: Path,
     *,
@@ -246,3 +262,102 @@ def _pad_integers_to_same_width(input: list[int]) -> list[str]:
     width = len(str(max(input)))
     padded_numbers = [str(number).zfill(width) for number in input]
     return padded_numbers
+
+
+def video_to_poseinterface(
+    input_video: Path | str,
+    output_video_dir: Path | str,
+    *,
+    sub_id: str,
+    ses_id: str,
+    cam_id: str,
+) -> Path:
+    """Reencode and rename video."""
+    # Check if ffmpeg is available
+    _check_ffmpeg()
+
+    # Compute output_video_path
+    output_video = (
+        Path(output_video_dir) / f"sub-{sub_id}_ses-{ses_id}_cam-{cam_id}.mp4"
+    )
+    # Ensure parent directories exist
+    Path(output_video_dir).mkdir(parents=True, exist_ok=True)
+
+    # Check if reencoding is required
+    if not _needs_reencoding(input_video):
+        # If not, copy file and rename
+        shutil.copy(input_video, output_video)
+    else:
+        # Else, reencode video and rename
+        _reencode_video(input_video, output_video)
+
+    return output_video
+
+
+def _check_ffmpeg():
+    "Check FFMPEG availability"
+    sio.set_default_video_plugin("ffmpeg")
+    if not _is_ffmpeg_available():
+        raise RuntimeError("ffmpeg is required but not found")
+
+
+def _needs_reencoding(input_video_path: str | Path) -> bool:
+    """Check if reencoding is required."""
+    input_video_path = Path(input_video_path)
+    logging.info(f"Input video: {input_video_path}")
+
+    # Check if suffix is mp4
+    if input_video_path.suffix.lower() != EXPECTED_SUFFIX:
+        return True
+
+    # Check codec and pixelformat
+    encoding = _get_codec_pixelformat(input_video_path)
+    if encoding != EXPECTED_ENCODING:
+        logging.warning(
+            f"Video encoding {encoding} does not match "
+            f"expected {EXPECTED_ENCODING}. Please reencode "
+            "using the `reencode_video()` function."
+        )
+        return True
+    return False
+
+
+def _get_codec_pixelformat(input_video_path: str | Path) -> dict:
+    """Get video encoding parameters as dictionary.
+
+    It wraps sleap-io's _get_video_encoding_info, which
+    uses `ffmpeg -i` to extract metadata without requiring ffprobe in PATH.
+
+    `_get_video_encoding_info` returns a VideoEncodingInfo object
+    with attributes:
+      codec: Video codec name (e.g., "h264", "hevc").
+      codec_profile: Codec profile (e.g., "Main", "High").
+      pixel_format: Pixel format (e.g., "yuv420p").
+      bitrate_kbps: Bitrate in kilobits per second.
+      fps: Frames per second.
+      gop_size: Group of pictures size (keyframe interval).
+      container: Container format (e.g., "mov", "avi").
+
+    """
+    info = _get_video_encoding_info(input_video_path)
+    return {
+        "codec": info.codec,
+        "pixelformat": info.pixel_format,
+    }
+
+
+def _reencode_video(
+    input_video_path: str | Path,
+    output_video_path: str | Path,
+) -> Path:
+    """Reencode video to default format."""
+    # Read and save reencoded video
+    video = sio.load_video(Path(input_video_path))
+    reencoded_video_path = sio.save_video(
+        video,
+        filename=output_video_path,
+        fps=video.fps,
+        **REENCODING_PARAMS,
+    )
+    logging.info(f"Re-encoded video saved to {reencoded_video_path}")
+    return reencoded_video_path
diff --git a/tests/test_integration/test_io.py b/tests/test_integration/test_io.py
@@ -1,6 +1,6 @@
 import pytest
 
-from poseinterface.io import annotations_to_coco
+from poseinterface.io import annotations_to_poseinterface
 
 
 @pytest.mark.parametrize(
@@ -18,6 +18,6 @@ def test_annotations_to_coco(input_path, tmp_path, test_ids, request):
     input_path = request.getfixturevalue(input_path)
     output_json_path = tmp_path / "output.json"
 
-    annotations_to_coco(input_path, output_json_path, **test_ids)
+    annotations_to_poseinterface(input_path, output_json_path, **test_ids)
 
     assert output_json_path.exists()
diff --git a/tests/test_unit/test_io.py b/tests/test_unit/test_io.py
@@ -12,7 +12,7 @@
     _generate_poseinterface_filenames,
     _pad_integers_to_same_width,
     _update_image_ids,
-    annotations_to_coco,
+    annotations_to_poseinterface,
 )
 
 
@@ -35,7 +35,7 @@ def test_annotations_to_coco(
     # Run function to test
     input_csv = tmp_path / "input.csv"
     output_path = tmp_path / "output.json"
-    result = annotations_to_coco(
+    result = annotations_to_poseinterface(
         input_csv,
         output_path,
         **test_ids,
@@ -83,7 +83,7 @@ def test_annotations_to_coco_invalid(
     with pytest.raises(
         ValueError, match=_EMPTY_LABELS_ERROR_MSG[error_message]
     ):
-        annotations_to_coco(
+        annotations_to_poseinterface(
             input_file,
             tmp_path / "output.json",
             **test_ids,
@@ -111,7 +111,7 @@ def test_annotations_to_coco_not_single_video(
         ValueError,
         match=(r"The annotations refer to multiple videos.*Please check .*"),
     ):
-        annotations_to_coco(
+        annotations_to_poseinterface(
             tmp_path / "input.csv",
             tmp_path / "output.json",
             **test_ids,