|
| 1 | +"""Internal pipeline functions for SceneFlow API. |
| 2 | +
|
| 3 | +This module contains implementation details and should not be imported directly. |
| 4 | +Use the public API functions from sceneflow.api instead. |
| 5 | +""" |
| 6 | + |
| 7 | +import logging |
| 8 | +from typing import Dict, List, Optional, Tuple |
| 9 | + |
| 10 | +from sceneflow.shared.config import RankingConfig |
| 11 | +from sceneflow.detection import EnergyRefiner |
| 12 | +from sceneflow.shared.models import RankedFrame, FrameScore, FrameFeatures |
| 13 | +from sceneflow.core import CutPointRanker |
| 14 | +from sceneflow.detection import SpeechDetector |
| 15 | +from sceneflow.selection import LLMFrameSelector |
| 16 | +from sceneflow.utils.video import get_video_duration |
| 17 | + |
| 18 | +logger = logging.getLogger(__name__) |
| 19 | + |
| 20 | + |
def detect_speech_end(
    video_path: str,
    use_energy_refinement: bool,
    energy_threshold_db: float,
    energy_lookback_frames: int,
) -> Tuple[float, float, List[Dict[str, float]]]:
    """Find the moment speech ends in a video.

    Runs voice-activity detection (VAD) first, then — when requested —
    tightens the detected timestamp with an energy-analysis pass.

    Args:
        video_path: Path of the video file to analyse.
        use_energy_refinement: Whether to run energy-based refinement.
        energy_threshold_db: dB threshold handed to the EnergyRefiner.
        energy_lookback_frames: Lookback window (frames) for the refiner.

    Returns:
        ``(speech_end_time, visual_search_end_time, vad_timestamps)``.
        ``visual_search_end_time`` is the pre-refinement timestamp when
        refinement moved the end earlier, and ``-1.0`` otherwise.
    """
    logger.info("Stage 1: Detecting speech end time...")

    vad_end, vad_timestamps = SpeechDetector().get_speech_timestamps(video_path)
    logger.info("VAD detected speech end at: %.4fs", vad_end)

    refined_end = vad_end
    baseline_end = vad_end

    if use_energy_refinement:
        logger.info("Stage 1.5: Refining VAD-detected speech end time with energy analysis...")

        pre_refine = refined_end
        refiner = EnergyRefiner(
            threshold_db=energy_threshold_db,
            lookback_frames=energy_lookback_frames,
        )
        refinement = refiner.refine_speech_end(pre_refine, video_path)
        refined_end = refinement.refined_timestamp

        if refinement.frames_adjusted > 0:
            logger.info(
                "Energy refinement adjusted timestamp by %d frames",
                refinement.frames_adjusted,
            )
            baseline_end = pre_refine
        else:
            logger.info("Energy refinement: No adjustment needed")

    # If refinement pulled the end earlier, report the original timestamp
    # so the visual search can still scan up to it; -1.0 means "no limit".
    visual_search_end = baseline_end if refined_end < baseline_end else -1.0

    return refined_end, visual_search_end, vad_timestamps
| 65 | + |
| 66 | + |
def rank_frames(
    video_path: str,
    speech_end_time: float,
    duration: float,
    config: Optional[RankingConfig],
    sample_rate: int,
    visual_search_end_time: float = -1.0,
    return_internals: bool = False
) -> Tuple[List[RankedFrame], Optional[List[FrameFeatures]], Optional[List[FrameScore]]]:
    """Rank candidate cut frames in the window after speech ends.

    Args:
        video_path: Path of the video to analyse.
        speech_end_time: Start of the analysis window, in seconds.
        duration: Full video duration; used as the window end by default.
        config: Optional ranking configuration forwarded to CutPointRanker.
        sample_rate: Frame sampling rate for the ranker.
        visual_search_end_time: Explicit window end; values <= 0 mean
            "scan to the end of the video".
        return_internals: When True, also return per-frame features/scores.

    Returns:
        ``(ranked_frames, features, scores)`` — the last two are ``None``
        unless ``return_internals`` is set.
    """
    window_end = duration if visual_search_end_time <= 0 else visual_search_end_time

    logger.info("Stage 2: Ranking frames based on visual quality...")
    logger.info("Analyzing frames from %.4fs to %.4fs", speech_end_time, window_end)

    ranker = CutPointRanker(config)

    if not return_internals:
        ranked = ranker.rank_frames(
            video_path=video_path,
            start_time=speech_end_time,
            end_time=window_end,
            sample_rate=sample_rate,
        )
        return ranked, None, None

    ranked, frame_features, frame_scores = ranker.rank_frames(
        video_path=video_path,
        start_time=speech_end_time,
        end_time=window_end,
        sample_rate=sample_rate,
        return_internals=True,
    )
    return ranked, frame_features, frame_scores
| 101 | + |
| 102 | + |
def select_best_with_llm(
    video_path: str,
    ranked_frames: List[RankedFrame],
    speech_end_time: float,
    duration: float,
    scores: List[FrameScore],
    features: List[FrameFeatures],
    openai_api_key: Optional[str]
) -> RankedFrame:
    """Use an LLM to select the best frame from the top-ranked candidates.

    Falls back to the top-ranked frame when there is only one candidate or
    when the LLM call fails for any reason.

    Args:
        video_path: Path of the analysed video.
        ranked_frames: Candidate frames, best first. Must be non-empty.
        speech_end_time: When speech ends, in seconds (context for the LLM).
        duration: Total video duration, in seconds.
        scores: Currently unused; kept for interface compatibility.
        features: Currently unused; kept for interface compatibility.
        openai_api_key: API key forwarded to the LLM selector.

    Returns:
        The selected frame.

    Raises:
        ValueError: If ``ranked_frames`` is empty.
    """
    # Explicit guard: previously an empty list crashed with an opaque
    # IndexError at ranked_frames[0].
    if not ranked_frames:
        raise ValueError("ranked_frames must not be empty")
    if len(ranked_frames) < 2:
        # Nothing to choose between — skip the LLM round-trip entirely.
        return ranked_frames[0]
    try:
        selector = LLMFrameSelector(api_key=openai_api_key)
        return selector.select_best_frame(
            video_path=video_path,
            ranked_frames=ranked_frames,
            speech_end_time=speech_end_time,
            video_duration=duration,
        )
    except Exception as e:
        # Deliberate best-effort fallback: any LLM failure degrades to the
        # deterministic top-ranked result instead of aborting the pipeline.
        logger.warning("LLM selection failed: %s, using top result", e)
        return ranked_frames[0]
| 126 | + |
| 127 | + |
def upload_to_airtable(
    video_path: str,
    best_frame: RankedFrame,
    scores: List[FrameScore],
    features: List[FrameFeatures],
    speech_end_time: float,
    duration: float,
    config: Optional[RankingConfig],
    sample_rate: int,
    airtable_access_token: Optional[str],
    airtable_base_id: Optional[str],
    airtable_table_name: Optional[str]
) -> str:
    """Upload the analysis results for the selected frame to Airtable.

    Args:
        video_path: Path of the analysed video.
        best_frame: The frame chosen as the best cut point.
        scores: Per-frame scores; matched to ``best_frame`` by frame_index.
        features: Per-frame features; matched to ``best_frame`` by frame_index.
        speech_end_time: Detected end of speech, in seconds.
        duration: Total video duration, in seconds.
        config: Optional ranking configuration whose weights are recorded.
        sample_rate: Frame sampling rate used during ranking.
        airtable_access_token: Airtable API token (None uses downstream default).
        airtable_base_id: Airtable base id (None uses downstream default).
        airtable_table_name: Airtable table name (None uses downstream default).

    Returns:
        The id of the created Airtable record.

    Raises:
        RuntimeError: If the best frame's score or features cannot be found.
    """
    # Local import keeps the Airtable integration an optional dependency for
    # callers that never upload.
    from sceneflow.integration import upload_to_airtable as airtable_upload

    best_score = next((s for s in scores if s.frame_index == best_frame.frame_index), None)
    best_features = next((f for f in features if f.frame_index == best_frame.frame_index), None)

    # Compare against None explicitly: a present-but-falsy score/features
    # object must not be mistaken for missing data.
    if best_score is None or best_features is None:
        raise RuntimeError("Could not upload to Airtable - missing data")

    config_dict = {
        "sample_rate": sample_rate,
        "weights": {
            # Fallback weights when no config is supplied — presumably these
            # mirror RankingConfig's defaults; TODO confirm.
            "eye": config.eye_weight if config is not None else 0.4,
            "mouth": config.mouth_weight if config is not None else 0.6,
        },
    }

    return airtable_upload(
        video_path=video_path,
        best_frame=best_frame,
        frame_score=best_score,
        frame_features=best_features,
        speech_end_time=speech_end_time,
        duration=duration,
        config_dict=config_dict,
        access_token=airtable_access_token,
        base_id=airtable_base_id,
        table_name=airtable_table_name,
    )