VectorInstitute
diff --git a/src/aieng_bot_maintain/auto_merger/pr_processor.py b/src/aieng_bot_maintain/auto_merger/pr_processor.py
Lines changed: 24 additions & 6 deletions
diff --git a/src/aieng_bot_maintain/auto_merger/status_poller.py b/src/aieng_bot_maintain/auto_merger/status_poller.py
Lines changed: 122 additions & 33 deletions
diff --git a/src/aieng_bot_maintain/auto_merger/workflow_client.py b/src/aieng_bot_maintain/auto_merger/workflow_client.py
Lines changed: 52 additions & 17 deletions
@@ -131,7 +131,7 @@ def _trigger_rebase(self, pr: PRQueueItem) -> bool:
         1. Dependabot comments ("already up-to-date", error messages)
         2. PR head SHA changes (indicates successful force-push)
 
-        For pre-commit.ci PRs, skips rebase (not supported) and proceeds directly.
+        For pre-commit.ci PRs, manual rebase is synchronous - no polling needed.
 
         Parameters
         ----------
@@ -156,7 +156,7 @@ def _trigger_rebase(self, pr: PRQueueItem) -> bool:
             pr.last_updated = datetime.now(UTC).isoformat()
             return False
 
-        # Get current head SHA before triggering rebase
+        # Get current head SHA before triggering rebase (for Dependabot polling)
         initial_head_sha = self.workflow_client.get_pr_head_sha(pr)
         if not initial_head_sha:
             pr.error_message = "Failed to get PR head SHA"
@@ -167,7 +167,9 @@ def _trigger_rebase(self, pr: PRQueueItem) -> bool:
         log_info(f"Current head SHA: {initial_head_sha[:7]}")
 
         # Trigger bot-specific rebase
-        if not self.workflow_client.trigger_rebase(pr):
+        success, new_sha, sha_changed = self.workflow_client.trigger_rebase(pr)
+
+        if not success:
             pr.error_message = "Failed to trigger rebase"
             pr.status = PRStatus.FAILED
             pr.last_updated = datetime.now(UTC).isoformat()
@@ -177,9 +179,25 @@ def _trigger_rebase(self, pr: PRQueueItem) -> bool:
         pr.rebase_started_at = datetime.now(UTC).isoformat()
         pr.last_updated = datetime.now(UTC).isoformat()
 
-        # Poll for rebase completion
-        # - Dependabot: polls for comments + SHA changes
-        # - pre-commit.ci: polls for SHA changes (manual rebase via git)
+        # For manual rebases (pre-commit.ci), rebase completed synchronously
+        if new_sha is not None:
+            if sha_changed:
+                log_success(
+                    f"Rebase completed (SHA changed: {initial_head_sha[:7]} → {new_sha[:7]})"
+                )
+                # Wait longer for CI to start checks after new commits
+                log_info("Waiting 45s for CI to trigger checks after rebase...")
+                time.sleep(45)
+            else:
+                log_success(
+                    "Branch already up-to-date with base, proceeding to check monitoring"
+                )
+                # Brief wait for API to update, then check existing checks
+                log_info("Waiting 15s for GitHub API to update...")
+                time.sleep(15)
+            return False  # Proceed to check monitoring
+
+        # For async rebases (Dependabot), poll for completion
         return self._poll_rebase_completion(pr, initial_head_sha)
 
     def _poll_rebase_completion(self, pr: PRQueueItem, initial_head_sha: str) -> bool:
 
@@ -286,6 +286,97 @@ def is_check_failed(check: dict) -> bool:
         log_warning("  Mergeable status still UNKNOWN after retries")
         return all_passed, has_failures, "UNKNOWN"
 
+    def _handle_no_checks(
+        self, rollup: list[dict], attempt: int, check_interval: int
+    ) -> CheckStatus | None:
+        """Decide how to proceed when a poll may have produced no checks.
+
+        Parameters
+        ----------
+        rollup : list[dict]
+            Raw check rollup from GitHub API.
+        attempt : int
+            Current attempt number.
+        check_interval : int
+            Seconds to sleep when nothing countable is available yet.
+
+        Returns
+        -------
+        CheckStatus | None
+            "NO_CHECKS" when attempt > 2 and nothing countable exists. None
+            otherwise: after sleeping, or at once if countable checks exist.
+
+        """
+        if rollup:
+            # Phantom entries are filtered out before deciding anything
+            countable = [c for c in rollup if self._should_check_be_counted(c)]
+            if countable:
+                return None
+            warning = "    No relevant checks found"
+        else:
+            warning = "    No checks found"
+
+        # Give checks time to start: early attempts just sleep and return None
+        if attempt <= 2:
+            time.sleep(check_interval)
+            return None
+
+        # Still nothing after the grace period
+        log_warning(warning)
+        return "NO_CHECKS"
+
+    def _evaluate_check_status(
+        self,
+        relevant_checks: list[dict],
+        stable_count_duration: int,
+        min_stable_duration: int,
+    ) -> CheckStatus | None:
+        """Evaluate status of relevant checks.
+
+        Parameters
+        ----------
+        relevant_checks : list[dict]
+            Filtered checks to evaluate; an empty list is never conclusive.
+        stable_count_duration : int
+            How long check count has been stable (seconds).
+        min_stable_duration : int
+            Minimum stability duration before declaring failure (seconds).
+
+        Returns
+        -------
+        CheckStatus | None
+            "FAILED" or "COMPLETED" once determined, None to continue waiting.
+
+        """
+        any_running = any(self._is_check_running(c) for c in relevant_checks)
+        any_failed = any(self._is_check_failed(c) for c in relevant_checks)
+        all_passed = all(self._is_check_passed(c) for c in relevant_checks)
+        all_finalized = all(self._has_finalized_conclusion(c) for c in relevant_checks)
+
+        if not relevant_checks or any_running:  # all() is vacuously True when empty
+            return None
+        if not all_finalized:
+            log_info(
+                "    ⏳ Checks appear done but conclusions not finalized yet, "
+                "waiting..."
+            )
+            return None
+        if any_failed:
+            if stable_count_duration >= min_stable_duration:
+                log_error("  Checks failed")
+                return "FAILED"
+            log_info(
+                f"    ⏳ Some checks failed, but waiting for check count to "
+                f"stabilize ({stable_count_duration}s/{min_stable_duration}s) "
+                "to ensure all checks have appeared..."
+            )
+            return None
+        if all_passed:
+            log_success("  Checks completed successfully")
+            return "COMPLETED"
+        log_info("    ⏳ Checks finalized but not all passed, waiting...")
+        return None
+
     def wait_for_checks_completion(
         self,
         pr: PRQueueItem,
@@ -296,6 +387,10 @@ def wait_for_checks_completion(
         Polls every 30 seconds up to timeout_minutes.
         Similar to fix-remote-pr.yml:603-673.
 
+        To prevent premature failure detection, we track check count stability.
+        We only return "FAILED" after the check count has been stable for 60s,
+        ensuring all checks have appeared in GitHub's API.
+
         Parameters
         ----------
         pr : PRQueueItem
@@ -311,6 +406,11 @@ def wait_for_checks_completion(
         """
         check_interval = 30
         max_attempts = (timeout_minutes * 60) // check_interval
+        min_stable_duration = 60
+
+        # Track check count stability to ensure all checks have appeared
+        last_check_count = 0
+        stable_count_duration = 0
 
         log_info(
             f"  ⏳ Waiting up to {timeout_minutes} minutes for checks to complete..."
@@ -335,48 +435,37 @@ def wait_for_checks_completion(
             data = json.loads(status_json)
             rollup = data.get("statusCheckRollup") or []
 
-            if not rollup:
-                if attempt > 2:  # Give checks time to start
-                    log_warning("    No checks found")
-                    return "NO_CHECKS"
-                time.sleep(check_interval)
+            # Handle no checks case
+            result = self._handle_no_checks(rollup, attempt, check_interval)
+            if result == "NO_CHECKS":
+                return result
+            if result is None and not rollup:
                 continue
 
-            # Filter out checks that should be ignored (phantom entries)
+            # Get relevant checks (already filtered by _handle_no_checks)
             relevant_checks = [c for c in rollup if self._should_check_be_counted(c)]
-
             if not relevant_checks:
-                if attempt > 2:  # Give checks time to start
-                    log_warning("    No relevant checks found")
-                    return "NO_CHECKS"
-                time.sleep(check_interval)
                 continue
 
-            # Check status of relevant checks
-            any_running = any(self._is_check_running(c) for c in relevant_checks)
-            any_failed = any(self._is_check_failed(c) for c in relevant_checks)
-            all_passed = all(self._is_check_passed(c) for c in relevant_checks)
-            all_finalized = all(
-                self._has_finalized_conclusion(c) for c in relevant_checks
-            )
-
-            if not any_running and all_finalized:
-                if any_failed:
-                    log_error("  Checks failed")
-                    return "FAILED"
-                if all_passed:
-                    log_success("  Checks completed successfully")
-                    return "COMPLETED"
-                # Checks are finalized but not all passed - still waiting
-                log_info("    ⏳ Checks finalized but not all passed, waiting...")
-
-            # Debug: Show why we're still waiting
-            if not any_running and not all_finalized:
+            # Track check count stability
+            current_check_count = len(relevant_checks)
+            if current_check_count == last_check_count:
+                stable_count_duration += check_interval
+            else:
+                stable_count_duration = 0
+                last_check_count = current_check_count
                 log_info(
-                    "    ⏳ Checks appear done but conclusions not finalized yet, "
-                    "waiting..."
+                    f"    Check count changed to {current_check_count}, "
+                    "resetting stability timer"
                 )
 
+            # Evaluate check status
+            status = self._evaluate_check_status(
+                relevant_checks, stable_count_duration, min_stable_duration
+            )
+            if status:
+                return status
+
             if attempt < max_attempts:
                 time.sleep(check_interval)
 
 
@@ -157,11 +157,11 @@ def get_pr_head_sha(self, pr: PRQueueItem) -> str | None:
             log_error(f"Failed to get PR head SHA: {e}")
             return None
 
-    def trigger_rebase(self, pr: PRQueueItem) -> bool:
+    def trigger_rebase(self, pr: PRQueueItem) -> tuple[bool, str | None, bool]:
         """Trigger bot-specific rebase command.
 
-        For Dependabot: Post @dependabot rebase comment
-        For pre-commit.ci: Manually rebase via git operations
+        For Dependabot: Post @dependabot rebase comment (async)
+        For pre-commit.ci: Manually rebase via git operations (sync)
 
         Parameters
         ----------
@@ -170,11 +170,14 @@ def trigger_rebase(self, pr: PRQueueItem) -> bool:
 
         Returns
         -------
-        bool
-            True on success, False on failure.
+        tuple[bool, str | None, bool]
+            (success, new_sha, sha_changed) where:
+            - success: True if rebase triggered/succeeded, False on failure
+            - new_sha: New head SHA (only for manual rebases, None for async)
+            - sha_changed: True if SHA changed (only for manual rebases, True for async to trigger polling)
 
         """
-        # Dependabot PRs use comment-based rebase
+        # Dependabot PRs use comment-based rebase (async)
         if pr.pr_author == "app/dependabot":
             try:
                 self._run_gh_command(
@@ -190,21 +193,21 @@ def trigger_rebase(self, pr: PRQueueItem) -> bool:
                     ]
                 )
                 log_success(f"  Rebase triggered for {pr.repo}#{pr.pr_number}")
-                return True
+                return (True, None, True)  # Async, will poll for SHA change
             except subprocess.CalledProcessError as e:
                 log_error(f"  Failed to trigger rebase: {e}")
-                return False
+                return (False, None, False)
 
-        # pre-commit.ci PRs use manual git rebase
+        # pre-commit.ci PRs use manual git rebase (sync)
         if pr.pr_author == "app/pre-commit-ci":
             log_info("  Manually rebasing pre-commit.ci PR via git operations")
             return self._manual_rebase(pr)
 
         # Unknown bot author
         log_error(f"  Unknown bot author: {pr.pr_author}, cannot rebase")
-        return False
+        return (False, None, False)
 
-    def _manual_rebase(self, pr: PRQueueItem) -> bool:
+    def _manual_rebase(self, pr: PRQueueItem) -> tuple[bool, str | None, bool]:
         """Manually rebase a PR branch via git operations.
 
         Clones the repo, checks out PR branch, rebases onto base, and force-pushes.
@@ -216,8 +219,11 @@ def _manual_rebase(self, pr: PRQueueItem) -> bool:
 
         Returns
         -------
-        bool
-            True on success, False on failure.
+        tuple[bool, str | None, bool]
+            (success, new_sha, sha_changed) where:
+            - success: True if rebase succeeded, False on failure
+            - new_sha: New head SHA after rebase (None on failure)
+            - sha_changed: True if rebase created new commits, False if already up-to-date
 
         """
         try:
@@ -313,6 +319,16 @@ def _manual_rebase(self, pr: PRQueueItem) -> bool:
                     capture_output=True,
                 )
 
+                # Get SHA before rebase
+                result = subprocess.run(
+                    ["git", "rev-parse", "HEAD"],
+                    cwd=repo_dir,
+                    check=True,
+                    capture_output=True,
+                    text=True,
+                )
+                sha_before = result.stdout.strip()
+
                 # Fetch latest base branch
                 subprocess.run(
                     ["git", "fetch", "origin", base_ref],
@@ -330,7 +346,26 @@ def _manual_rebase(self, pr: PRQueueItem) -> bool:
                     capture_output=True,
                 )
 
-                # Force push to PR branch
+                # Get SHA after rebase
+                result = subprocess.run(
+                    ["git", "rev-parse", "HEAD"],
+                    cwd=repo_dir,
+                    check=True,
+                    capture_output=True,
+                    text=True,
+                )
+                sha_after = result.stdout.strip()
+
+                # Check if rebase created new commits
+                sha_changed = sha_after != sha_before
+
+                if not sha_changed:
+                    log_success(
+                        f"  Branch already up-to-date with {base_ref}, no rebase needed"
+                    )
+                    return (True, sha_after, False)
+
+                # Force push to PR branch (only if SHA changed)
                 # Using --force instead of --force-with-lease because the shallow clone
                 # doesn't set up remote tracking properly, causing "stale info" errors.
                 # This is safe because we just fetched and we're the only ones modifying
@@ -344,16 +379,16 @@ def _manual_rebase(self, pr: PRQueueItem) -> bool:
                 )
 
                 log_success(f"  Successfully rebased {pr.repo}#{pr.pr_number}")
-                return True
+                return (True, sha_after, True)
 
         except subprocess.CalledProcessError as e:
             log_error(f"  Failed to manually rebase: {e}")
             if e.stderr:
                 log_error(f"  Error output: {e.stderr.decode()}")
-            return False
+            return (False, None, False)
         except Exception as e:
             log_error(f"  Unexpected error during manual rebase: {e}")
-            return False
+            return (False, None, False)
 
     def trigger_fix_workflow(self, pr: PRQueueItem) -> str | None:
         """Trigger fix-remote-pr.yml workflow.