[benchmarking] Updates Slack sink to address table size limitation (#1480)

rlratzel · web-flow · commit eeaa0a5a6f95 · 2026-02-17T17:47:10.000Z
diff --git a/benchmarking/Dockerfile b/benchmarking/Dockerfile
@@ -36,6 +36,7 @@ RUN cd /opt/Curator \
     pynvml \
     pyyaml \
     rich \
+    slack_sdk \
   && uv cache prune
 
 # Add the Curator repo to the safe.directory list to avoid GitPython warnings
diff --git a/benchmarking/README.md b/benchmarking/README.md
@@ -148,7 +148,7 @@ sinks:
     experiment: my-experiment
   - name: slack
     enabled: true
-    webhook_url: ${SLACK_WEBHOOK_URL}
+    channel_id: ${SLACK_CHANNEL_ID}
     default_metrics: ["exec_time_s"]  # Metrics to report by default for all entries
   - name: gdrive
     enabled: false
@@ -223,7 +223,7 @@ Configuration values can reference environment variables using `${VAR_NAME}` syn
 results_path: "${HOME}/benchmarks/results"
 sinks:
   - name: slack
-    webhook_url: ${SLACK_WEBHOOK_URL}
+    channel_id: ${SLACK_CHANNEL_ID}
   - name: mlflow
     tracking_uri: ${MLFLOW_TRACKING_URI}
 ```
@@ -311,7 +311,7 @@ This command:
 - Reads the configuration file and extracts `results_path` and `datasets_path`
 - Automatically creates volume mounts to map these paths into the container
 - Runs the benchmarking framework with the Curator code built into the Docker image
-- Passes environment variables like `SLACK_WEBHOOK_URL` and `MLFLOW_TRACKING_URI` to the container
+- Passes environment variables like `SLACK_BOT_TOKEN`, `SLACK_CHANNEL_ID`, and `MLFLOW_TRACKING_URI` to the container
 
 ### Using Host Curator Sources
 
@@ -459,11 +459,13 @@ Posts results to Slack channels:
 ```yaml
 sinks:
   - name: slack
-    webhook_url: https://hooks.slack.com/services/YOUR/WEBHOOK/URL
+    channel_id: C1234567890  # Your Slack channel ID
     enabled: true
 ```
 
-Results are formatted as interactive Slack messages with environment info and metrics.
+Results are posted as interactive Slack messages with environment info and metrics. Requires:
+- `SLACK_BOT_TOKEN` environment variable set to your Slack Bot User OAuth Token
+- `channel_id` in the sink config (or the `SLACK_CHANNEL_ID` environment variable) set to the target channel's ID
 
 #### Google Drive Sink
 
diff --git a/benchmarking/nightly-benchmark.yaml b/benchmarking/nightly-benchmark.yaml
@@ -73,7 +73,8 @@ sinks:
 #    experiment: ray-curator-common-crawl
   - name: slack
     enabled: true
-    webhook_url: ${SLACK_WEBHOOK_URL}
+    live_updates: true
+    channel_id: ${SLACK_CHANNEL_ID}
     default_metrics: ["exec_time_s"]
 #  - name: gdrive
 #    enabled: false
diff --git a/benchmarking/run.py b/benchmarking/run.py
@@ -255,15 +255,15 @@ def run_entry(
             shutil.rmtree(scratch_path, ignore_errors=True)
 
 
-def main() -> int:  # noqa: C901
+def main() -> int:  # noqa: C901, PLR0912
     parser = argparse.ArgumentParser(description="Runs the benchmarking application")
     parser.add_argument(
         "--config",
         type=Path,
         action="append",
         required=True,
         help=(
-            "Path to YAML config for benchmark matrix, machine paths, etc. Can be "
+            "Path to YAML config for the benchmark entries, machine paths, etc. Can be "
             "specified multiple times to merge configs."
         ),
     )
@@ -322,7 +322,7 @@ def main() -> int:  # noqa: C901
     env_dict = dump_env(session_obj=session, output_path=session_path)
 
     for sink in session.sinks:
-        sink.initialize(session_name=session_name, matrix_config=session, env_dict=env_dict)
+        sink.initialize(session_name=session_name, session=session, env_dict=env_dict)
 
     # Print a summary of the entries that will be run in the for loop below
     # Disabled entries will not be printed
@@ -339,6 +339,10 @@ def main() -> int:  # noqa: C901
             "success": run_success,
         }
         logger.info(f"🚀 Running {entry.name} (run ID: {run_id})")
+
+        for sink in session.sinks:
+            sink.register_benchmark_entry_starting(result_dict=result_data, benchmark_entry=entry)
+
         try:
             run_success = run_entry(
                 entry=entry,
@@ -364,7 +368,7 @@ def main() -> int:  # noqa: C901
         finally:
             session_overall_success &= run_success
             for sink in session.sinks:
-                sink.process_result(result_dict=result_data, matrix_entry=entry)
+                sink.register_benchmark_entry_finished(result_dict=result_data, benchmark_entry=entry)
 
     for sink in session.sinks:
         sink.finalize()
diff --git a/benchmarking/runner/sinks/gdrive_sink.py b/benchmarking/runner/sinks/gdrive_sink.py
@@ -33,15 +33,15 @@ def __init__(self, sink_config: dict[str, Any]):
         super().__init__(sink_config)
         self.sink_config = sink_config
         self.results: list[dict[str, Any]] = []
-        self.session_name: str = None
-        self.matrix_config: Session = None
-        self.env_dict: dict[str, Any] = None
-        self.drive_folder_id: str = None
-        self.service_account_file: str = None
+        self.session_name: str | None = None
+        self.session: Session | None = None
+        self.env_dict: dict[str, Any] | None = None
+        self.drive_folder_id: str | None = None
+        self.service_account_file: str | None = None
 
-    def initialize(self, session_name: str, matrix_config: Session, env_dict: dict[str, Any]) -> None:
+    def initialize(self, session_name: str, session: Session, env_dict: dict[str, Any]) -> None:
         self.session_name = session_name
-        self.matrix_config = matrix_config
+        self.session = session
         self.env_dict = env_dict
         self.drive_folder_id = self.sink_config.get("drive_folder_id")
         if not self.drive_folder_id:
@@ -52,7 +52,10 @@ def initialize(self, session_name: str, matrix_config: Session, env_dict: dict[s
             msg = "GdriveSink: No service account file configured"
             raise ValueError(msg)
 
-    def process_result(self, result_dict: dict[str, Any], matrix_entry: Entry) -> None:
+    def register_benchmark_entry_starting(self, result_dict: dict[str, Any], benchmark_entry: Entry) -> None:
+        pass
+
+    def register_benchmark_entry_finished(self, result_dict: dict[str, Any], benchmark_entry: Entry) -> None:
         pass
 
     def finalize(self) -> None:
@@ -66,8 +69,8 @@ def finalize(self) -> None:
             self._delete_tar_file(tar_path)
 
     def _tar_results_and_artifacts(self) -> Path:
-        results_path = Path(self.matrix_config.results_path)
-        artifacts_path = Path(self.matrix_config.artifacts_dir)
+        results_path = Path(self.session.results_path)
+        artifacts_path = Path(self.session.artifacts_dir)
         tar_path = results_path / f"{self.session_name}.tar.gz"
         with tarfile.open(tar_path, "w:gz") as tar:
             tar.add(results_path, arcname=results_path.name)
diff --git a/benchmarking/runner/sinks/mlflow_sink.py b/benchmarking/runner/sinks/mlflow_sink.py
@@ -34,20 +34,23 @@ def __init__(self, sink_config: dict[str, Any]):
             msg = "MlflowSink: No experiment configured"
             raise ValueError(msg)
         self.results: list[dict[str, Any]] = []
-        self.session_name: str = None
-        self.matrix_config: Session = None
-        self.env_dict: dict[str, Any] = None
+        self.session_name: str | None = None
+        self.session: Session | None = None
+        self.env_dict: dict[str, Any] | None = None
 
-    def initialize(self, session_name: str, matrix_config: Session, env_dict: dict[str, Any]) -> None:
+    def initialize(self, session_name: str, session: Session, env_dict: dict[str, Any]) -> None:
         self.session_name = session_name
-        self.matrix_config = matrix_config
+        self.session = session
         self.env_dict = env_dict
 
-    def process_result(self, result_dict: dict[str, Any], matrix_entry: Entry) -> None:
-        # Use the matrix_entry to get any entry-specific settings for the Slack report
+    def register_benchmark_entry_starting(self, result_dict: dict[str, Any], benchmark_entry: Entry) -> None:
+        pass
+
+    def register_benchmark_entry_finished(self, result_dict: dict[str, Any], benchmark_entry: Entry) -> None:
+        # Use the benchmark_entry to get any entry-specific settings for the MLflow report
         # such as additional metrics to include in the report.
-        if matrix_entry:
-            additional_metrics = matrix_entry.get_sink_data(self.name).get("additional_metrics", [])
+        if benchmark_entry:
+            additional_metrics = benchmark_entry.get_sink_data(self.name).get("additional_metrics", [])
         else:
             additional_metrics = []
         self.results.append((additional_metrics, result_dict))
diff --git a/benchmarking/runner/sinks/sink.py b/benchmarking/runner/sinks/sink.py
@@ -33,24 +33,33 @@ def __init__(self, sink_config: dict[str, Any]):
     def initialize(
         self,
         session_name: str,
-        matrix_config: Session,
+        session: Session,
         env_dict: dict[str, Any],
     ) -> None:
         """Initialize the sink for a benchmark session.
 
         Args:
             session_name: Name of the benchmark session.
-            matrix_config: Session configuration for the session.
+            session: The Session object holding this benchmark session's configuration.
             env_dict: Environment dictionary for the session.
         """
 
     @abstractmethod
-    def process_result(self, result_dict: dict[str, Any], matrix_entry: Entry) -> None:
-        """Process an individual benchmark result.
+    def register_benchmark_entry_starting(self, result_dict: dict[str, Any], benchmark_entry: Entry) -> None:
+        """Register that a benchmark entry is starting.
+
+        Args:
+            result_dict: Dictionary containing benchmark entry data.
+            benchmark_entry: Entry configuration.
+        """
+
+    @abstractmethod
+    def register_benchmark_entry_finished(self, result_dict: dict[str, Any], benchmark_entry: Entry) -> None:
+        """Register that a benchmark entry has finished.
 
         Args:
             result_dict: Dictionary containing benchmark result data.
-            matrix_entry: Entry configuration.
+            benchmark_entry: Entry configuration.
         """
 
     @abstractmethod
diff --git a/benchmarking/runner/sinks/slack_sink.py b/benchmarking/runner/sinks/slack_sink.py
diff --git a/benchmarking/tools/run.sh b/benchmarking/tools/run.sh