|
from logging import Logger
from typing import Any, Dict, Iterable, Optional, Set, Union

import numpy as np
import pandas as pd

from ax.core.base_trial import BaseTrial
from ax.core.batch_trial import BatchTrial
from ax.core.experiment import Experiment
from ax.core.map_data import MapData, MapKeyInfo
from ax.core.map_metric import MapMetric
from ax.core.metric import Metric, MetricFetchE, MetricFetchResult
from ax.core.trial import Trial
from ax.early_stopping.utils import align_partial_results
from ax.exceptions.core import UnsupportedError
from ax.utils.common.logger import get_logger
from ax.utils.common.result import Err, Ok
from ax.utils.common.typeutils import checked_cast
35 | 31 |
|
36 | 32 | logger: Logger = get_logger(__name__)
|
37 | 33 |
|
@@ -268,66 +264,6 @@ def get_df_from_curve_series(
|
268 | 264 | )
|
269 | 265 |
|
270 | 266 |
|
271 |
| -class AbstractScalarizedCurveMetric(AbstractCurveMetric): |
272 |
| - """A linear scalarization of (partial) learning curves of ML model training jobs: |
273 |
| -
|
274 |
| - scalarized_curve = offset + sum_i(coefficients[i] * curve[i]). |
275 |
| -
|
276 |
| - It is assumed that the output of `get_curves_from_ids` contains all of the curves |
277 |
| - necessary for performing the scalarization. |
278 |
| - """ |
279 |
| - |
280 |
| - def __init__( |
281 |
| - self, |
282 |
| - name: str, |
283 |
| - coefficients: Dict[str, float], |
284 |
| - offset: float = 0.0, |
285 |
| - lower_is_better: bool = True, |
286 |
| - cumulative_best: bool = False, |
287 |
| - smoothing_window: Optional[int] = None, |
288 |
| - ) -> None: |
289 |
| - """Construct a AbstractScalarizedCurveMetric. |
290 |
| -
|
291 |
| - Args: |
292 |
| - name: Name of metric. |
293 |
| - coefficients: A mapping from learning curve names to their |
294 |
| - scalarization coefficients. |
295 |
| - offset: The offset of the affine scalarization. |
296 |
| - lower_is_better: If True, lower values (of the scalarized metric) are |
297 |
| - considered better. |
298 |
| - cumulative_best: If True, for each trial, apply cumulative best to |
299 |
| - the curve (i.e., if lower is better, then we return a curve |
300 |
| - representing the cumulative min of the raw curve). |
301 |
| - smoothing_window: If not None, specifies the window size used for a |
302 |
| - rolling mean applied to the raw curve data. This can be helpful |
303 |
| - if the underlying data is expected to be very noisy. |
304 |
| - """ |
305 |
| - MapMetric.__init__(self, name=name, lower_is_better=lower_is_better) |
306 |
| - self.coefficients = coefficients |
307 |
| - self.offset = offset |
308 |
| - self.cumulative_best = cumulative_best |
309 |
| - self.smoothing_window = smoothing_window |
310 |
| - |
311 |
| - @property |
312 |
| - def curve_names(self) -> Set[str]: |
313 |
| - return set(self.coefficients.keys()) |
314 |
| - |
315 |
| - def get_df_from_curve_series( |
316 |
| - self, |
317 |
| - experiment: Experiment, |
318 |
| - all_curve_series: Dict[Union[int, str], Dict[str, pd.Series]], |
319 |
| - metrics: Iterable[Metric], |
320 |
| - trial_idx_to_id: Dict[int, Union[int, str]], |
321 |
| - ) -> Optional[pd.DataFrame]: |
322 |
| - return get_df_from_scalarized_curve_series( |
323 |
| - experiment=experiment, |
324 |
| - all_curve_series=all_curve_series, |
325 |
| - metrics=metrics, |
326 |
| - trial_idx_to_id=trial_idx_to_id, |
327 |
| - map_key=self.map_key_info.key, |
328 |
| - ) |
329 |
| - |
330 |
| - |
331 | 267 | def get_df_from_curve_series(
|
332 | 268 | experiment: Experiment,
|
333 | 269 | all_curve_series: Dict[Union[int, str], Dict[str, pd.Series]],
|
@@ -377,91 +313,6 @@ def get_df_from_curve_series(
|
377 | 313 | return pd.concat(dfs, axis=0, ignore_index=True)
|
378 | 314 |
|
379 | 315 |
|
380 |
def get_df_from_scalarized_curve_series(
    experiment: Experiment,
    all_curve_series: Dict[Union[int, str], Dict[str, pd.Series]],
    metrics: Iterable[Metric],
    trial_idx_to_id: Dict[int, Union[int, str]],
    map_key: str,
) -> Optional[pd.DataFrame]:
    """Convert a `all_curve_series` dict (from `get_curves_from_ids`) into
    a dataframe. For each metric, we first get all curves represented in
    `coefficients` and then perform scalarization.

    Args:
        experiment: The experiment.
        all_curve_series: A dict containing curve data, as output from
            `get_curves_from_ids`.
        metrics: The metrics from which data is being fetched. Expected to be
            scalarized curve metrics exposing `coefficients`, `cumulative_best`,
            and `smoothing_window` (hence the pyre-ignores below).
        trial_idx_to_id: A dict mapping trial index to ids.
        map_key: The progression key of the metric's MapKeyInfo.

    Returns:
        A dataframe containing curve data or None if no curve data could be found.
    """
    dfs = []
    # Per-trial record of metrics whose *complete* set of underlying curves
    # was found; only these metrics get scalarized for that trial below.
    complete_metrics_by_trial = {trial_idx: [] for trial_idx in trial_idx_to_id.keys()}
    # NOTE(review): `metrics` is iterated once per trial, so it must be a
    # re-iterable container rather than a one-shot generator — confirm callers.
    for trial_idx, id_ in trial_idx_to_id.items():
        if id_ not in all_curve_series:
            logger.info(f"Could not get curve data for id {id_}. Ignoring.")
            continue
        curve_series = all_curve_series[id_]
        for m in metrics:
            curve_dfs = []
            for curve_name in m.coefficients.keys():  # pyre-ignore[16]
                if curve_name in curve_series:
                    curve_df = _get_single_curve(
                        curve_series=curve_series,
                        curve_name=curve_name,
                        map_key=map_key,
                        trial=experiment.trials[trial_idx],
                        cumulative_best=m.cumulative_best,  # pyre-ignore[16]
                        lower_is_better=m.lower_is_better,  # pyre-ignore[6]
                        smoothing_window=m.smoothing_window,  # pyre-ignore[16]
                    )
                    curve_dfs.append(curve_df)
                else:
                    # A missing curve makes the scalarization ill-defined, so
                    # abandon this metric for this trial.
                    logger.info(
                        f"{curve_name} not present in curves from {id_}, so the "
                        f"scalarization for {m.name} cannot be computed. Returning "
                        "without this metric."
                    )
                    break
            if len(curve_dfs) == len(m.coefficients):
                # only keep if all curves needed by the metric are available
                dfs.extend(curve_dfs)
                # mark metrics who have all underlying curves
                complete_metrics_by_trial[trial_idx].append(m)

    if len(dfs) == 0:
        return None

    all_data_df = pd.concat(dfs, axis=0, ignore_index=True)
    sub_dfs = []
    # Do not create a common index across trials, only across the curves
    # involved in the scalarized metric.
    for trial_idx, dfi in all_data_df.groupby("trial_index"):
        # the `do_forward_fill = True` pads with the latest
        # observation to handle situations where learning curves
        # report different amounts of data.
        trial_curves = dfi["metric_name"].unique().tolist()
        dfs_mean, dfs_sem = align_partial_results(
            dfi,
            progr_key=map_key,
            metrics=trial_curves,
            do_forward_fill=True,
        )
        for metric in complete_metrics_by_trial[trial_idx]:
            sub_df = _get_scalarized_curve_metric_sub_df(
                dfs_mean=dfs_mean,
                dfs_sem=dfs_sem,
                metric=metric,
                # checked_cast enforces a (non-batch) Trial here; BatchTrials
                # would raise.
                trial=checked_cast(Trial, experiment.trials[trial_idx]),
            )
            sub_dfs.append(sub_df)
    return pd.concat(sub_dfs, axis=0, ignore_index=True)
465 | 316 | def _get_single_curve(
|
466 | 317 | curve_series: Dict[str, pd.Series],
|
467 | 318 | curve_name: str,
|
@@ -492,51 +343,3 @@ def _get_single_curve(
|
492 | 343 | dfi["mean"] = dfi["mean"].cummin() if lower_is_better else dfi["mean"].cummax()
|
493 | 344 | # pyre-fixme[7]: Expected `DataFrame` but got `Optional[DataFrame]`.
|
494 | 345 | return dfi.drop_duplicates()
|
495 |
| - |
496 |
| - |
497 |
def _get_scalarized_curve_metric_sub_df(
    dfs_mean: Dict[str, pd.DataFrame],
    dfs_sem: Dict[str, pd.DataFrame],
    metric: "AbstractScalarizedCurveMetric",
    trial: "Trial",
) -> pd.DataFrame:
    """Helper to construct sub-dfs for a ScalarizedCurveMetric.

    Args:
        dfs_mean: A mapping from curve metric names to a dataframe
            containing the means of the respective metric. The progression
            indices are assumed to be aligned across metrics (e.g. as
            obtained via `align_partial_results`).
        dfs_sem: A mapping from curve metric names to a dataframe
            containing the sems of the respective metric. If empty,
            assume the metrics are subject to noise of unknown magnitude.
        metric: The ScalarizedCurveMetric to perform the aggregation for.
        trial: The trial associated with the data in `dfs_mean` and `dfs_sem`.

    Returns:
        A dataframe with the scalarized mean and sem in `mean` and `sem`
        columns, respectively.
    """
    # Affine combination of the aligned mean curves. The loop variable is
    # `curve_name` (not `metric`) so it does not shadow the `metric` argument,
    # which the original implementation did.
    sub_df = metric.offset + sum(
        coeff * dfs_mean[curve_name]
        for curve_name, coeff in metric.coefficients.items()
    )
    # Each aligned per-trial frame has a single column named by the trial index.
    sub_df = sub_df.rename(columns={trial.index: "mean"})  # pyre-ignore [16]
    if dfs_sem:
        # Variance of the linear combination: sum of squared weighted sems
        # (curves treated as independent), then take the square root.
        var_df = sum(
            (coeff * dfs_sem[curve_name]) ** 2
            for curve_name, coeff in metric.coefficients.items()
        )
        sem_df = var_df.apply(np.sqrt).rename(  # pyre-ignore [16]
            columns={trial.index: "sem"}
        )
        sub_df = pd.concat([sub_df, sem_df], axis=1)
    else:
        # No sem information available for the underlying curves.
        sub_df["sem"] = float("nan")
    sub_df = sub_df.reset_index()
    sub_df["trial_index"] = trial.index
    sub_df["arm_name"] = trial.arm.name  # pyre-ignore [16]
    sub_df["metric_name"] = metric.name
    # When scalarizing curves, sometimes the last progression will be different
    # across curves, even for the same trial. This dropna() will only keep the
    # progressions that are available for all curves.
    return sub_df.dropna(subset=["mean"])
0 commit comments