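Improve structure: make identify_continuous_periods a static method and pass grouper explicitly to _date_to_period_agg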

spjuhel · spjuhel · commit 5ab8bda38a3f · 2025-09-16T15:12:54.000+02:00
diff --git a/climada/trajectories/risk_trajectory.py b/climada/trajectories/risk_trajectory.py
@@ -288,7 +288,7 @@ def _compute_period_metrics(
         df = self._generic_metrics(
             npv=npv, metric_name=metric_name, metric_meth=metric_meth, **kwargs
         )
-        return self._date_to_period_agg(df)
+        return self._date_to_period_agg(df, grouper=self._grouper)
 
     def _compute_metrics(
         self, metric_name: str, metric_meth: str, npv: bool = True, **kwargs
@@ -506,47 +506,47 @@ def _get_risk_periods(
             )
         ]
 
+    @staticmethod
+    def identify_continuous_periods(group, time_unit):
+        # Calculate the difference between consecutive dates
+        if time_unit == "year":
+            group["date_diff"] = group["date"].dt.year.diff()
+        if time_unit == "month":
+            group["date_diff"] = group["date"].dt.month.diff()
+        if time_unit == "day":
+            group["date_diff"] = group["date"].dt.day.diff()
+        if time_unit == "hour":
+            group["date_diff"] = group["date"].dt.hour.diff()
+        # Identify breaks in continuity
+        group["period_id"] = (group["date_diff"] != 1).cumsum()
+        return group
+
     @classmethod
     def _date_to_period_agg(
         cls,
         df: pd.DataFrame,
+        grouper: list[str],
         time_unit: str = "year",
         colname: str | list[str] = "risk",
     ) -> pd.DataFrame | pd.Series:
         """Groups per date risk metric to periods."""
 
         ## I'm thinking this does not work with RPs... As you can't just sum impacts
         ## Not sure what to do with it. -> Fixed I take the avg RP impact of the period
-
-        def identify_continuous_periods(group, time_unit):
-            # Calculate the difference between consecutive dates
-            if time_unit == "year":
-                group["date_diff"] = group["date"].dt.year.diff()
-            if time_unit == "month":
-                group["date_diff"] = group["date"].dt.month.diff()
-            if time_unit == "day":
-                group["date_diff"] = group["date"].dt.day.diff()
-            if time_unit == "hour":
-                group["date_diff"] = group["date"].dt.hour.diff()
-            # Identify breaks in continuity
-            group["period_id"] = (group["date_diff"] != 1).cumsum()
-            return group
-
         def conditional_agg(group):
             if "rp" in group.name[2]:
                 return group.mean()
             else:
                 return group.sum()
 
-        grouper = cls._grouper
         if "group" in df.columns and "group" not in grouper:
             grouper = ["group"] + grouper
 
         df_sorted = df.sort_values(by=cls._grouper + ["date"])
         # Apply the function to identify continuous periods
         df_periods = df_sorted.groupby(
             grouper, dropna=False, group_keys=False, observed=True
-        ).apply(identify_continuous_periods, time_unit)
+        ).apply(cls.identify_continuous_periods, time_unit)
 
         if isinstance(colname, str):
             colname = [colname]
@@ -572,7 +572,7 @@ def conditional_agg(group):
             df_periods.groupby(grouper + ["period_id"], dropna=False, observed=True)[
                 colname
             ]
-            .apply(lambda group: conditional_agg(group))
+            .apply(conditional_agg)
             .reset_index()
         )
         df_periods = pd.merge(
@@ -588,7 +588,7 @@ def per_period_risk_metrics(
     ) -> pd.DataFrame | pd.Series:
         """Returns a tidy dataframe of the risk metrics with the total for each different period."""
         df = self.per_date_risk_metrics(metrics=metrics, **kwargs)
-        return self._date_to_period_agg(df, **kwargs)
+        return self._date_to_period_agg(df, grouper=self._grouper, **kwargs)
 
     def _calc_waterfall_plot_data(
         self,
diff --git a/climada/trajectories/test/test_risk_trajectory.py b/climada/trajectories/test/test_risk_trajectory.py
@@ -660,7 +660,7 @@ def test_per_period_risk_multiple_risk_cols(self):
             }
         )
         result_df = RiskTrajectory._date_to_period_agg(
-            df_input, colname=["base risk", "exposure contribution"]
+            df_input, col_agg_dict=["base risk", "exposure contribution"]
         )
 
         expected_df = pd.DataFrame(

Original file line number	Diff line number	Diff line change
`@@ -660,7 +660,7 @@ def test_per_period_risk_multiple_risk_cols(self):`
`660`	`660`	`}`
`661`	`661`	`)`
`662`	`662`	`result_df = RiskTrajectory._date_to_period_agg(`
`663`		`- df_input, colname=["base risk", "exposure contribution"]`
	`663`	`+ df_input, col_agg_dict=["base risk", "exposure contribution"]`
`664`	`664`	`)`
`665`	`665`
`666`	`666`	`expected_df = pd.DataFrame(`