stan-dev
diff --git a/cmdstanpy/cmdstan_args.py b/cmdstanpy/cmdstan_args.py
Lines changed: 4 additions & 0 deletions
diff --git a/cmdstanpy/stanfit/gq.py b/cmdstanpy/stanfit/gq.py
Lines changed: 3 additions & 3 deletions
diff --git a/cmdstanpy/stanfit/laplace.py b/cmdstanpy/stanfit/laplace.py
Lines changed: 3 additions & 1 deletion
diff --git a/cmdstanpy/stanfit/mcmc.py b/cmdstanpy/stanfit/mcmc.py
Lines changed: 50 additions & 23 deletions
diff --git a/cmdstanpy/stanfit/metadata.py b/cmdstanpy/stanfit/metadata.py
Lines changed: 48 additions & 2 deletions
diff --git a/cmdstanpy/stanfit/runset.py b/cmdstanpy/stanfit/runset.py
Lines changed: 24 additions & 0 deletions
diff --git a/cmdstanpy/utils/logging.py b/cmdstanpy/utils/logging.py
Lines changed: 3 additions & 1 deletion
@@ -273,6 +273,10 @@ def compose(self, idx: int, cmd: list[str]) -> list[str]:
             cmd.append(f'window={self.adapt_metric_window}')
         if self.adapt_step_size is not None:
             cmd.append('term_buffer={}'.format(self.adapt_step_size))
+        if self.adapt_engaged:
+            cmd.append('save_metric=1')
+        # End adapt subsection
+
         if self.num_chains > 1:
             cmd.append('num_chains={}'.format(self.num_chains))
 
 
@@ -423,18 +423,18 @@ def draws_xr(
 
     @overload
     def draws_xr(
-        self: "CmdStanGQ[CmdStanMCMC]",
+        self: CmdStanGQ[CmdStanMCMC],
         vars: str | list[str] | None = None,
         inc_warmup: bool = False,
         inc_sample: bool = False,
-    ) -> "xr.Dataset": ...
+    ) -> xr.Dataset: ...
 
     def draws_xr(
         self,
         vars: str | list[str] | None = None,
         inc_warmup: bool = False,
         inc_sample: bool = False,
-    ) -> "xr.Dataset":
+    ) -> xr.Dataset:
         """
         Returns the generated quantities draws as a xarray Dataset.
 
 
@@ -2,6 +2,8 @@
 Container for the result of running a laplace approximation.
 """
 
+from __future__ import annotations
+
 from typing import Any, Hashable, MutableMapping
 
 import numpy as np
@@ -197,7 +199,7 @@ def draws_pd(
     def draws_xr(
         self,
         vars: str | list[str] | None = None,
-    ) -> "xr.Dataset":
+    ) -> xr.Dataset:
         """
         Returns the sampler draws as a xarray Dataset.
 
 
@@ -2,6 +2,8 @@
 Container for the result of running the sample (MCMC) method
 """
 
+from __future__ import annotations
+
 import math
 import os
 from io import StringIO
@@ -31,7 +33,7 @@
     stancsv,
 )
 
-from .metadata import InferenceMetadata
+from .metadata import InferenceMetadata, MetricInfo
 from .runset import RunSet
 
 
@@ -81,6 +83,7 @@ def __init__(
         # info from CSV values, instantiated lazily
         self._draws: np.ndarray = np.array(())
         # only valid when not is_fixed_param
+        self._metric_type: str | None = None
         self._metric: np.ndarray = np.array(())
         self._step_size: np.ndarray = np.array(())
         self._divergences: np.ndarray = np.zeros(self.runset.chains, dtype=int)
@@ -92,6 +95,8 @@ def __init__(
         # info from CSV header and initial and final comment blocks
         config = self._validate_csv_files()
         self._metadata: InferenceMetadata = InferenceMetadata(config)
+        self._chain_metric_info: list[MetricInfo] = []
+
         if not self._is_fixed_param:
             self._check_sampler_diagnostics()
 
@@ -216,11 +221,13 @@ def metric_type(self) -> str | None:
         to CmdStan arg 'metric'.
         When sampler algorithm 'fixed_param' is specified, metric_type is None.
         """
-        return (
-            self._metadata.cmdstan_config['metric']
-            if not self._is_fixed_param
-            else None
-        )
+        if self._is_fixed_param:
+            return None
+
+        if self._metric_type is None:
+            self._parse_metric_info()
+
+        return self._metric_type
 
     @property
     def inv_metric(self) -> np.ndarray | None:
@@ -230,10 +237,15 @@ def inv_metric(self) -> np.ndarray | None:
         a ``nchains x nparams x nparams`` array when metric_type is 'dense_e',
         or ``None`` when metric_type is 'unit_e' or algorithm is 'fixed_param'.
         """
-        if self._is_fixed_param or self.metric_type == 'unit_e':
+        if self._is_fixed_param:
+            return None
+
+        if self._metric_type is None:
+            self._parse_metric_info()
+
+        if self.metric_type == 'unit_e':
             return None
 
-        self._assemble_draws()
         return self._metric
 
     @property
@@ -242,8 +254,13 @@ def step_size(self) -> np.ndarray | None:
         Step size used by sampler for each chain.
         When sampler algorithm 'fixed_param' is specified, step size is None.
         """
-        self._assemble_draws()
-        return self._step_size if not self._is_fixed_param else None
+        if self._is_fixed_param:
+            return None
+
+        if self._metric_type is None:
+            self._parse_metric_info()
+
+        return self._step_size
 
     @property
     def thin(self) -> int:
@@ -382,6 +399,27 @@ def _validate_csv_files(self) -> dict[str, Any]:
                     self._max_treedepths[i] = drest['ct_max_treedepth']
         return dzero
 
+    def _parse_metric_info(self) -> None:
+        """
+        Load the per-chain metric JSON files and cache their contents.
+
+        Each path in ``self.runset.metric_files`` is read and validated as
+        a :class:`MetricInfo`.  On success the shared metric type, the
+        stacked per-chain inverse metrics, and the per-chain step sizes
+        are stored on the instance; on failure no cached value is changed.
+
+        :raises ValueError: if the run lists no metric files, or if the
+            chains do not all report the same metric type.
+        """
+        # NOTE(review): the sampler args only append ``save_metric=1`` when
+        # adaptation is engaged - confirm these files exist otherwise.
+        chain_info: list[MetricInfo] = []
+        for mf in self.runset.metric_files:
+            # JSON is UTF-8 by specification; don't depend on the locale.
+            with open(mf, encoding="utf-8") as f:
+                chain_info.append(MetricInfo.model_validate_json(f.read()))
+
+        # Without this guard an empty file list would be reported below as
+        # "inconsistent" metric types, which hides the real problem.
+        if not chain_info:
+            raise ValueError("No metric files found for this run")
+
+        metric_types = {cmi.metric_type for cmi in chain_info}
+        if len(metric_types) != 1:
+            raise ValueError("Inconsistent metric types found across chains")
+
+        # Publish results only after every file has parsed and validated.
+        self._chain_metric_info = chain_info
+        self._metric_type = chain_info[0].metric_type
+        self._metric = np.asarray([cmi.inv_metric for cmi in chain_info])
+        self._step_size = np.asarray([cmi.stepsize for cmi in chain_info])
+
     def _check_sampler_diagnostics(self) -> None:
         """
         Warn if any iterations ended in divergences or hit maxtreedepth.
@@ -424,13 +462,11 @@ def _assemble_draws(self) -> None:
             dtype=np.float64,
             order='F',
         )
-        self._step_size = np.empty(self.chains, dtype=np.float64)
 
-        mass_matrix_per_chain = []
         for chain in range(self.chains):
             try:
                 (
-                    comments,
+                    _,
                     header,
                     draws,
                 ) = stancsv.parse_comments_header_and_draws(
@@ -443,20 +479,11 @@ def _assemble_draws(self) -> None:
                     draws_np = np.empty((0, n_cols))
 
                 self._draws[:, chain, :] = draws_np
-                if not self._is_fixed_param:
-                    (
-                        self._step_size[chain],
-                        mass_matrix,
-                    ) = stancsv.parse_hmc_adaptation_lines(comments)
-                    mass_matrix_per_chain.append(mass_matrix)
             except Exception as exc:
                 raise ValueError(
                     f"Parsing output from {self.runset.csv_files[chain]} failed"
                 ) from exc
 
-        if all(mm is not None for mm in mass_matrix_per_chain):
-            self._metric = np.array(mass_matrix_per_chain)
-
         assert self._draws is not None
 
     def summary(
@@ -652,7 +679,7 @@ def draws_pd(
 
     def draws_xr(
         self, vars: str | list[str] | None = None, inc_warmup: bool = False
-    ) -> "xr.Dataset":
+    ) -> xr.Dataset:
         """
         Returns the sampler draws as a xarray Dataset.
 
 
@@ -1,10 +1,14 @@
 """Container for metadata parsed from the output of a CmdStan run"""
 
+from __future__ import annotations
+
 import copy
+import math
 import os
-from typing import Any, Iterator
+from typing import Any, Iterator, Literal
 
 import stanio
+from pydantic import BaseModel, field_validator, model_validator
 
 from cmdstanpy.utils import stancsv
 
@@ -34,7 +38,7 @@ def __init__(
     @classmethod
     def from_csv(
         cls, stan_csv: str | os.PathLike | Iterator[bytes]
-    ) -> 'InferenceMetadata':
+    ) -> InferenceMetadata:
         try:
             comments, header, _ = stancsv.parse_comments_header_and_draws(
                 stan_csv
@@ -79,3 +83,45 @@ def stan_vars(self) -> dict[str, stanio.Variable]:
         These are the user-defined variables in the Stan program.
         """
         return self._stan_vars
+
+
+class MetricInfo(BaseModel):
+    """Validated contents of a single chain's CmdStan metric JSON output.
+
+    Carries the step size, the metric type, and the inverse metric, and
+    verifies that the inverse metric's shape agrees with the metric type.
+    """
+
+    stepsize: float
+    metric_type: Literal["diag_e", "dense_e", "unit_e"]
+    inv_metric: list[float] | list[list[float]]
+
+    @field_validator("stepsize")
+    @classmethod
+    def validate_stepsize(cls, v: float) -> float:
+        """Accept NaN or a strictly positive step size; reject the rest."""
+        if math.isnan(v) or v > 0:
+            return v
+        raise ValueError("stepsize must be greater than 0 or NaN")
+
+    @model_validator(mode="after")
+    def validate_inv_metric_shape(self) -> MetricInfo:
+        """Check that ``inv_metric`` has the rank its metric type requires.
+
+        ``diag_e`` and ``unit_e`` need a flat list; ``dense_e`` needs a
+        square list of non-empty rows.  An empty ``inv_metric`` is accepted
+        for every metric type.
+        """
+        rows = self.inv_metric
+        if not rows:
+            # Nothing to check, e.g. a model with no parameters.
+            return self
+
+        # The first element decides whether this is a vector or a matrix.
+        flat = isinstance(rows[0], float)
+
+        if self.metric_type == "dense_e":
+            if flat:
+                raise ValueError("Dense inv_metric must be 2D")
+
+            # Empty rows are reported before the squareness check so they
+            # get their own, more specific message.
+            for row in rows:
+                if not row:
+                    raise ValueError(
+                        "Dense inv_metric cannot contain empty rows"
+                    )
+
+            side = len(rows)
+            for row in rows:
+                if len(row) != side:  # type: ignore
+                    raise ValueError("Dense inv_metric must be square")
+        elif self.metric_type in ("diag_e", "unit_e"):
+            if not flat:
+                raise ValueError(
+                    "inv_metric must be 1D for diag_e and unit_e metric type"
+                )
+
+        return self
@@ -57,6 +57,7 @@ def __init__(
         self._stdout_files, self._profile_files = [], []
         self._csv_files, self._diagnostic_files = [], []
         self._config_files = []
+        self._metric_files = []
 
         # per-process output files
         if one_process_per_chain and chains > 1:
@@ -87,6 +88,10 @@ def __init__(
         # per-chain output files
         if chains == 1:
             self._csv_files = [self.gen_file_name(".csv")]
+            if args.method == Method.SAMPLE:
+                self._metric_files = [
+                    self.gen_file_name(".json", extra="metric")
+                ]
             if args.save_latent_dynamics:
                 self._diagnostic_files = [
                     self.gen_file_name(".csv", extra="diagnostic")
@@ -95,6 +100,20 @@ def __init__(
             self._csv_files = [
                 self.gen_file_name(".csv", id=id) for id in self._chain_ids
             ]
+            if args.method == Method.SAMPLE:
+                if one_process_per_chain:
+                    self._metric_files = [
+                        os.path.join(
+                            self._outdir,
+                            f"{self._base_outfile}_{id}_metric.json",
+                        )
+                        for id in self._chain_ids
+                    ]
+                else:
+                    self._metric_files = [
+                        self.gen_file_name(".json", extra="metric", id=id)
+                        for id in self._chain_ids
+                    ]
             if args.save_latent_dynamics:
                 self._diagnostic_files = [
                     self.gen_file_name(".csv", extra="diagnostic", id=id)
@@ -222,6 +241,11 @@ def profile_files(self) -> list[str]:
         """List of paths to CmdStan profiler files."""
         return self._profile_files
 
+    @property
+    def metric_files(self) -> list[str]:
+        """
+        List of paths to CmdStan NUTS-HMC sampler metric files.
+
+        Returns the list built when the run set is constructed; the files
+        themselves are not opened or checked for existence here.
+        """
+        return self._metric_files
+
     def gen_file_name(
         self, suffix: str, *, extra: str = "", id: int | None = None
     ) -> str:
 
@@ -2,6 +2,8 @@
 CmdStanPy logging
 """
 
+from __future__ import annotations
+
 import functools
 import logging
 import types
@@ -39,7 +41,7 @@ def __init__(self, disable: bool) -> None:
     def __repr__(self) -> str:
         return ""
 
-    def __enter__(self) -> "ToggleLogging":
+    def __enter__(self) -> ToggleLogging:
         self.logger.disabled = self.disable
         return self