Merge pull request #75 from scipp/stitch-curves

jokasimr · web-flow · commit 9c7e949a915e · 2024-09-23T09:45:06.000+02:00
feat: add basic stitching procedure
diff --git a/docs/api-reference/index.md b/docs/api-reference/index.md
@@ -32,6 +32,7 @@
    orso
    supermirror
    types
+   tools
 ```
 
 ## Amor
diff --git a/docs/user-guide/amor/amor-reduction.ipynb b/docs/user-guide/amor/amor-reduction.ipynb
@@ -163,6 +163,31 @@
     "sc.plot(results, norm='log', vmin=1e-4)"
    ]
   },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from ess.reflectometry.tools import scale_reflectivity_curves_to_overlap\n",
+    "results_scaled = dict(zip(\n",
+    "    results.keys(),\n",
+    "    scale_reflectivity_curves_to_overlap(results.values()),\n",
+    "    strict=True\n",
+    "))\n",
+    "sc.plot(results_scaled, norm='log', vmin=1e-5)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "from ess.reflectometry.tools import combine_curves\n",
+    "combine_curves(results_scaled.values(), workflow.compute(QBins)).plot(norm='log')"
+   ]
+  },
   {
    "cell_type": "markdown",
    "metadata": {},
@@ -354,7 +379,8 @@
    "mimetype": "text/x-python",
    "name": "python",
    "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3"
+   "pygments_lexer": "ipython3",
+   "version": "3.10.14"
   }
  },
  "nbformat": 4,
diff --git a/requirements/base.txt b/requirements/base.txt
@@ -53,7 +53,7 @@ jedi==0.19.1
     # via ipython
 jupyterlab-widgets==3.0.13
     # via ipywidgets
-kiwisolver==1.4.6
+kiwisolver==1.4.7
     # via matplotlib
 locket==1.0.0
     # via partd
diff --git a/requirements/nightly.txt b/requirements/nightly.txt
@@ -52,7 +52,7 @@ jedi==0.19.1
     # via ipython
 jupyterlab-widgets==3.0.13
     # via ipywidgets
-kiwisolver==1.4.6
+kiwisolver==1.4.7
     # via matplotlib
 locket==1.0.0
     # via partd
diff --git a/src/ess/reflectometry/tools.py b/src/ess/reflectometry/tools.py
@@ -1,7 +1,11 @@
 # SPDX-License-Identifier: BSD-3-Clause
 # Copyright (c) 2023 Scipp contributors (https://github.com/scipp)
+from collections.abc import Sequence
+from itertools import chain
+
 import numpy as np
 import scipp as sc
+import scipy.optimize as opt
 
 _STD_TO_FWHM = sc.scalar(2.0) * sc.sqrt(sc.scalar(2.0) * sc.log(sc.scalar(2.0)))
 
@@ -108,3 +112,161 @@ def linlogspace(
         grids.append(mesh[dim, start:])
 
     return sc.concat(grids, dim)
+
+
+def _sort_by(a, by):
+    return [x for x, _ in sorted(zip(a, by, strict=True), key=lambda x: x[1])]
+
+
+def _find_interval_overlaps(intervals):
+    '''Returns the intervals where at least
+    two or more of the provided intervals
+    are overlapping.'''
+    edges = list(chain.from_iterable(intervals))
+    is_start_edge = list(chain.from_iterable((True, False) for _ in intervals))
+    edges_sorted = sorted(edges)
+    is_start_edge_sorted = _sort_by(is_start_edge, edges)
+
+    number_overlapping = 0
+    overlap_intervals = []
+    for x, is_start in zip(edges_sorted, is_start_edge_sorted, strict=True):
+        if number_overlapping == 1 and is_start:
+            start = x
+        if number_overlapping == 2 and not is_start:
+            overlap_intervals.append((start, x))
+        if is_start:
+            number_overlapping += 1
+        else:
+            number_overlapping -= 1
+    return overlap_intervals
+
+
+def _searchsorted(a, v):
+    for i, e in enumerate(a):
+        if e > v:
+            return i
+    return len(a)
+
+
+def _create_qgrid_where_overlapping(qgrids):
+    '''Given a number of Q-grids, construct a new grid
+    covering the regions where (any two of the) provided grids overlap.'''
+    pieces = []
+    for start, end in _find_interval_overlaps([(q.min(), q.max()) for q in qgrids]):
+        interval_sliced_from_qgrids = [
+            q[max(_searchsorted(q, start) - 1, 0) : _searchsorted(q, end) + 1]
+            for q in qgrids
+        ]
+        densest_grid_in_interval = max(interval_sliced_from_qgrids, key=len)
+        pieces.append(densest_grid_in_interval)
+    return sc.concat(pieces, dim='Q')
+
+
+def _interpolate_on_qgrid(curves, grid):
+    return sc.concat(
+        [sc.lookup(c, grid.dim)[sc.midpoints(grid)] for c in curves], dim='curves'
+    )
+
+
+def scale_reflectivity_curves_to_overlap(
+    curves: Sequence[sc.DataArray],
+    return_scaling_factors=False,
+) -> list[sc.DataArray] | list[sc.scalar]:
+    '''Make the curves overlap by scaling all except the first by a factor.
+    The scaling factors are determined by a maximum likelihood estimate
+    (assuming the errors are normal distributed).
+
+    All curves must be have the same unit for data and the Q-coordinate.
+
+    Parameters
+    ---------
+    curves:
+        the reflectivity curves that should be scaled together
+    return_scaling_factor:
+        If True the return value of the function
+        is a list of the scaling factors that should be applied.
+        If False (default) the function returns the scaled curves.
+
+    Returns
+    ---------
+    :
+        A list of scaled reflectivity curves or a list of scaling factors.
+    '''
+    if len({c.data.unit for c in curves}) != 1:
+        raise ValueError('The reflectivity curves must have the same unit')
+    if len({c.coords['Q'].unit for c in curves}) != 1:
+        raise ValueError('The Q-coordinates must have the same unit for each curve')
+
+    qgrid = _create_qgrid_where_overlapping([c.coords['Q'] for c in curves])
+
+    r = _interpolate_on_qgrid(map(sc.values, curves), qgrid).values
+    v = _interpolate_on_qgrid(map(sc.variances, curves), qgrid).values
+
+    def cost(scaling_factors):
+        scaling_factors = np.concatenate([[1.0], scaling_factors])[:, None]
+        r_scaled = scaling_factors * r
+        v_scaled = scaling_factors**2 * v
+        v_scaled[v_scaled == 0] = np.nan
+        inv_v_scaled = 1 / v_scaled
+        r_avg = np.nansum(r_scaled * inv_v_scaled, axis=0) / np.nansum(
+            inv_v_scaled, axis=0
+        )
+        return np.nansum((r_scaled - r_avg) ** 2 * inv_v_scaled)
+
+    sol = opt.minimize(cost, [1.0] * (len(curves) - 1))
+    scaling_factors = (1.0, *sol.x)
+    if return_scaling_factors:
+        return [sc.scalar(x) for x in scaling_factors]
+    return [
+        scaling_factor * curve
+        for scaling_factor, curve in zip(scaling_factors, curves, strict=True)
+    ]
+
+
+def combine_curves(
+    curves: Sequence[sc.DataArray],
+    qgrid: sc.Variable | None = None,
+) -> sc.DataArray:
+    '''Combines the given curves by interpolating them
+    on a grid and merging them by the requested method.
+    The default method is a weighted mean where the weights
+    are proportional to the variances.
+
+    Unless the curves are already scaled correctly they might
+    need to be scaled using :func:`scale_reflectivity_curves_to_overlap`.
+
+    All curves must be have the same unit for data and the Q-coordinate.
+
+    Parameters
+    ----------
+    curves:
+        the reflectivity curves that should be combined
+    qgrid:
+        the Q-grid of the resulting combined reflectivity curve
+
+    Returns
+    ---------
+    :
+        A data array representing the combined reflectivity curve
+    '''
+    if len({c.data.unit for c in curves}) != 1:
+        raise ValueError('The reflectivity curves must have the same unit')
+    if len({c.coords['Q'].unit for c in curves}) != 1:
+        raise ValueError('The Q-coordinates must have the same unit for each curve')
+
+    r = _interpolate_on_qgrid(map(sc.values, curves), qgrid).values
+    v = _interpolate_on_qgrid(map(sc.variances, curves), qgrid).values
+
+    v[v == 0] = np.nan
+    inv_v = 1.0 / v
+    r_avg = np.nansum(r * inv_v, axis=0) / np.nansum(inv_v, axis=0)
+    v_avg = 1 / np.nansum(inv_v, axis=0)
+    return sc.DataArray(
+        data=sc.array(
+            dims='Q',
+            values=r_avg,
+            variances=v_avg,
+            unit=next(iter(curves)).data.unit,
+        ),
+        coords={'Q': qgrid},
+    )
diff --git a/tests/tools_test.py b/tests/tools_test.py
@@ -0,0 +1,127 @@
+# SPDX-License-Identifier: BSD-3-Clause
+# Copyright (c) 2023 Scipp contributors (https://github.com/scipp)
+import scipp as sc
+from ess.reflectometry.tools import combine_curves, scale_reflectivity_curves_to_overlap
+from scipp.testing import assert_allclose
+
+
+def curve(d, qmin, qmax):
+    return sc.DataArray(data=d, coords={'Q': sc.linspace('Q', qmin, qmax, len(d) + 1)})
+
+
+def test_reflectivity_curve_scaling():
+    data = sc.concat(
+        (
+            sc.ones(dims=['Q'], shape=[10], with_variances=True),
+            0.5 * sc.ones(dims=['Q'], shape=[15], with_variances=True),
+        ),
+        dim='Q',
+    )
+    data.variances[:] = 0.1
+
+    curves = scale_reflectivity_curves_to_overlap(
+        (curve(data, 0, 0.3), curve(0.8 * data, 0.2, 0.7), curve(0.1 * data, 0.6, 1.0)),
+    )
+
+    assert_allclose(curves[0].data, data, rtol=sc.scalar(1e-5))
+    assert_allclose(curves[1].data, 0.5 * data, rtol=sc.scalar(1e-5))
+    assert_allclose(curves[2].data, 0.25 * data, rtol=sc.scalar(1e-5))
+
+
+def test_reflectivity_curve_scaling_return_factors():
+    data = sc.concat(
+        (
+            sc.ones(dims=['Q'], shape=[10], with_variances=True),
+            0.5 * sc.ones(dims=['Q'], shape=[15], with_variances=True),
+        ),
+        dim='Q',
+    )
+    data.variances[:] = 0.1
+
+    factors = scale_reflectivity_curves_to_overlap(
+        (curve(data, 0, 0.3), curve(0.8 * data, 0.2, 0.7), curve(0.1 * data, 0.6, 1.0)),
+        return_scaling_factors=True,
+    )
+
+    assert_allclose(factors[0], sc.scalar(1.0), rtol=sc.scalar(1e-5))
+    assert_allclose(factors[1], sc.scalar(0.5 / 0.8), rtol=sc.scalar(1e-5))
+    assert_allclose(factors[2], sc.scalar(0.25 / 0.1), rtol=sc.scalar(1e-5))
+
+
+def test_combined_curves():
+    qgrid = sc.linspace('Q', 0, 1, 26)
+    data = sc.concat(
+        (
+            sc.ones(dims=['Q'], shape=[10], with_variances=True),
+            0.5 * sc.ones(dims=['Q'], shape=[15], with_variances=True),
+        ),
+        dim='Q',
+    )
+    data.variances[:] = 0.1
+    curves = (
+        curve(data, 0, 0.3),
+        curve(0.5 * data, 0.2, 0.7),
+        curve(0.25 * data, 0.6, 1.0),
+    )
+
+    combined = combine_curves(curves, qgrid)
+    assert_allclose(
+        combined.data,
+        sc.array(
+            dims='Q',
+            values=[
+                1.0,
+                1,
+                1,
+                0.5,
+                0.5,
+                0.5,
+                0.5,
+                0.5,
+                0.5,
+                0.5,
+                0.25,
+                0.25,
+                0.25,
+                0.25,
+                0.25,
+                0.25,
+                0.25,
+                0.25,
+                0.25,
+                0.125,
+                0.125,
+                0.125,
+                0.125,
+                0.125,
+                0.125,
+            ],
+            variances=[
+                0.1,
+                0.1,
+                0.1,
+                0.1,
+                0.1,
+                0.02,
+                0.02,
+                0.025,
+                0.025,
+                0.025,
+                0.025,
+                0.025,
+                0.025,
+                0.025,
+                0.025,
+                0.005,
+                0.005,
+                0.00625,
+                0.00625,
+                0.00625,
+                0.00625,
+                0.00625,
+                0.00625,
+                0.00625,
+                0.00625,
+            ],
+        ),
+    )

-Original file line number
+Diff line change
    orso
    supermirror
    types
 +   tools
 ```
 ## Amor