bcdev
diff --git a/‎README.md‎
Lines changed: 4 additions & 5 deletions b/‎README.md‎
Lines changed: 4 additions & 5 deletions
diff --git a/‎kaleidoscope/algorithms/randomize.py‎
Lines changed: 104 additions & 17 deletions b/‎kaleidoscope/algorithms/randomize.py‎
Lines changed: 104 additions & 17 deletions
diff --git a/‎kaleidoscope/config/config.reader.json‎
Lines changed: 13 additions & 1 deletion b/‎kaleidoscope/config/config.reader.json‎
Lines changed: 13 additions & 1 deletion
diff --git a/‎kaleidoscope/config/config.writer.json‎
Lines changed: 13 additions & 1 deletion b/‎kaleidoscope/config/config.writer.json‎
Lines changed: 13 additions & 1 deletion
diff --git a/‎kaleidoscope/config/config.yml‎
Lines changed: 6 additions & 3 deletions b/‎kaleidoscope/config/config.yml‎
Lines changed: 6 additions & 3 deletions
diff --git a/‎kaleidoscope/generators.py‎
Lines changed: 9 additions & 9 deletions b/‎kaleidoscope/generators.py‎
Lines changed: 9 additions & 9 deletions
@@ -21,17 +21,17 @@ processor. The processor is invoked from the command line. Typing
 will print a detailed usage message to the screen
 
     usage: kaleidoscope [-h] [--chunk-size-lat CHUNK_SIZE_LAT]
-                        [--chunk-size-lon CHUNK_SIZE_LON]
+                        [--chunk-size-lon CHUNK_SIZE_LON] [--selector SELECTOR]
                         [--engine-reader {h5netcdf,netcdf4,zarr}]
                         [--engine-writer {h5netcdf,netcdf4,zarr}]
                         [--log-level {debug,info,warning,error,off}]
                         [--mode {multithreading,synchronous}]
                         [--workers {1,2,3,4,5,6,7,8}] [--progress]
                         [--no-progress] [--stack-traces] [--no-stack-traces]
-                        [--test] [--no-test] [--tmpdir TMPDIR] [-v]
+                        [--tmpdir TMPDIR] [-v]
                         source_file target_file
 
-    This scientific processor simulates measurement errors.
+    This scientific processor simulates measurement errors.
 
     positional arguments:
       source_file           the file path of the source dataset.
@@ -51,6 +51,7 @@ will print a detailed usage message to the screen
                             value of `-1` refers to full longitudinal chunk size
                             and a value of `0` refers to the chunk size used in
                             the source file. (default: None)
+      --selector SELECTOR   the Monte Carlo stream selector. (default: None)
       --engine-reader {h5netcdf,netcdf4,zarr}
                             specify the engine used to read the source product
                             file. (default: None)
@@ -72,8 +73,6 @@ will print a detailed usage message to the screen
       --no-progress         disable progress bar display. (default: True)
       --stack-traces        enable Python stack traces. (default: False)
       --no-stack-traces     disable Python stack traces. (default: True)
-      --test                enable test mode. (default: False)
-      --no-test             disable test mode. (default: True)
       --tmpdir TMPDIR       specify the path to the temporary directory.
                             (default: None)
       -v, --version         show program's version number and exit
 
@@ -4,19 +4,91 @@
 """
 This module provides the algorithm to randomize data.
 """
+from typing import Any
+from typing import Literal
 
 import dask.array as da
 import numpy as np
+from numpy.random import SeedSequence
 from typing_extensions import override
 
-from ..interface.algorithm import BlockAlgorithm
+from ..generators import DefaultNormal
+from ..interface.algorithm import InformedBlockAlgorithm
+from ..interface.generating import Normal
 
 
-class Randomize(BlockAlgorithm):
+def _block_seed(
+    block_id: tuple[int, ...], root_seed: np.ndarray
+) -> np.ndarray:
+    """
+    Returns a random seed array for a given block.
+
+    :param block_id: The block index; must not contain negative values.
+    :param root_seed: The root seed words shared by all blocks.
+    :return: One block-specific seed word followed by the root seed words.
+    """
+    # The block index is passed to the seed sequence as is. Collapsing
+    # it into a single integer with a base-31 polynomial hash first
+    # makes distinct blocks collide, e.g. (0, 31) and (1, 0) both map
+    # to 992, which yields identical random numbers for both blocks.
+    work_seed = SeedSequence(list(block_id)).generate_state(1)
+    return np.concatenate((work_seed, root_seed))
+
+
+def _hash(block_id: tuple[int, ...]) -> int:
+    """Returns a positive hash value."""
+    # Polynomial accumulation with multiplier 31, starting from 1. The
+    # result is positive as long as no index is negative.
+    # NOTE(review): distinct indices can yield the same value, e.g.
+    # (0, 31) and (1, 0) both give 992.
+    h = 1
+    for i in block_id:
+        h = 31 * h + i
+    return h
+
+
+def _chlorophyll(
+    seed: np.ndarray, x: np.ndarray, u: np.ndarray
+) -> np.ndarray:
+    """
+    Returns randomized values for ESA CCI ocean colour chlorophyll.
+
+    Uses ESA CCI OC PUG (Equation 2.10).
+    """
+    # The second argument is x * sqrt(exp((ln(10) * u)^2) - 1). Passed
+    # to _lognormal as uncertainty, it makes the variance of the
+    # logarithm equal to (ln(10) * u)^2.
+    # NOTE(review): presumably u is the uncertainty of log10
+    # chlorophyll - confirm against the PUG.
+    return _lognormal(
+        seed, x, x * np.sqrt(np.exp(np.square(np.log(10.0) * u)) - 1.0)
+    )
+
+
+def _lognormal(seed: np.ndarray, x: np.ndarray, u: np.ndarray) -> np.ndarray:
+    """Returns randomized values for log-normally distributed errors."""
+    # v is the variance and m the mean of the logarithm, chosen such
+    # that the log-normal distribution has mean x and standard
+    # deviation u.
+    v = np.log(1.0 + np.square(u / x))
+    m = np.log(x) - 0.5 * v
+    # Randomize in log space, then transform back.
+    # NOTE(review): x <= 0 is outside the domain of the logarithm and
+    # yields non-finite values - confirm callers mask such data.
+    return np.exp(_normal(seed, m, np.sqrt(v)))
+
+
+def _normal(seed: np.ndarray, x: np.ndarray, u: np.ndarray) -> np.ndarray:
+    """Returns randomized values for normally distributed errors."""
+    # A new generator is created from the seed on every call.
+    z: Normal = DefaultNormal(seed)
+    # The scratch array only conveys shape and data type; its
+    # uninitialized content is overwritten with the random numbers.
+    # NOTE(review): presumably x must be of floating point type,
+    # because the data type is handed on to the generator - confirm.
+    return x + u * z.randoms(np.empty(x.shape, x.dtype))
+
+
+class Randomize(InformedBlockAlgorithm):
     """
     The algorithm to randomize data.
     """
 
+    _dist: Literal["normal", "lognormal", "chlorophyll"] | str
+    """The type of measurement error distribution."""
+
+    _root_seed: np.ndarray
+    """The root seed."""
+
+    def __init__(
+        self,
+        dtype: np.dtype,
+        m: int,
+        dist: Literal["normal", "lognormal", "chlorophyll"] | str = "normal",
+        entropy: int | list[int] | None = None,
+    ):
+        """
+        Creates a new algorithm instance.
+
+        :param dtype: The result data type.
+        :param m: The number of input array dimensions.
+        :param dist: The type of measurement error distribution.
+        :param entropy: The entropy to create the seed sequence.
+        """
+        # NOTE(review): m is passed twice; presumably the result has
+        # the same number of dimensions as the input - confirm.
+        super().__init__(dtype, m, m)
+        self._dist = dist
+        # The root seed consists of eight words generated from the
+        # entropy. NOTE(review): with entropy None the seed sequence
+        # presumably draws fresh entropy, so results would differ from
+        # run to run - confirm.
+        self._root_seed = SeedSequence(entropy).generate_state(8)
+
     @override
     def chunks(self, *inputs: da.Array) -> tuple[int, ...] | None:
         return None
@@ -31,31 +103,46 @@ def created_axes(self) -> list[int] | None:
     def dropped_axes(self) -> list[int]:
         return []
 
-    # noinspection PyMethodMayBeStatic
     def randomize(
-        self, data: np.ndarray, *, test: bool = False
+        self,
+        *data: np.ndarray,
+        coverage_factor: Any = 1.0,
+        relative: bool = False,
+        **kwargs,
     ) -> np.ndarray:
         """
         Randomizes data.
 
         :param data: The data.
-        :param test: Run in test mode.
-        :return: The randomized data.
+        :param coverage_factor: The uncertainty coverage factor.
+        :param relative: Uncertainty is given in relative terms.
+        :return: The measurement values randomized.
         """
-        return data if test else self.simulate(data, data)
+        # The block index must be supplied as `block_id` keyword
+        # argument; the seed is derived from it and the root seed.
+        seed = _block_seed(kwargs["block_id"], self._root_seed)
 
-    compute_block = randomize
+        # The first array is the value to randomize, the second is its
+        # uncertainty. With exactly two arrays the second is used as
+        # is, otherwise the third is subtracted from it in quadrature.
+        # NOTE(review): a single array raises an IndexError, and a
+        # third array exceeding the second yields NaN - confirm that
+        # callers exclude both cases.
+        x = data[0]
+        u = (
+            data[1]
+            if len(data) == 2
+            else np.sqrt(np.square(data[1]) - np.square(data[2]))
+        )
+        # NOTE(review): presumably converts an expanded uncertainty
+        # into a standard uncertainty - confirm.
+        if coverage_factor != 1.0:
+            u = u / coverage_factor
+        # A relative uncertainty is scaled by the value itself.
+        if relative:
+            u = u * x
 
-    # noinspection PyMethodMayBeStatic
-    def simulate(self, x: np.ndarray, u: np.ndarray):
-        """
-        Simulates measurement errors.
+        # NOTE(review): an unrecognized distribution type returns the
+        # data unchanged, without any warning - confirm this is wanted.
+        match self._dist:
+            case "normal":
+                y = _normal(seed, x, u)
+            case "lognormal":
+                y = _lognormal(seed, x, u)
+            case "chlorophyll":
+                y = _chlorophyll(seed, x, u)
+            case _:
+                y = x
+        return y
 
-        :param x: The measurement.
-        :param u: The measurement uncertainty.
-        :return: The simulated measurements.
-        """
-        return x
+    compute_block = randomize
 
     @property
     @override
 
@@ -8,7 +8,19 @@
     "config.reader.chunks": {
         "time": 1,
         "lat": 720,
-        "lon": 720
+        "lon": 720,
+
+        "esa-cci-oc": {
+            "time": 0,
+            "lat": 2160,
+            "lon": 2160
+        },
+
+        "_": {
+            "time": 0,
+            "lat": 0,
+            "lon": 0
+        }
     },
 
     "config.reader.engine": "h5netcdf",
 
@@ -8,7 +8,19 @@
     "config.writer.chunks": {
         "time": 0,
         "lat": 0,
-        "lon": 0
+        "lon": 0,
+
+        "esa-cci-oc": {
+            "time": 0,
+            "lat": 270,
+            "lon": 270
+        },
+
+        "_": {
+            "time": 0,
+            "lat": 0,
+            "lon": 0
+        }
     },
 
     "config.writer.engine": "h5netcdf",
 
@@ -7,6 +7,12 @@ chunk_size_lat:
 ## The chunk size is determined by the reader
 chunk_size_lon:
 
+## No default product type.
+product_type:
+
+## The default selector.
+selector: 0
+
 ## Detect the reader engine automatically
 engine_reader:
 
@@ -28,8 +34,5 @@ progress: False
 ## Disable stack traces.
 stack_traces: False
 
-## Disable test mode.
-test: False
-
 ## Use the working directory for temporary files.
 tmpdir: "."
@@ -58,7 +58,7 @@ def __init__(self, seed: int | np.ndarray | BitGenerator | None = None):
         self._g = default_generator(seed)
 
     @overrides
-    def next_int64(self) -> int:
+    def next(self) -> int:
         return self._g.integers(0x8000000000000000)
 
 
@@ -80,13 +80,13 @@ def get(self, i: int) -> Univariate:
         return self
 
     @overrides
-    def next_double(self) -> float:
+    def random(self) -> float:
         return self._g.random()
 
     @overrides
-    def next_doubles(self, doubles: np.ndarray) -> np.ndarray:
-        self._g.random(out=doubles)
-        return doubles
+    def randoms(self, randoms: np.ndarray) -> np.ndarray:
+        """
+        Fills an array with random numbers.
+
+        :param randoms: The array to fill; its data type is retained.
+        :return: The same array, filled with random numbers.
+        """
+        # Draw with the same generator method as `random` does for a
+        # single number. Calling `standard_normal` here would return
+        # normally distributed numbers from this generator.
+        self._g.random(dtype=randoms.dtype, out=randoms)
+        return randoms
 
 
 class DefaultNormal(Normal):
@@ -107,10 +107,10 @@ def get(self, i: int) -> Univariate:
         return self
 
     @overrides
-    def next_double(self) -> float:
+    def random(self) -> float:
         return self._g.standard_normal()
 
     @overrides
-    def next_doubles(self, doubles: np.ndarray) -> np.ndarray:
-        self._g.standard_normal(out=doubles)
-        return doubles
+    def randoms(self, randoms: np.ndarray) -> np.ndarray:
+        # Fills the given array with standard normal random numbers of
+        # the array's own data type and returns the same array.
+        self._g.standard_normal(dtype=randoms.dtype, out=randoms)
+        return randoms