wavestoweather
diff --git a/‎.gitlab-ci.yml‎
Lines changed: 38 additions & 6 deletions b/‎.gitlab-ci.yml‎
Lines changed: 38 additions & 6 deletions
diff --git a/‎CMakeLists.txt‎
Lines changed: 4 additions & 1 deletion b/‎CMakeLists.txt‎
Lines changed: 4 additions & 1 deletion
diff --git a/‎README.md‎
Lines changed: 4 additions & 4 deletions b/‎README.md‎
Lines changed: 4 additions & 4 deletions
diff --git a/‎configs/Readme.md‎
Lines changed: 124 additions & 0 deletions b/‎configs/Readme.md‎
Lines changed: 124 additions & 0 deletions
diff --git a/‎configs/james_sens_config.json‎
Lines changed: 1 addition & 12 deletions b/‎configs/james_sens_config.json‎
Lines changed: 1 addition & 12 deletions
@@ -1,9 +1,9 @@
-image: "mahieronymus/ad_sensitivity:2.12"
+image: "mahieronymus/ad_sensitivity:3.0"
 
 stages:
   - Static Analysis CPP
   - build
-
+  - test
 
 lint:
   stage: Static Analysis CPP
@@ -21,20 +21,52 @@ build:
   script:
     - mkdir build
     - cd build && 
-      cmake .. -DCMAKE_BUILD_TYPE=release -DTARGET=simulation -DTRUSTED_DATA:BOOL=ON -DB_EIGHT:BOOL=ON -DCCN_AKM:BOOL=ON && 
+      cmake .. -DCMAKE_BUILD_TYPE=release -DTARGET=simulation -DTRUSTED_DATA:BOOL=ON -DIN_SAT_ADJ:BOOL=ON  -DB_EIGHT:BOOL=ON -DCCN_AKM:BOOL=ON && 
       make -j4
     - cd .. && mkdir build_interface
     - cd build_interface && 
-      cmake .. -DCMAKE_BUILD_TYPE=release -DTARGET=python_interface  -DTRUSTED_DATA:BOOL=ON -DB_EIGHT:BOOL=ON -DCCN_AKM:BOOL=ON && 
+      cmake .. -DCMAKE_BUILD_TYPE=release -DTARGET=python_interface  -DTRUSTED_DATA:BOOL=ON -DIN_SAT_ADJ:BOOL=ON  -DB_EIGHT:BOOL=ON -DCCN_AKM:BOOL=ON && 
       make -j4
     - cd .. && mkdir build_regrid
     - cd build_regrid &&
-      cmake .. -DCMAKE_BUILD_TYPE=release -DTARGET=regrid -DCOMPRESSION_LEVEL=6 -DTRUSTED_DATA:BOOL=ON -DB_EIGHT:BOOL=ON -DCCN_AKM:BOOL=ON &&
+      cmake .. -DCMAKE_BUILD_TYPE=release -DTARGET=regrid -DCOMPRESSION_LEVEL=6 -DTRUSTED_DATA:BOOL=ON -DIN_SAT_ADJ:BOOL=ON  -DB_EIGHT:BOOL=ON -DCCN_AKM:BOOL=ON &&
       make -j4
     - cd .. && mkdir build_loom
     - cd build_loom &&
-      cmake .. -DCMAKE_BUILD_TYPE=release -DTARGET=loom -DCOMPRESS_OUTPUT:BOOL=ON -DCOMPRESSION_LEVEL=6 -DTRUSTED_DATA:BOOL=ON -DB_EIGHT:BOOL=ON -DCCN_AKM:BOOL=ON &&
+      cmake .. -DCMAKE_BUILD_TYPE=release -DTARGET=loom -DCOMPRESS_OUTPUT:BOOL=ON -DCOMPRESSION_LEVEL=6 -DTRUSTED_DATA:BOOL=ON -DIN_SAT_ADJ:BOOL=ON -DB_EIGHT:BOOL=ON -DCCN_AKM:BOOL=ON &&
       make -j4
   tags:
     - make
   allow_failure: false
+
+# End-to-end test job: runs a short 4-rank simulation on the artificial test
+# trajectory and validates the produced NetCDF output with test_output.py
+# from the docker image.
+test:
+  stage: test
+  dependencies:
+    - build
+  script:
+    - source /app/venv/bin/activate
+    # Remember the checkout directory; it is used below instead of a
+    # hard-coded /builds/<namespace>/<project> path so the job also works
+    # on forks and on runners with a different builds directory.
+    - export AD_SENS_HOME=`pwd`
+    - ls
+    - pwd
+    - mkdir -p data/test_files_simulated
+    - mpirun -n 4 build/bin/./trajectories
+      -w 20000
+      -a 3
+      -t 0
+      -f 234600
+      -d 30
+      -i 1
+      -b 1
+      -o data/test_files_simulated/artificial_test.nc
+      -e 1
+      -p 500
+      -g 0
+      -l data/artificial_test.nc
+      -s configs/qv_qr_lat_config.json
+      -u 180
+    - cd /app/ad_sensitivity_analysis/tests/end_to_end && python test_output.py --input "${AD_SENS_HOME}/data/test_files_simulated/" --test_nan_dims
+      --test_physics "${AD_SENS_HOME}/build_interface/lib/libpython_interface.so" --test_phases --test_nan_vars --calc_phases --test_sensitivities --test_amounts --test_saturation
+      --verbosity 4 --table_path "${AD_SENS_HOME}/dmin_wetgrowth_lookup.dat"
+  tags:
+    - test
+  allow_failure: false
@@ -241,7 +241,10 @@ if (LINE_INFO)
     set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -g")
     message("${BoldYellow}~~~ Compiling with -g.${ColourReset}")
 endif()
-
+# Optional: pass -DIN_SAT_ADJ to the compiler when the IN_SAT_ADJ option is set.
+if (IN_SAT_ADJ)
+    set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -DIN_SAT_ADJ")
+    # Reset the colour at the end, as the other status messages do, so it does not bleed into later output.
+    message("${BoldYellow}~~~ Saturation adjustment is done at the start of each RK4 step and in the end of RK4${ColourReset}")
+endif()
 message(STATUS "Searching for necessary libraries")
 
 include_directories(${AD_SIM_HOME})
 
@@ -17,15 +17,15 @@ the time step at which perturbing a parameter is necessary with a random forest
 of about 75% for each model parameter and hydrometeor. \
 In [another paper](https://doi.org/10.5194/gmd-16-4617-2023) we use [Met.3D](https://met3d.wavestoweather.de/met-3d.html)
 to analyze the output further.
-This version is used in a third paper where we analyze a WCB case with more than 16,000 trajectories associated
+This version is also used in a [third paper](https://doi.org/10.1016/j.jocs.2025.102614) where we analyze a WCB case with more than 16,000 trajectories associated
 with an extratropical cyclone from 18 UTC 03 October 2016 and the following 66 hours.
 
 This repository consists of an implementation of a two-moment scheme (similar to [ICON](https://www.dwd.de/EN/research/weatherforecasting/num_modelling/01_num_weather_prediction_modells/icon_description.html)) 
 with [AD using CoDiPack](https://github.com/scicompkl/codipack) where environment and initial variables are read from [NetCDF](https://www.unidata.ucar.edu/software/netcdf/) files. 
 Python scripts are used for post-processing and data analysis. For the C++ code we follow the
 [doxygen standard](http://www.doxygen.nl/manual/docblocks.html). \
 We recommend using the docker image 
-[mahieronymus/ad_sensitivity:2.12](https://hub.docker.com/repository/docker/mahieronymus/ad_sensitivity/general) 
+[mahieronymus/ad_sensitivity:3.0](https://hub.docker.com/repository/docker/mahieronymus/ad_sensitivity/general) 
 which provides the Python scripts for analyzing and plotting the data and all necessary prerequisites. 
 Alternatively, you may use an [anaconda](https://www.anaconda.com/) environment with `pyproject.toml`. 
 
@@ -51,7 +51,7 @@ C++ Prerequisites
 - [NetCDF](https://www.unidata.ucar.edu/software/netcdf/) (v4.9.2)
 - [HDF5](https://www.hdfgroup.org/solutions/hdf5/) (v1.12 or above; tested with v1.14.2)
 - [Boost](https://www.boost.org/) (1.74.0 or above; tested with v1.81.0)
-- [CoDiPack](https://www.scicomp.uni-kl.de/software/codi/) (v2.0 or above: tested with v2.2.0)
+- [CoDiPack](https://www.scicomp.uni-kl.de/software/codi/) (v2.0 or above; tested with v3.0.0)
 - [CMake](https://cmake.org/) (v3.7.2 or above; tested with v3.26.4)
 - [nlohmann/json](https://github.com/nlohmann/json) (v3.9.1 or above; tested with v3.11.2)
 - [(optional) PnetCDF](https://parallel-netcdf.github.io/) (v1.12.2; only if you want to use classic NetCDF-files)
@@ -125,7 +125,7 @@ Default: off
 
 Analyzing the output
 --------------------
-We recommend [our docker image]((https://hub.docker.com/repository/docker/mahieronymus/ad_sensitivity/general)) (v2.12).
+We recommend [our docker image](https://hub.docker.com/repository/docker/mahieronymus/ad_sensitivity/general) (v3.0).
 This docker image provides multiple scripts to analyze the data with Jupyter notebooks.
 The data of the sensitivity simulation is stored under `data/simulation/*.nc`.
 Within `ad_sensitivity_analysis/interactive/`, there are different functions that can be called with the 
 
@@ -0,0 +1,124 @@
+# Configuration files
+There are two types of configuration files:
+- Configure gradient output
+- Configure ensemble simulations
+
+All configuration files use the [JSON format](https://ecma-international.org/publications-and-standards/standards/ecma-404/). This makes the configurations human-readable and easy to generate and read thanks to the extensive support in many languages. This code uses [JSON for Modern C++](https://github.com/nlohmann/json) to load the data.
+
+## Configure gradient output
+This configuration is needed whenever a sensitivity analysis is done. It defines which targets, i.e., model state variables, are differentiated using `model_state_variable` and a list of ids of the desired targets. The ids are defined in `include/microphysics/constants.h` and are as follows:
+Target | Index
+---|----
+Pressure | 0
+Temperature | 1
+Vertical ascent velocity | 2
+Saturation | 3
+Cloud droplet mixing ratio | 4
+Rain droplet mixing ratio | 5
+Water vapor mixing ratio | 6
+Number of cloud droplets | 7
+Number of rain droplets | 8
+Ice mixing ratio | 9
+Number of ice crystals | 10
+Snow mixing ratio | 11
+Number of snow particles | 12
+Graupel mixing ratio | 13
+Number of graupel particles | 14
+Hail mixing ratio | 15
+Number of hail particles | 16
+Ice mixing ratio precipitation | 17
+Snow mixing ratio precipitation | 18
+Rain mixing ratio precipitation | 19
+Graupel mixing ratio precipitation | 20
+Hail mixing ratio precipitation | 21
+Latent heating | 22
+Latent cooling | 23
+Ice particles precipitation | 24
+Snow particles precipitation | 25
+Rain droplets precipitation | 26
+Graupel particles precipitation | 27
+Hail particles precipitation | 28
+
+The model parameters for which sensitivities are computed are defined by a list `out_params` by name such as `db_ccn_1` or `dcloud_a_geo`. Note the 'd' which usually indicates a derivative. An overview of all model parameters is available in variable `output_grad_idx` in `include/microphysics/constants.h`. You may define your own model parameters here if you add different physics. An example can be seen with `CCN_AKM` which is a preprocessor instruction for the C++-code that defines a different CCN activation.
+A full example that calculates the sensitivities of water vapor mixing ratio, latent heating and cooling to several parameters is:
+```
+{
+  "model_state_variable": [
+    6, 22, 23
+  ],
+  "out_params": [
+    "db_ccn_1",
+    "db_ccn_2",
+    "dc_ccn_1",
+    "dc_ccn_2"
+  ]
+}
+```
+
+## Configure ensemble simulations
+The ensemble simulations are organized in segments where each segment defines when the perturbed member is started, how many members there are, which parameters are perturbed and how the perturbation is calculated. While it is technically possible to define multiple segments with different perturbations each, it is easier to create multiple configuration files and run each independently when executing it on a cluster.
+The conditions for the ensembles are asserted and executed in the function `parameter_check()` in `src/microphysics/trajectories.cpp`.
+
+### When to perturb
+The parameter `when_method` defines when to perturb the ensemble member. Possible options are
+- `full_perturbation`: Run the perturbation from the beginning.
+- `repeated_time`: Start the ensemble every `when_value` seconds.
+- `impact_change`: Start an ensemble simulation when the parameter with the highest derivative changes.
+- `sign_flip`: Start an ensemble when the gradient of a predefined target to a predefined parameter changes. See below for setting the parameter and target.
+- `value`: Start an ensemble if the gradient of a predefined target to a predefined parameter reaches a given value defined in `when_value` (within some tolerance).
+
+Further variables are:
+- `duration`: If `when_method` is not `full_perturbation`, you can limit the length of the ensemble simulation with this variable (in seconds).
+- `amount`: Define the number of ensemble members (including the unperturbed simulation).
+- `params`: A list that defines which parameters are perturbed and how.
+
+Each entry of `params` must define the parameter to be perturbed, how it is perturbed, and by how much:
+- `name`: Name of the parameter to be perturbed such as `a_ccn_1` or `a_geo`.
+- `type`: Type of the parameter such as `model` if it is purely a model parameter such as `a_ccn_1` or the hydrometeor type of the parameter such as `cloud` for `a_geo`.
+- `rand_func`: The random number generator or function to be used. Possible options are:
+    - `fixed`: Perturb by a fixed amount where the parameter is increased by the fixed amount for every second member and reduced otherwise.
+    - `uniform`: Draw a random number from a uniform distribution.
+    - `normal`: Draw from a normal distribution.
+- `sigma`: (We use $p$ for the parameter value in the following)
+    - If `rand_func` is `uniform`: The uniform distribution is bounded by the interval $[p - \sigma, p + \sigma]$.
+    - If `rand_func` is `normal`: The normal distribution is defined by $\mathcal{N}(p, \sigma)$ where $\sigma$ is the standard deviation.
+    - If `rand_func` is `fixed`: The parameter is set to $p - \sigma$ and $p + \sigma$ alternately for each ensemble member.
+- `sigma_perc`: Same as `sigma` but the perturbation is done by a percentage of the parameter value, e.g., for `rand_func` set to `fixed`, the parameter is set to $p - \sigma_{perc} \cdot p$ and $p + \sigma_{perc} \cdot p$ alternately.
+
+An example where `dcloud_a_geo` (name `a_geo`, type `cloud`) is perturbed by 10%. The ensemble runs from start to end, with one member using an increased value and another using a decreased value:
+```
+{
+    "segments": [
+        {
+            "when_method": "full_perturbation",
+            "amount": 3,
+            "params": [
+                {
+                    "name": "a_geo",
+                    "sigma_perc": 10,
+                    "type": "cloud",
+                    "rand_func": "fixed"
+                }
+            ]
+        }
+    ]
+}
+```
+Another example where an ensemble is started every 30 minutes and runs for 30 minutes. There are 64 members with perturbed parameters drawn from a uniform distribution (`amount` is 65 because it includes the unperturbed simulation):
+```
+{
+    "segments": [
+        {
+            "when_method": "repeated_time",
+            "duration": 1800,
+            "when_value": 1800,
+            "amount": 65,
+            "params": [
+                {
+                    "name": "a_geo",
+                    "sigma_perc": 10,
+                    "type": "cloud",
+                    "rand_func": "uniform"
+                }
+            ]
+        }
+    ]
+}
+```
@@ -1,10 +1,6 @@
 {
     "model_state_variable": [
-        4, 5, 6, 7, 8, 9,
-        10, 11, 12, 13, 14,
-        15, 16, 17, 18, 19,
-        20, 21, 24, 25, 26,
-        27, 28
+        6, 22, 23
     ],
     "out_params": [
         "dD_conv_ig",
@@ -15,7 +11,6 @@
         "dsnow_a_vel",
         "dgraupel_min_x_sedimentation",
         "dice_b_geo",
-        "dinv_z",
         "dice_s_vel",
         "dgraupel_a_vel",
         "dsnow_b_vel",
@@ -125,7 +120,6 @@
         "dhail_max_x",
         "dice_min_x_evap",
         "dd_ccn_2",
-        "dconst4",
         "dk_1_conv",
         "drain_rho_v",
         "dice_d_crit_c",
@@ -135,8 +129,6 @@
         "dice_min_x_depo",
         "drain_a_vel",
         "dna_orga",
-        "dconst5",
-        "dconst0",
         "dsnow_min_x_depo",
         "dgraupel_min_x_riming",
         "dcloud_max_x",
@@ -163,9 +155,7 @@
         "dhail_a_ven",
         "dcloud_min_x_freezing",
         "dr_0",
-        "dN_avo",
         "dsnow_max_x",
-        "dconst3",
         "dsnow_vsedi_max",
         "dice_rho_v",
         "dgraupel_b_vel",
@@ -191,5 +181,4 @@
         "drain_alpha",
         "dice_max_x"
     ]
-
 }