CliMA
diff --git a/‎.buildkite/Manifest-v1.11.toml
Lines changed: 221 additions & 49 deletions b/‎.buildkite/Manifest-v1.11.toml
Lines changed: 221 additions & 49 deletions
diff --git a/‎.buildkite/Project.toml
Lines changed: 7 additions & 1 deletion b/‎.buildkite/Project.toml
Lines changed: 7 additions & 1 deletion
diff --git a/‎Artifacts.toml
Lines changed: 1 addition & 1 deletion b/‎Artifacts.toml
Lines changed: 1 addition & 1 deletion
diff --git a/‎experiments/calibration/PBS_calibration.pbs
Lines changed: 20 additions & 0 deletions b/‎experiments/calibration/PBS_calibration.pbs
Lines changed: 20 additions & 0 deletions
diff --git a/‎experiments/calibration/calibrate_land.jl
Lines changed: 113 additions & 0 deletions b/‎experiments/calibration/calibrate_land.jl
Lines changed: 113 additions & 0 deletions
@@ -6,6 +6,7 @@ CSV = "336ed68f-0bac-5ca0-87d4-7b16caf5d00b"
 CUDA = "052768ef-5323-5732-b1bb-66c8b64840ba"
 CairoMakie = "13f3f980-e62b-5c42-98c6-ff1f3baf88f0"
 ClimaAnalysis = "29b5916a-a76c-4e73-9657-3c8fd22e65e6"
+ClimaCalibrate = "4347a170-ebd6-470c-89d3-5c705c0cacc2"
 ClimaComms = "3a4d1b5c-c61d-41fd-a00a-5873ba7a1b0d"
 ClimaCore = "d414da3d-4745-48bb-8d80-42e94e092884"
 ClimaCoreMakie = "908f55d8-4145-4867-9c14-5dad1a479e4d"
@@ -17,6 +18,7 @@ ClimaUtilities = "b3f4f4ca-9299-4f7f-bd9b-81e1242a7513"
 DataFrames = "a93c6f00-e57d-5684-b7b6-d8193f3e46c0"
 Dates = "ade2ca70-3891-5945-98fb-dc099432e06a"
 DelimitedFiles = "8bb1440f-4735-579b-a4ab-409b98df4dab"
+EnsembleKalmanProcesses = "aa8a2aa5-91d8-4396-bcef-d4f2ec43552d"
 Flux = "587475ba-b771-5e3f-ad9e-33799f191a9c"
 Format = "1fa38f19-a742-5d3f-a2b9-30dd87b9d5f8"
 GeoMakie = "db073c08-6b98-4ee5-b6a4-5efafb3259c6"
@@ -38,11 +40,15 @@ StaticArrays = "90137ffa-7385-5640-81b9-e52037218182"
 Statistics = "10745b16-79ce-11e8-11f9-7d13ad32a3b2"
 StatsBase = "2913bbd2-ae8a-5f71-8c99-4fb6c76f3a91"
 SurfaceFluxes = "49b00bb7-8bd4-4f2b-b78c-51cd0450215f"
+TOML = "fa267f1f-6049-4f14-aa54-33bafae1ed76"
 Test = "8dfed614-e22c-5e08-85e1-65c5234f0b40"
 Thermodynamics = "b60c26fb-14c3-4610-9d3e-2d17fe7ff00c"
 
 [compat]
-ClimaAnalysis = "0.5.16"
+ClimaAnalysis = "0.5.17"
 ClimaTimeSteppers = "0.7, 0.8"
+ClimaDiagnostics = "0.2.13"
+ClimaCalibrate = "0.0.15"
+EnsembleKalmanProcesses = "2.4.1"
 Flux = "0.15"
 Statistics = "1"
@@ -18,7 +18,7 @@ git-tree-sha1 = "cbbc6b3752d9cb9b667ec33cfbeb46819f8db418"
     [[landsea_mask_1deg.download]]
     sha256 = "3722b553c2fdf28a6574aea2e0b167d16ab050f34e5969ada45625b3a3ecb6da"
     url = "https://caltech.box.com/shared/static/b3u4dv0dsoswvqgp8y63bzj7awbhwztd.gz"
-    
+
 [soil_ic_2008_50m]
 git-tree-sha1 = "fd9cda235e203b4235136b6dcdcd07af788c00f6"
 
 
@@ -0,0 +1,20 @@
+#!/bin/bash
+#PBS -N derecho_calibration
+#PBS -o output.txt
+#PBS -e error.txt
+#PBS -l walltime=12:00:00
+#PBS -l select=1:ncpus=4:ngpus=1
+
+## Account number for CliMA
+#PBS -A UCIT0011
+#PBS -q main
+
+export PBS_ACCOUNT="UCIT0011"
+export MODULEPATH="/glade/campaign/univ/ucit0011/ClimaModules-Derecho:$MODULEPATH"
+module load climacommon
+
+export CLIMACOMMS_DEVICE="CUDA"
+export CLIMACOMMS_CONTEXT="SINGLETON"
+julia --project=.buildkite -e 'using Pkg; Pkg.instantiate(;verbose=true)'
+
+julia --project=.buildkite/ experiments/calibration/calibrate_land.jl
@@ -0,0 +1,113 @@
+######## CONFIGS ########
+# Most of the time, users will only need to modify the settings below.
+# Our goal is to make it flexible and easy to run different calibration setups,
+# and to iterate quickly (e.g., low resolution, specific regions, few parameters, short simulation time).
+#########################
+
+ENV["JULIA_WORKER_TIMEOUT"] = "1000.0" # Seconds a worker waits for the main process to connect (Distributed's JULIA_WORKER_TIMEOUT; Julia's default is 60). Raised here, presumably to allow for PBS queue time.
+
+using Dates
+using Distributed
+import EnsembleKalmanProcesses as EKP
+import Random
+using ClimaLand
+import ClimaCalibrate: forward_model, parameter_path, path_to_ensemble_member
+import ClimaCalibrate as CAL
+rng_seed = 2 # fixed seed for the random number generator below
+rng = Random.MersenneTwister(rng_seed) # passed to EKP.EnsembleKalmanProcess when the UTKI object is built
+FT = Float64 # NOTE(review): not referenced elsewhere in this file - presumably read by the included scripts; confirm
+
+# Calibrate the land model with:
+const variable_list = ["swu"] # variables you want to capture by adjusting your parameters (starting from the priors)
+const n_iterations = 10 # one iteration takes ~1.5 hours with current settings (resolution, 2-year simulation). NOTE(review): 10 x ~1.5 h exceeds the 12 h walltime requested in PBS_calibration.pbs - confirm
+const spinup_period = Year(1) # start_date + spinup_period is the start of the calibration period (checked to fall in December)
+# Possible extension: add a time_for_calibration setting (currently 1 year).
+
+# Using the following priors (priors.jl presumably defines `prior`, which is used below):
+include(joinpath(@__DIR__, "priors.jl"))
+# Possible extension: pair losses with parameters via update groups, see https://clima.github.io/EnsembleKalmanProcesses.jl/dev/update_groups/
+
+# With the forward model on GPUs. Note: the forward model needs to be adjusted to read priors!
+ekp_process = EKP.Unscented(prior) # in this file, used only to read off the ensemble size
+ensemble_size = ekp_process.N_ens # number of ensemble members; also the count handed to PBSManager below
+# Config for workers (queue and account match the #PBS directives in PBS_calibration.pbs)
+addprocs(
+    CAL.PBSManager(ensemble_size), # simulations in parallel. User may change this to use fewer GPUs.
+    q = "main",
+    A = "UCIT0011",
+    l_select = "1:ngpus=1:ncpus=4", # one GPU and four CPUs; presumably requested per worker - confirm
+    l_walltime = "11:30:00", # shorter than the 12:00:00 walltime of the driver job
+    l_job_priority = "premium",
+)
+# ClimaLand (forward model) - needs to read priors! This block is evaluated on the main process and on every worker.
+@everywhere begin
+    using Dates # needs to be called again for workers
+    const nelements = (50, 10) # resolution - (horizontal elements (lon,lat), vertical elements (soil discretization))
+    const start_date = DateTime(2008, 12, 01) # this is the start of the forward model spinup
+    const caldir = "calibration_output_utki" # directory passed to path_to_ensemble_member and CAL.calibrate
+    using ClimaLand
+    dir = pkgdir(ClimaLand)
+    include(joinpath(dir, "experiments/calibration/forward_model.jl"))
+end
+# Configuration check written as an explicit throw: `@assert` may be disabled at some optimization levels, so it must not guard user settings.
+month(start_date + spinup_period) == 12 || throw(ArgumentError("The start of your calibration period should be December."))
+
+# Train on the following locations (currently all coordinates on land):
+include(joinpath(@__DIR__, "make_training_locations.jl"))
+training_locations = make_training_locations(nelements) # nelements is the resolution tuple set in the @everywhere block
+# Possible extension: regional runs, specific lon/lat bands, or filters (e.g., regions with snow).
+
+# NOTE1: Don't forget to modify your forward model (land or bucket) to read and use your priors correctly.
+# NOTE2: The noise is set in observationseries_era5.jl - adjust if needed.
+# ^ current noise options: ERA5 inter-annual variance, ERA5 seasonal mean * factor, flat noise, weighting by latitude.
+# NOTE3: Currently everything is set to use seasonal averages. We could add an option to use, e.g., monthly or other averages.
+# NOTE4: We could add an option to calibrate single sites (change forward model, observationseries, observation_map).
+# ^ maybe Julia and Thanhthanh SURF?
+
+
+
+##########################
+# Most of the time you won't need to change the code below.
+# Unless you change EKP configurations, or other specific settings.
+##########################
+
+
+# observationseries - ERA5 data and noise object to compare to model output in EKP (to minimize the loss)
+include(joinpath(@__DIR__, "observationseries_era5.jl"))
+
+# l_obs is the length of the Observation objects (observationseries for ERA5, observation_map for ClimaLand)
+n_locations = length(training_locations)
+n_variables = length(variable_list)
+n_time_points = 4 # 4 seasons (and not, for example, 12 months)
+l_obs = n_time_points * n_variables * n_locations # one entry per (season, variable, location) combination
+
+# Build the observation from ClimaLand outputs for one member (presumably defines process_member_data, used below)
+include(joinpath(@__DIR__, "observation_map.jl"))
+
+"""
+    CAL.observation_map(iteration)
+
+Build the observation from ClimaLand outputs for all ensemble members of `iteration`.
+
+For each member, the `global_diagnostics/output_active` directory inside that
+member's output path is opened as a `SimDir`, and the result of
+`process_member_data` is written into the member's column. Returns an
+`l_obs` by `ensemble_size` `Float64` array.
+"""
+function CAL.observation_map(iteration)
+    # One column per ensemble member, `l_obs` rows each.
+    G = Array{Float64}(undef, l_obs, ensemble_size)
+
+    for member in axes(G, 2)
+        diagnostics_dir = joinpath(
+            path_to_ensemble_member(caldir, iteration, member),
+            "global_diagnostics",
+            "output_active",
+        )
+        G[:, member] .= process_member_data(
+            SimDir(diagnostics_dir),
+            training_locations,
+            variable_list,
+        )
+    end
+
+    return G
+end
+
+# Build the UTKI object - this is where you set EKP configurations. NOTE(review): ensemble_size was read from EKP.Unscented(prior), not from the TransformUnscented process used here - confirm both give the same N_ens.
+utki = EKP.EnsembleKalmanProcess(
+    observationseries, # presumably defined by observationseries_era5.jl, included above
+    EKP.TransformUnscented(prior, impose_prior = true);
+    verbose = true,
+    rng, # the seeded MersenneTwister created at the top of this file
+    scheduler = EKP.DataMisfitController(terminate_at = 100),
+)
+
+# Run the calibration via ClimaCalibrate using the arguments built above (caldir is the same directory observation_map reads member output from)
+CAL.calibrate(CAL.WorkerBackend, utki, n_iterations, prior, caldir)