glacier_pinn/make_LOGO_figures.py at main · viola1593/glacier_pinn · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
"""Make predicitons of the LOGO test glaciers with the respective model trained without the glacier and save the predictions in a csv file.
Also we plot the predictions and the residual to the measured ice thicknesses. """

import argparse
import numpy as np
import os
import pandas as pd
import pytorch_lightning as pl
from pytorch_lightning.trainer import Trainer

import matplotlib.pyplot as plt
import matplotlib.font_manager as fm
from matplotlib.ticker import FormatStrFormatter, MaxNLocator, FuncFormatter
from matplotlib import ticker
from mpl_toolkits.axes_grid1.inset_locator import inset_axes
from mpl_toolkits.axes_grid1.anchored_artists import AnchoredSizeBar

from dataset_new import PL_GlacierDataset
from model import PL_PINN
from utils import read_config

SUBLABEL= ['(a)', '(b)', '(c)', '(d)', '(e)', '(f)', '(g)']
FONTSIZE_TINY=12
FONTSIZE_SMALL=14
FONTSIZE_BIG=20
FONTSIZE_MEDIUM=16

GLACIER_IDS = {
        'RGI60-07.00240': {'num_plot': 1, 'xticks': [15.7], 'yticks': [77.0]},
        'RGI60-07.00344': {'num_plot': 2, 'xticks': [16.3,], 'yticks': [78.0]},
        'RGI60-07.00496': {'num_plot': 3, 'xticks': [10.5, 11.5], 'yticks': [78.5, 79.5]},
        "RGI60-07.00497": {'num_plot': 4, 'xticks': [10.5, 11.5], 'yticks': [78.5, 79.5]},
        'RGI60-07.01100': {'num_plot': 5, 'xticks': [10.5, 11.5], 'yticks': [78.5, 79.5]},
        'RGI60-07.01481': {'num_plot': 6, 'xticks': [10.5, 11.5], 'yticks': [78.5, 79.5]},
        'RGI60-07.01482': {'num_plot': 7, 'xticks': [10.5, 11.5], 'yticks': [78.5, 79.5]}
        }

def format_yticks(y, _):
    y_new_unit = y / 1000  # Change unit from meters to kilometers
    return f"{y_new_unit:.0f} km"  # 2 decimal places

def ax_formatter(ax, x_grid, y_grid):

    ax.xaxis.set_major_formatter(FormatStrFormatter('%.2f° E'))
    ax.yaxis.set_major_formatter(FuncFormatter(format_yticks))

    # -------------------------------------
    # tick params
    # set number of x and y ticks, defines where and how many grid lines there are
    ax.xaxis.set_major_locator(MaxNLocator(nbins=1))  # Set number of x-ticks
    ax.yaxis.set_major_locator(MaxNLocator(nbins=1))  # Set number of y-ticks


    # if we show the tick labels we want them inside the plot, x axis should be rotated to fit along the gridlines
    ax.tick_params(axis='x', which='both', direction='in', length=0, labelsize=FONTSIZE_SMALL, pad=-100)
    ax.tick_params(axis='y', which='both', direction='in', length=1, labelsize=FONTSIZE_TINY, pad=-70, colors='grey')

    # only show the y tick labels
    ax.tick_params(labelbottom=False, labeltop=False, labelleft=True, labelright=False)

    ax.yaxis.grid(True,linestyle=':', linewidth=0.5, color='grey')  # Add grid lines for the y-axis only

    # -------------------------------------
    #Add scalebar
    # Define the length of the scale bar and the label
    # y direction
    scalebar_length = 1000  # 1000 meters = 1 km
    scalebar_label = "1 km"
    # Define the vertical extent of the scale bar and make it have the same extent in every plot although the extents of the plots vary
    extent = np.max(y_grid)-np.min(y_grid)
    scalebar_vertical = extent/60
    # Create a font properties object
    fontprops = fm.FontProperties(size=FONTSIZE_MEDIUM)
    # Create the scale bar
    scalebar = AnchoredSizeBar(ax.transData, scalebar_length, scalebar_label, 'upper right', pad=0.2, label_top=True,
                               color='black', frameon=False, size_vertical=scalebar_vertical, fontproperties=fontprops,
                               )
    # Add the scale bar to the axes
    scalebar_artist = ax.add_artist(scalebar)
    return scalebar_artist


def plot_velocity_predictions(position_grid, velocities, save_dir, rgi):

    max_value_x = abs(np.mean(velocities[:,0]))+3*np.std(velocities[:,0])
    max_value_y = abs(np.mean(velocities[:,1])) +3*np.std(velocities[:,1])
    #print(max_value_x, max_value_y)
    f, (ax1,ax2) = plt.subplots(1,2, figsize=(12,7), sharey=True, layout='constrained')
    scatter1=ax1.scatter(position_grid.iloc[:,0], position_grid.iloc[:,1], c=velocities[:,0],  cmap='coolwarm',vmax=max_value_x, vmin=-max_value_x,marker='.', s=10)
    ax_formatter(ax1, position_grid.iloc[:,0], position_grid.iloc[:,1])
    ax1.set_title('Depth-averaged velocity $ \overline{v}_x$ ', fontsize=FONTSIZE_BIG)

    cbar1 = plt.colorbar(scatter1, ax=ax1,extend='both')
    cbar1.set_label('Velocity [m a$^{-1}$]', fontsize=FONTSIZE_SMALL, labelpad=0)
    cbar1.ax.tick_params(labelsize=FONTSIZE_SMALL)
    ax1.text(-0.1, 1.05, '(a)', fontsize=FONTSIZE_BIG, transform=ax1.transAxes)


    scatter2 = ax2.scatter(position_grid.iloc[:,0], position_grid.iloc[:,1], c=velocities[:,1], cmap='coolwarm', vmax=max_value_y, vmin=-max_value_y,marker='.', s=10)
    scalebar_artist=ax_formatter(ax2, position_grid.iloc[:,0], position_grid.iloc[:,1])
    scalebar_artist.remove()
    ax2.set_ylabel('')
    ax2.tick_params(labelbottom=False, labeltop=False, labelleft=False, labelright=False)

    ax2.set_title('Depth-averaged velocity $ \overline{v}_y$', fontsize=FONTSIZE_BIG)
    cbar2 = plt.colorbar(scatter2, ax=ax2,extend='both')
    cbar2.set_label('Velocity [m a$^{-1}$]', fontsize=FONTSIZE_SMALL, labelpad=0)
    cbar2.ax.tick_params(labelsize=FONTSIZE_SMALL)
    ax2.text(-0.1, 1.05, '(b)', fontsize=FONTSIZE_BIG, transform=ax2.transAxes)


    f.savefig(os.path.join(save_dir,'LOGOvelocity_prediction'+rgi+'.png'), dpi=300)


def plot_residuals(grid_coords, measurement_coords, grid_thickness, residuals, fig, num_plot, rgi, res_or_thick='both'):
    if num_plot <5:
        ax = fig.add_subplot(2,4,num_plot)

    else:
        ax = fig.add_subplot(2,3,num_plot-1)

    ax.set_title(rgi, fontsize=FONTSIZE_BIG)

    # transform lat lon to meters
    x_grid, y_grid = grid_coords.iloc[:,0], grid_coords.iloc[:,1]
    x_measurement, y_measurement = measurement_coords.iloc[:,0], measurement_coords.iloc[:,1]

    # plot ice thickness and residuals depending on what is wanted
    if res_or_thick == 'thickness':
        p1 = ax.scatter(x_grid, y_grid, c=grid_thickness, cmap='viridis',marker='.', s=20, alpha=0.8)
        # -------------------------------------
        # colorbars
        cbar1 = plt.colorbar(p1, ax=ax)
        cbar1.ax.tick_params(labelsize=FONTSIZE_MEDIUM)
        # Set the number of ticks you want
        locator = ticker.MaxNLocator(nbins=3)
        cbar1.locator = locator
        cbar1.update_ticks()
        # Set the label of the colorbar only in the last plot
        if num_plot == 7:
            cbar1.ax.set_ylabel('Thickness $H_\mathrm{PINN}$ [m]', fontsize=FONTSIZE_BIG)

    if res_or_thick == 'residual':
        p1 = ax.scatter(x_grid, y_grid, c='#d8d8d8',marker='.', s=20, alpha=0.8)
        p2 = ax.scatter(x_measurement, y_measurement, c=residuals, cmap='RdBu', vmin=-100, vmax=100,marker='.', s=20)
        # -------------------------------------
        # colorbars
        if num_plot ==7:
            cbar2 = plt.colorbar(p2, ax=ax, extend='both')
            cbar2.ax.set_ylabel('$H_\mathrm{GPR}-H_\mathrm{PINN}$', fontsize=FONTSIZE_BIG)
            cbar2.ax.tick_params(labelsize=FONTSIZE_MEDIUM)
            locator = ticker.MaxNLocator(nbins=1)
            cbar2.locator = locator
            cbar2.update_ticks()

    if res_or_thick == 'both':
        p1 = ax.scatter(x_grid, y_grid, c=grid_thickness, cmap='viridis',marker='.', s=20, alpha=0.8)
        p2 = ax.scatter(x_measurement, y_measurement, c=residuals, cmap='RdBu', vmin=-50, vmax=50,marker='.', s=20)
        # -------------------------------------
        # colorbars
        # cbar1 is for the ice thickness
        cbar1 = plt.colorbar(p1, ax=ax)
        cbar1.ax.tick_params(labelsize=FONTSIZE_MEDIUM)
        # Set the number of ticks you want
        locator = ticker.MaxNLocator(nbins=3)
        cbar1.locator = locator
        cbar1.update_ticks()
        # Set the label of the colorbar only in the last plot
        if num_plot == 7:
            cbar1.ax.set_ylabel('Thickness $H_\mathrm{PINN}$ [m]', fontsize=FONTSIZE_BIG)
        # cbar2 is for the residuals, only show it in the first plot as an inset
        if num_plot ==1:
            cbaxes = inset_axes(ax, width="30%", height="3%", loc='upper right', borderpad=2)
            cbar2 = plt.colorbar(p2, cax=cbaxes,  orientation='horizontal', extend='both')
            cbar2.ax.set_xlabel('$H_\mathrm{GPR}-H_\mathrm{PINN}$', fontsize=FONTSIZE_MEDIUM)
            cbar2.ax.tick_params(labelsize=FONTSIZE_MEDIUM)
            locator = ticker.MaxNLocator(nbins=1)
            cbar2.locator = locator
            cbar2.update_ticks()


    ax_formatter(ax, x_grid, y_grid)
    # -------------------------------------
    # Add the labels to each plot
    if SUBLABEL is not None:
        if num_plot<5:
            ax.text(-0.1, 1.1, SUBLABEL[num_plot-1], fontsize=FONTSIZE_BIG, transform=ax.transAxes)
        else:
            ax.text(-0.1, 1.05, SUBLABEL[num_plot-1], fontsize=FONTSIZE_BIG, transform=ax.transAxes)

    return fig

def plot_all_residuals_from_df(grid_df, residuals_df, fig, savedir, res_or_thick='both' ):
    grouped_grid = grid_df.groupby('RGI_ID')
    grouped_residuals = residuals_df.groupby('RGI_ID')

    for rgi, grid in grouped_grid:
        num_plot = GLACIER_IDS[rgi]['num_plot']
        residuals = grouped_residuals.get_group(rgi)
        fig = plot_residuals(grid[['POINT_LON', 'POINT_LAT']], residuals[['POINT_LON', 'POINT_LAT']], grid['pinn_thickness'], residuals['residual'], fig, num_plot=num_plot, rgi=rgi, res_or_thick=res_or_thick)
        fig.subplots_adjust(hspace=0.2)
        plot_velocity_predictions(grid[['POINT_LON', 'POINT_LAT']], grid[['depth-averaged_velocity_x', 'depth-averaged_velocity_y']].values, savedir, rgi)
    return fig


def predict_and_plot(gpu: int, datadir:str, gridpath: str, measurementpath:str, figure, num_plot: int, rgi_id: str=None, saving_grid_df: pd.DataFrame=None, saving_residuals_df: pd.DataFrame=None, res_or_thick: str='both'):
    """Evaluate the model on the glacier of given rgi_id , saves the predictions in the given dataframe and plots the residuals to the measurements and the predicted depth-averaged velocity.
    Args:
        gpu (int): GPU to use.
        datadir (str): Directory where the model is saved.
        gridpath (str): Path to the gridded data.
        measurementpath (str): Path to the measurements.
        figure (plt.figure): Figure to plot the results.
        num_plot (int): Number of the plot in the figure.
        rgi_id (str): RGI ID of the glacier to predict ice thickness and depth-averaged velocity for.
        saving_grid_df (pd.DataFrame): Dataframe to save the predictions on the grid. If None, the predictions are not saved.
        saving_residuals_df (pd.DataFrame): Dataframe to save the residuals. If None, the residuals are not saved.
        res_or_thick (str): Plot only residuals or thickness or both.
    Returns:
        figure (plt.figure): Figure with the added plot."""
    pl.seed_everything(42, workers=True)

    try:
        config = read_config(datadir+'/config.yaml')
        loaded_model = PL_PINN.load_from_checkpoint(datadir+"/checkpoints/last.ckpt")
    except:
        print("Could not load model from ", datadir)
        return figure, saving_grid_df, saving_residuals_df
    trainer = Trainer(accelerator='gpu', devices=[gpu])


    ## prepare prediction on grid
    config["ds"]["labeled_sample_size"]=0
    config["ds"]["unlabeled_sample_size"]=1.0
    config["ds"]["data_dir_unlabeled"]=[gridpath]


    if 'num_points' in config["ds"]:
        del config["ds"]["num_points"]
    config["ds"]["glacier_ids"] = []
    if rgi_id is None:
        rgi_id = datadir.split("_")[-3]
        print(rgi_id)

    ## Prediction on grid
    gridded_dataset = PL_GlacierDataset(config)
    gridded_dataset.unlabeled_data = gridded_dataset.unlabeled_data[(gridded_dataset.unlabeled_data.RGI_ID==rgi_id)]


    predictions_on_grid = trainer.predict(loaded_model, datamodule = gridded_dataset)
    pred_thicknesses_on_grid = np.concatenate([thick[0] for thick in predictions_on_grid]).ravel()
    velocities_on_grid = np.concatenate([vel[1] for vel in predictions_on_grid])
    grid_coords = gridded_dataset.dataset.inputs[['POINT_LON', 'POINT_LAT']] # are in epsg25833

    # prepare predictions on measurements
    config["ds"]["data_dir_labeled"]=[measurementpath]
    config["ds"]["labeled_sample_size"]=1.0
    config["ds"]["unlabeled_sample_size"]=.0
    config["ds"]["min_years"]=2000
    measurement_dataset = PL_GlacierDataset(config)

    measurement_dataset.labeled_data = measurement_dataset.labeled_data[(measurement_dataset.labeled_data.RGI_ID==rgi_id)]

    ## Prediction on measurements
    predictions_on_measurements = trainer.predict(loaded_model, datamodule = measurement_dataset)
    eval = trainer.validate(loaded_model, datamodule = measurement_dataset)
    print(rgi_id, eval)
    pred_thicknesses_on_measurements = np.concatenate([thick[0] for thick in predictions_on_measurements]).ravel()

    residual_prediction_to_measurement = measurement_dataset.dataset.labeled_dataset.THICKNESS-pred_thicknesses_on_measurements
    measurement_coords = measurement_dataset.dataset.inputs[['POINT_LON', 'POINT_LAT']] # are in epsg25833

    # write predictions to dataframe if wanted
    if saving_grid_df is not None:
        df = pd.DataFrame({
                           'POINT_LON':grid_coords.iloc[:,0],
                           'POINT_LAT':grid_coords.iloc[:,1],
                           'pinn_thickness':pred_thicknesses_on_grid,
                           'depth-averaged_velocity_x':velocities_on_grid[:,0],
                           'depth-averaged_velocity_y':velocities_on_grid[:,1],
                           })
        df['RGI_ID'] = rgi_id
        saving_grid_df = pd.concat([saving_grid_df, df])


    if saving_residuals_df is not None:
        df = pd.DataFrame({
                           'POINT_LON':measurement_coords.iloc[:,0],
                           'POINT_LAT':measurement_coords.iloc[:,1],
                           'residual':residual_prediction_to_measurement})
        df['RGI_ID'] = rgi_id
        saving_residuals_df = pd.concat([saving_residuals_df, df])

    ## Plotting
    figure = plot_residuals(grid_coords, measurement_coords, pred_thicknesses_on_grid, residual_prediction_to_measurement, figure, num_plot, rgi_id, res_or_thick=res_or_thick)
    print("lowest predicted thickness: ", np.min(pred_thicknesses_on_grid))
    print('Root mean squared residual to measurement: ',np.sqrt(np.mean(residual_prediction_to_measurement**2)))

    plot_velocity_predictions(grid_coords, velocities_on_grid, datadir, rgi_id)

    return figure, saving_grid_df, saving_residuals_df

def make_LOGO_figure(gpu: int, directory:str, gridpath: str, measurementpath:str, res_or_thick='both'):
    """Make the figure for the LOGO test glaciers with the predictions and residuals to the measurements.
    Args:
        gpu (int): GPU to use.
        directory (str): Directory where the models are saved.
        gridpath (str): Path to the gridded data.
        measurementpath (str): Path to the measurements.
        res_or_thick (str): Plot only residuals or predicted ice thickness or both."""

    plt.style.use('default')
    figure = plt.figure(figsize=(16,12)) # (16,12) for paper

    # checking if the predictions are already saved, if not we make them
    if not os.path.exists(os.path.join(directory, 'LOGOglacierspredictions_on_grid.csv')):
        saving_grid_df = pd.DataFrame()
        saving_residuals_df = pd.DataFrame()
        for subdir in os.listdir(directory):
            subdir_path = os.path.join(directory, subdir)
            if os.path.isdir(subdir_path):
                rgi_id = subdir_path.split("_")[-3]

                figure, saving_grid_df, saving_residuals_df = predict_and_plot(gpu, subdir_path, gridpath, measurementpath, figure,
                                                        num_plot=GLACIER_IDS[rgi_id]['num_plot'],
                                                        saving_grid_df=saving_grid_df,
                                                        saving_residuals_df=saving_residuals_df,res_or_thick=res_or_thick)

        saving_grid_df.to_csv(os.path.join(directory,'LOGOglacierspredictions_on_grid.csv'))
        saving_residuals_df.to_csv(os.path.join(directory,'LOGOglaciersresiduals.csv'))
        figure.savefig(os.path.join(directory,'LOGOresiduals.png'))

    # if the predictions are already there we just load them and plot them
    else:
        saving_grid_df = pd.read_csv(os.path.join(directory, 'LOGOglacierspredictions_on_grid.csv'), low_memory=False)
        saving_residuals_df = pd.read_csv(os.path.join(directory, 'LOGOglaciersresiduals.csv'), low_memory=False)
        figure = plot_all_residuals_from_df(saving_grid_df, saving_residuals_df, figure, savedir=directory, res_or_thick=res_or_thick)
        if res_or_thick == 'both':
            figure.savefig(os.path.join(directory,'LOGOresiduals_new.png'), dpi=300)
        elif res_or_thick == 'thickness':
            figure.savefig(os.path.join(directory,'LOGOnoresidual_new.png'), dpi=300)
        else:
            figure.savefig(os.path.join(directory,'LOGOonlyresidual_new.png'), dpi=300)


def start():
    """Evaluation and prediction."""
    # Command line arguments
    parser = argparse.ArgumentParser(
        prog="predictLOGOglaciers.py", description="Makes predicitons for all the LOGO test glaciers and plots the ice thickness with the residuals to measurements."
    )
    parser.add_argument("--gpu", type=int, default=0, help="GPU to use.")
    parser.add_argument("--res_or_thick", type=str, default='both', help="Plot only residuals or thickness or both.")
    args = parser.parse_args()

    directory = "CV/allunmappedglaciers_notsurging/reproduce_tests/test30_spitsbergen_completedhdt_correct_depth_avg_moredata"
    # get datasets
    measurementpath = "data/spitsbergen_measurements_aggregated_nosurges_dhdt2014smoothed_complete_moremeasurements.csv"
    gridpath ="data/spitsbergen_allunmapped_griddeddata_nosurges_dhdt2014smoothed_complete.csv"

    make_LOGO_figure(args.gpu, directory, gridpath, measurementpath, res_or_thick=args.res_or_thick)


if __name__ == "__main__":
    start()