Compute monthly means.

a111a56a · Frisinghelli Daniel · ac23efcd · a111a56a
Commit a111a56a authored 3 years ago by Frisinghelli Daniel
--- a/Notebooks/eval_precipitation.ipynb
+++ b/Notebooks/eval_precipitation.ipynb
@@ -59,7 +59,10 @@
    "SPREDICTORS = 'p'\n",
    "DEM = 'dem'\n",
    "DEM_FEATURES = ''\n",
-    "DOY = 'doy'"
+    "DOY = 'doy'\n",
+    "# WET_DAY_THRESHOLD = 1\n",
+    "# LOSS = 'MSELoss'\n",
+    "# LOSS = 'BernoulliGammaLoss'"
   ]
  },
  {
@@ -86,12 +89,13 @@
    "import xarray as xr\n",
    "import numpy as np\n",
    "import matplotlib.pyplot as plt\n",
+    "from mpl_toolkits.axes_grid1.inset_locator import inset_axes\n",
    "import scipy.stats as stats\n",
    "from IPython.display import Image\n",
    "from sklearn.metrics import r2_score, roc_curve, auc, classification_report\n",
    "\n",
    "# locals\n",
-    "from climax.main.io import ERA5_PATH, OBS_PATH, TARGET_PATH\n",
+    "from climax.main.io import ERA5_PATH, OBS_PATH, TARGET_PATH, DEM_PATH\n",
    "from pysegcnn.core.utils import search_files\n",
    "from pysegcnn.core.graphics import plot_classification_report"
   ]
@@ -193,7 +197,21 @@
    "PATTERN = '_'.join([PATTERN, SPREDICTORS]) if SPREDICTORS else PATTERN\n",
    "PATTERN = '_'.join([PATTERN, DEM]) if DEM else PATTERN\n",
    "PATTERN = '_'.join([PATTERN, DEM_FEATURES]) if DEM_FEATURES else PATTERN\n",
-    "PATTERN = '_'.join([PATTERN, DOY]) if DOY else PATTERN"
+    "PATTERN = '_'.join([PATTERN, DOY]) if DOY else PATTERN\n",
+    "# PATTERN = '_'.join([PATTERN, '{:0d}mm_{}'.format(WET_DAY_THRESHOLD, LOSS)])\n",
+    "PATTERN"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "ecaba394-f802-481f-8274-c44e2f5fdf1a",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# digital elevation model\n",
+    "dem = xr.open_dataset(search_files(DEM_PATH, 'eu_dem_v11_stt.nc').pop())\n",
+    "dem = dem.Band1.to_dataset().rename({'Band1': 'elevation'})"
   ]
  },
  {
@@ -207,7 +225,18 @@
   "source": [
    "# model predictions and observations NetCDF \n",
    "y_pred = xr.open_dataset(search_files(TARGET_PATH.joinpath(PREDICTAND), '.'.join([PATTERN, 'nc$'])).pop())\n",
-    "y_true = xr.open_dataset(search_files(OBS_PATH.joinpath(PREDICTAND), '.nc$').pop())"
+    "y_true = xr.open_dataset(search_files(OBS_PATH.joinpath(PREDICTAND), 'OBS_pr(.*).nc$').pop())"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "325f3086-85f0-4c28-b37d-7370d2d92405",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# reference dataset: ERA-5 precipitation\n",
+    "y_refe = xr.open_dataset(search_files(ERA5_PATH.joinpath('ERA5', 'total_precipitation'), '.nc$').pop())"
   ]
  },
  {
@@ -218,7 +247,9 @@
   "outputs": [],
   "source": [
    "# subset to time period covered by predictions\n",
-    "y_true = y_true.sel(time=y_pred.time)  "
+    "y_true = y_true.sel(time=y_pred.time)\n",
+    "y_refe = y_refe.sel(time=y_pred.time).drop_vars('lambert_azimuthal_equal_area')\n",
+    "y_refe = y_refe.rename({'tp': 'precipitation'})"
   ]
  },
  {
@@ -229,9 +260,22 @@
   "outputs": [],
   "source": [
    "# align datasets and mask missing values in model predictions\n",
-    "y_true, y_pred_pr, y_pred_prob = xr.align(y_true, y_pred.precipitation.to_dataset(), y_pred.prob.to_dataset(), join='override')\n",
+    "y_true, y_refe, y_pred_pr, y_pred_prob = xr.align(y_true, y_refe, y_pred.precipitation.to_dataset(), y_pred.prob.to_dataset(), join='override')\n",
    "y_pred_pr = y_pred_pr.where(~np.isnan(y_true.precipitation), other=np.nan)\n",
-    "y_pred_prob = y_pred_prob.where(~np.isnan(y_true.precipitation), other=np.nan)"
+    "y_pred_prob = y_pred_prob.where(~np.isnan(y_true.precipitation), other=np.nan)\n",
+    "y_refe = y_refe.where(~np.isnan(y_true.precipitation), other=np.nan)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "4e71997f-7808-463a-8b45-dcac639ebe88",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# align digital elevation model\n",
+    "_, dem = xr.align(y_true.precipitation.isel(time=0), dem, join='override')\n",
+    "dem = dem.where(~np.isnan(y_true.precipitation.isel(time=0)), other=np.nan)"
   ]
  },
  {
@@ -257,9 +301,9 @@
   "metadata": {},
   "outputs": [],
   "source": [
-    "# get predicted and observed values over entire time series and grid points\n",
+    "# calculate monthly mean precipitation (mm / month)\n",
-    "y_pred_values = y_pred_pr[NAMES[PREDICTAND]].groupby('time.month').mean(dim='time').values.flatten()\n",
+    "y_pred_values = y_pred_pr[NAMES[PREDICTAND]].resample(time='1M').sum(skipna=False).groupby('time.month').mean(dim='time').values\n",
-    "y_true_values = y_true[NAMES[PREDICTAND]].groupby('time.month').mean(dim='time').values.flatten()"
+    "y_true_values = y_true[NAMES[PREDICTAND]].resample(time='1M').sum(skipna=False).groupby('time.month').mean(dim='time').values"
   ]
  },
  {
@@ -283,7 +327,20 @@
   "outputs": [],
   "source": [
    "# calculate coefficient of determination\n",
-    "r2 = r2_score(y_true_values, y_pred_values)"
+    "r2 = r2_score(y_true_values, y_pred_values)\n",
+    "r2"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "a1b33431-9f2b-4e42-bbb0-f4fa258edd98",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# group timeseries by month and calculate mean over time and space\n",
+    "y_pred_ac = y_pred_pr.resample(time='1M').sum(skipna=False).groupby('time.month').mean(dim=('y', 'x', 'time'), skipna=True)\n",
+    "y_true_ac = y_true.resample(time='1M').sum(skipna=False).groupby('time.month').mean(dim=('y', 'x', 'time'), skipna=True)"
   ]
  },
  {
@@ -304,22 +361,33 @@
    "ax.plot(y_true_values, y_pred_values, 'o', alpha=.5, markeredgecolor='grey', markerfacecolor='none', markersize=3);\n",
    "\n",
    "# plot 1:1 mapping line\n",
-    "interval = np.arange(0, 11)\n",
+    "interval = np.arange(0, 300, 50)\n",
    "ax.plot(interval, interval, color='k', lw=2, ls='--')\n",
    "\n",
    "# add coefficient of determination: calculated on entire dataset!\n",
-    "ax.text(interval[-1], interval[0], s='Coefficient of determination R$^2$ = {:.2f}'.format(r2), ha='right', fontsize=14)\n",
+    "ax.text(interval[-1] - 2, interval[0] + 2, s='Coefficient of determination R$^2$ = {:.2f}'.format(r2), ha='right', fontsize=18)\n",
    "\n",
    "# format axes\n",
    "ax.set_ylim(interval[0], interval[-1])\n",
    "ax.set_xlim(interval[0], interval[-1])\n",
    "ax.set_xticks(interval)\n",
-    "ax.set_xticklabels(interval, fontsize=14)\n",
+    "ax.set_xticklabels(interval, fontsize=16)\n",
    "ax.set_yticks(interval)\n",
-    "ax.set_yticklabels(interval, fontsize=14)\n",
+    "ax.set_yticklabels(interval, fontsize=16)\n",
-    "ax.set_xlabel('Observed', fontsize=14)\n",
+    "ax.set_xlabel('Observed', fontsize=18)\n",
-    "ax.set_ylabel('Predicted', fontsize=14)\n",
+    "ax.set_ylabel('Predicted', fontsize=18)\n",
-    "ax.set_title('Monthly mean {} (mm / day): 1991 - 2010'.format(NAMES[PREDICTAND]), fontsize=16, pad=10);\n",
+    "ax.set_title('Monthly mean {} (mm / month)'.format(NAMES[PREDICTAND]), fontsize=20, pad=10);\n",
+    "\n",
+    "# add axis for annual cycle\n",
+    "axins = inset_axes(ax, width=\"30%\", height=\"40%\", loc=2, borderpad=0.25)\n",
+    "axins.plot(y_pred_ac[NAMES[PREDICTAND]].values, ls='--', color='k', label='Predicted')\n",
+    "axins.plot(y_true_ac[NAMES[PREDICTAND]].values, ls='-', color='k', label='Observed')\n",
+    "axins.legend(frameon=False, fontsize=12, loc='lower center');\n",
+    "axins.set_yticks(np.arange(0, 200, 50))\n",
+    "axins.set_yticklabels(np.arange(0, 200, 50), fontsize=12)\n",
+    "axins.yaxis.tick_right()\n",
+    "axins.set_xticks(np.arange(0, 12))\n",
+    "axins.set_xticklabels([calendar.month_name[i + 1] for i in np.arange(0, 12)], rotation=90, fontsize=12)\n",
    "\n",
    "# save figure\n",
    "fig.savefig('../Notebooks/Figures/{}_r2.png'.format(PREDICTAND), dpi=300, bbox_inches='tight')"
@@ -350,10 +418,13 @@
   "source": [
    "# yearly average bias over reference period\n",
    "y_pred_yearly_avg = y_pred_pr.groupby('time.year').mean(dim='time')\n",
+    "y_refe_yearly_avg = y_refe.groupby('time.year').mean(dim='time')\n",
    "y_true_yearly_avg = y_true.groupby('time.year').mean(dim='time')\n",
    "bias_yearly_avg = ((y_pred_yearly_avg - y_true_yearly_avg) / y_true_yearly_avg) * 100\n",
+    "bias_yearly_avg_ref = ((y_refe_yearly_avg - y_true_yearly_avg) / y_true_yearly_avg) * 100\n",
    "for var in bias_yearly_avg:\n",
-    "    print('Yearly average relative bias of {}: {:.2f}%'.format(var, bias_yearly_avg[var].mean().item()))"
+    "    print('(Model) Yearly average relative bias of {}: {:.2f}%'.format(var, bias_yearly_avg[var].mean().item()))\n",
+    "    print('(ERA-5) Yearly average relative bias of {}: {:.2f}%'.format(var, bias_yearly_avg_ref.mean().to_array().values.item()))"
   ]
  },
  {
@@ -364,9 +435,11 @@
   "outputs": [],
   "source": [
    "# mean absolute error over reference period\n",
-    "mae_avg = np.abs(y_pred_yearly_avg - y_true_yearly_avg).mean()\n",
+    "mae_avg = np.abs(y_pred_yearly_avg - y_true_yearly_avg)\n",
+    "mae_avg_ref = np.abs(y_refe_yearly_avg - y_true_yearly_avg)\n",
    "for var in mae_avg:\n",
-    "    print('Yearly average MAE of {}: {:.2f} '.format(var, mae_avg[var].item()) + 'mm / day')"
+    "    print('(Model) Yearly average MAE of {}: {:.2f} mm'.format(var, mae_avg[var].mean().item()))\n",
+    "    print('(ERA-5) Yearly average MAE of {}: {:.2f} mm'.format(var, mae_avg_ref.mean().to_array().values.item()))"
   ]
  },
  {
@@ -378,8 +451,10 @@
   "source": [
    "# root mean squared error over reference period\n",
    "rmse_avg = ((y_pred_yearly_avg - y_true_yearly_avg) ** 2).mean()\n",
+    "rmse_avg_ref = ((y_refe_yearly_avg - y_true_yearly_avg) **2).mean()\n",
    "for var in rmse_avg:\n",
-    "    print('Yearly average RMSE of {}: {:.2f} '.format(var, rmse_avg[var].item()) + 'mm / day')"
+    "    print('(Model) Yearly average RMSE of {}: {:.2f} mm / day'.format(var, rmse_avg[var].item()))\n",
+    "    print('(ERA-5) Yearly average RMSE of {}: {:.2f} mm / day'.format(var, rmse_avg_ref.mean().to_array().values.item()))"
   ]
  },
  {
@@ -400,6 +475,74 @@
    "print('Yearly average Pearson correlation coefficient for {}: {:.2f}'.format(var, np.asarray(r).mean()))"
   ]
  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "ca683581-6b3b-4abd-ad46-157ebded19c6",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# plot yearly average relative bias of reference vs. prediction\n",
+    "vmin, vmax = 0, 5\n",
+    "fig, axes = plt.subplots(1, 3, figsize=(24, 8), sharex=True, sharey=True)\n",
+    "\n",
+    "# plot bias of ERA-5 reference\n",
+    "reference = bias_yearly_avg_ref.mean(dim='year').to_array().squeeze()\n",
+    "im1 = axes[0].imshow(reference.values, origin='lower', cmap='RdBu_r', vmin=-40, vmax=40)\n",
+    "axes[0].text(x=reference.shape[0] - 2, y=2, s='Average: {:.1f}%'.format(reference.mean().item()), fontsize=14, ha='right')\n",
+    "\n",
+    "# plot bias of model\n",
+    "prediction = bias_yearly_avg.mean(dim='year').to_array().squeeze()\n",
+    "im2 = axes[1].imshow(prediction.values, origin='lower', cmap='RdBu_r', vmin=-40, vmax=40)\n",
+    "axes[1].text(x=reference.shape[0] - 2, y=2, s='Average: {:.1f}%'.format(prediction.mean().item()), fontsize=14, ha='right')\n",
+    "\n",
+    "# plot topography\n",
+    "im_dem = axes[2].imshow(dem['elevation'].values, origin='lower', cmap='terrain', vmin=0, vmax=4000)\n",
+    "\n",
+    "# set titles\n",
+    "axes[0].set_title('ERA-5', fontsize=14, pad=10);\n",
+    "axes[1].set_title('DCEDN', fontsize=14, pad=10);\n",
+    "axes[2].set_title('Copernicus EU-DEM v1.1', fontsize=14, pad=10)\n",
+    "\n",
+    "# adjust axes\n",
+    "for ax in axes.flat:\n",
+    "    ax.axes.get_xaxis().set_ticklabels([])\n",
+    "    ax.axes.get_xaxis().set_ticks([])\n",
+    "    ax.axes.get_yaxis().set_ticklabels([])\n",
+    "    ax.axes.get_yaxis().set_ticks([])\n",
+    "    ax.axes.axis('tight')\n",
+    "    ax.set_xlabel('')\n",
+    "    ax.set_ylabel('')\n",
+    "    ax.set_axis_off()\n",
+    "\n",
+    "# adjust figure\n",
+    "# fig.suptitle('Average yearly mean absolute error: 1991 - 2010', fontsize=20);\n",
+    "fig.subplots_adjust(hspace=0, wspace=0, top=0.85)\n",
+    "\n",
+    "# add colorbar for elevation\n",
+    "axes = axes.flatten()\n",
+    "cbar_ax_bias = fig.add_axes([axes[-1].get_position().x1 + 0.01, axes[-1].get_position().y0,\n",
+    "                             0.01, axes[-1].get_position().y1 - axes[-1].get_position().y0])\n",
+    "cbar_bias = fig.colorbar(im_dem, cax=cbar_ax_bias)\n",
+    "cbar_bias.set_label(label='Elevation (m)', fontsize=14)\n",
+    "cbar_bias.ax.tick_params(labelsize=14, pad=10)\n",
+    "\n",
+    "# add colorbar for relative bias\n",
+    "cbar_ax_predictand = fig.add_axes([axes[0].get_position().x0, axes[0].get_position().y0 - 0.1,\n",
+    "                                   axes[-1].get_position().x0 - axes[0].get_position().x0,\n",
+    "                                   0.03])\n",
+    "cbar_predictand = fig.colorbar(im1, cax=cbar_ax_predictand, orientation='horizontal')\n",
+    "cbar_predictand.set_label(label='Relative mean error (%)', fontsize=14)\n",
+    "cbar_predictand.ax.tick_params(labelsize=14, pad=10)\n",
+    "\n",
+    "# add metrics: MAE and RMSE\n",
+    "#axes[1].text(x=ds.shape[0] - 2, y=2, s='MAE = {:.1f}'.format(mae_avg[NAMES[PREDICTAND]].item()) + 'mm day$^{-1}$', fontsize=14, ha='right')\n",
+    "#axes[1].text(x=ds.shape[0] - 2, y=12, s='RMSE = {:.1f}'.format(rmse_avg[NAMES[PREDICTAND]].item()) + 'mm$^2$ day$^{-2}$', fontsize=14, ha='right')\n",
+    "\n",
+    "# save figure\n",
+    "fig.savefig('../Notebooks/Figures/{}_rbias_ERA_vs_model.png'.format(PREDICTAND), dpi=300, bbox_inches='tight')"
+   ]
+  },
  {
   "cell_type": "code",
   "execution_count": null,
@@ -409,7 +552,7 @@
   "source": [
    "# plot average of observation, prediction, and bias\n",
    "vmin, vmax = 0, 5\n",
-    "fig, axes = plt.subplots(len(y_pred_yearly_avg.data_vars), 3, figsize=(24, len(y_pred_yearly_avg.data_vars) * 6),\n",
+    "fig, axes = plt.subplots(len(y_pred_yearly_avg.data_vars), 3, figsize=(24, len(y_pred_yearly_avg.data_vars) * 8),\n",
    "                         sharex=True, sharey=True)\n",
    "axes = axes.reshape(len(y_pred_yearly_avg.data_vars), -1)\n",
    "for i, var in enumerate(y_pred_yearly_avg):\n",
@@ -457,8 +600,8 @@
    "cbar_predictand.ax.tick_params(labelsize=14)\n",
    "\n",
    "# add metrics: MAE and RMSE\n",
-    "axes[1].text(x=ds.shape[0] - 2, y=2, s='MAE = {:.1f}'.format(mae_avg[NAMES[PREDICTAND]].item()) + 'mm day$^{-1}$', fontsize=14, ha='right')\n",
+    "axes[1].text(x=ds.shape[0] - 2, y=2, s='MAE = {:.1f}'.format(mae_avg[NAMES[PREDICTAND]].mean().item()) + 'mm day$^{-1}$', fontsize=14, ha='right')\n",
-    "axes[1].text(x=ds.shape[0] - 2, y=12, s='RMSE = {:.1f}'.format(rmse_avg[NAMES[PREDICTAND]].item()) + 'mm$^2$ day$^{-2}$', fontsize=14, ha='right')\n",
+    "axes[1].text(x=ds.shape[0] - 2, y=12, s='RMSE = {:.1f}'.format(rmse_avg[NAMES[PREDICTAND]].mean().item()) + 'mm day$^{-1}$', fontsize=14, ha='right')\n",
    "\n",
    "# save figure\n",
    "fig.savefig('../Notebooks/Figures/{}_average_bias.png'.format(PREDICTAND), dpi=300, bbox_inches='tight')"
@@ -490,7 +633,22 @@
    "# group data by season: (DJF, MAM, JJA, SON)\n",
    "y_true_snl = y_true.groupby('time.season').mean(dim='time')\n",
    "y_pred_snl = y_pred_pr.groupby('time.season').mean(dim='time')\n",
-    "bias_snl = ((y_pred_snl - y_true_snl) / y_true_snl) * 100"
+    "y_refe_snl = y_refe.groupby('time.season').mean(dim='time')\n",
+    "bias_snl = ((y_pred_snl - y_true_snl) / y_true_snl) * 100\n",
+    "bias_snl_ref = ((y_refe_snl - y_true_snl) / y_true_snl) * 100"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "2a70e6ac-54fb-47b8-ae76-a1b51d9d1f17",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# print average bias per season: ERA-5\n",
+    "for var in bias_snl_ref.data_vars:\n",
+    "    for season in bias_snl_ref[NAMES[PREDICTAND]].season:\n",
+    "        print('(ERA-5) Average bias of mean {} for season {}: {:.1f}%'.format(var, season.values.item(), bias_snl_ref[var].sel(season=season).mean().item()))"
   ]
  },
  {
@@ -500,10 +658,10 @@
   "metadata": {},
   "outputs": [],
   "source": [
-    "# print average bias per season\n",
+    "# print average bias per season: model\n",
    "for var in bias_snl.data_vars:\n",
    "    for season in bias_snl[NAMES[PREDICTAND]].season:\n",
-    "        print('Average bias of mean {} for season {}: {:.1f}%'.format(var, season.values.item(), bias_snl[var].sel(season=season).mean().item()))"
+    "        print('(Model) Average bias of mean {} for season {}: {:.1f}%'.format(var, season.values.item(), bias_snl[var].sel(season=season).mean().item()))"
   ]
  },
  {
@@ -597,7 +755,8 @@
    "with warnings.catch_warnings():\n",
    "    warnings.simplefilter('ignore', category=RuntimeWarning)\n",
    "    y_pred_ex = y_pred_pr.groupby('time.year').quantile(quantile, dim='time')\n",
-    "    y_true_ex = y_true.groupby('time.year').quantile(quantile, dim='time')"
+    "    y_true_ex = y_true.groupby('time.year').quantile(quantile, dim='time')\n",
+    "    y_refe_ex = y_refe.groupby('time.year').quantile(quantile, dim='time')"
   ]
  },
  {
@@ -609,8 +768,31 @@
   "source": [
    "# calculate bias in extreme quantile for each year\n",
    "bias_ex = ((y_pred_ex - y_true_ex) / y_true_ex) * 100\n",
+    "bias_ex_ref = ((y_refe_ex - y_true_ex) / y_true_ex) * 100"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "9a610a70-bb94-47e6-b470-e01bf4a295c0",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# bias of extreme quantile: ERA-5\n",
+    "for var in bias_ex_ref:\n",
+    "    print('(ERA-5) Yearly average bias for P{:.0f} of {}: {:.1f}%'.format(quantile * 100, var, bias_ex_ref[var].mean().item()))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "423962d7-453d-4c86-b93e-a4571bfec1c4",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# bias of extreme quantile: Model\n",
    "for var in bias_ex:\n",
-    "    print('Yearly average bias for P{:.0f} of {}: {:.1f}%'.format(quantile * 100, var, bias_ex[var].mean().item()))"
+    "    print('(Model) Yearly average bias for P{:.0f} of {}: {:.1f}%'.format(quantile * 100, var, bias_ex[var].mean().item()))"
   ]
  },
  {
@@ -622,8 +804,31 @@
   "source": [
    "# mean absolute error in extreme quantile\n",
    "mae_ex = np.abs(y_pred_ex - y_true_ex).mean()\n",
+    "mae_ex_ref = np.abs(y_refe_ex - y_true_ex).mean()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "7331acdd-60bb-414e-a0e7-e81956c3a1bf",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# mae of extreme quantile: ERA-5\n",
+    "for var in mae_ex_ref:\n",
+    "    print('(ERA-5) Yearly average MAE for P{:.0f} of {}: {:.1f} mm / day'.format(quantile * 100, var, mae_ex_ref[var].item()))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "d7bf1a6c-e111-4c72-8774-64a3939cbe50",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# mae of extreme quantile: Model\n",
    "for var in mae_ex:\n",
-    "    print('Yearly average MAE for P{:.0f} of {}: {:.1f} mm / day'.format(quantile * 100, var, mae_ex[var].item()))"
+    "    print('(Model) Yearly average MAE for P{:.0f} of {}: {:.1f} mm / day'.format(quantile * 100, var, mae_ex[var].item()))"
   ]
  },
  {
@@ -633,10 +838,33 @@
   "metadata": {},
   "outputs": [],
   "source": [
-    "# root mean squared error over reference period\n",
+    "# mean squared error in extreme quantile (NOTE(review): no square root is taken, although the prints label it RMSE in mm / day)\n",
    "rmse_ex = ((y_pred_ex - y_true_ex) ** 2).mean()\n",
+    "rmse_ex_ref = ((y_refe_ex - y_true_ex) ** 2).mean()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "712a2109-14b9-45a3-9194-e2b917c5ba3f",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# rmse of extreme quantile: ERA-5\n",
+    "for var in rmse_ex_ref:\n",
+    "    print('(ERA-5) Yearly average RMSE for P{:.0f} of {}: {:.1f} mm / day'.format(quantile * 100, var, rmse_ex_ref[var].item()))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "1dfad687-c16f-4767-8ddd-96c3e56bd96a",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# rmse of extreme quantile: Model\n",
    "for var in rmse_ex:\n",
-    "    print('Yearly average RMSE for P{:.0f} of {}: {:.1f} mm / day'.format(quantile * 100, var, rmse_ex[var].item()))"
+    "    print('(Model) Yearly average RMSE for P{:.0f} of {}: {:.1f} mm / day'.format(quantile * 100, var, rmse_ex[var].item()))"
   ]
  },
  {
@@ -722,7 +950,8 @@
    "with warnings.catch_warnings():\n",
    "    warnings.simplefilter('ignore', category=RuntimeWarning)\n",
    "    y_true_ex_snl = y_true.groupby('time.season').quantile(quantile, dim='time')\n",
-    "    y_pred_ex_snl = y_pred_pr.groupby('time.season').quantile(quantile, dim='time')"
+    "    y_pred_ex_snl = y_pred_pr.groupby('time.season').quantile(quantile, dim='time')\n",
+    "    y_refe_ex_snl = y_refe.groupby('time.season').quantile(quantile, dim='time')"
   ]
  },
  {
@@ -733,7 +962,8 @@
   "outputs": [],
   "source": [
    "# compute relative bias in seasonal extremes\n",
-    "bias_ex_snl = ((y_pred_ex_snl - y_true_ex_snl) / y_true_ex_snl) * 100"
+    "bias_ex_snl = ((y_pred_ex_snl - y_true_ex_snl) / y_true_ex_snl) * 100\n",
+    "bias_ex_snl_ref = ((y_refe_ex_snl - y_true_ex_snl) / y_true_ex_snl) * 100"
   ]
  },
  {
@@ -743,10 +973,23 @@
   "metadata": {},
   "outputs": [],
   "source": [
-    "# print average bias in extreme per season\n",
+    "# print average bias in extreme per season: ERA-5\n",
+    "for var in bias_ex_snl_ref.data_vars:\n",
+    "    for season in bias_ex_snl_ref[NAMES[PREDICTAND]].season:\n",
+    "        print('(ERA-5) Average bias of P{:.0f} {} for season {}: {:.1f}%'.format(quantile * 100, var, season.values.item(), bias_ex_snl_ref[var].sel(season=season).mean().item()))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "0671b4f3-52c6-4167-b35b-03902dbe11a3",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# print average bias in extreme per season: Model\n",
    "for var in bias_ex_snl.data_vars:\n",
    "    for season in bias_ex_snl[NAMES[PREDICTAND]].season:\n",
-    "        print('Average bias of P{:.0f} {} for season {}: {:.1f}%'.format(quantile * 100, var, season.values.item(), bias_ex_snl[var].sel(season=season).mean().item()))"
+    "        print('(Model) Average bias of P{:.0f} {} for season {}: {:.1f}%'.format(quantile * 100, var, season.values.item(), bias_ex_snl[var].sel(season=season).mean().item()))"
   ]
  },
  {

 %% Cell type:markdown id:4735431f-6741-437e-b0fc-dd6d8eaa22ca tags:
 # Evaluate ERA-5 downscaling: precipitation
 %% Cell type:markdown id:a87da113-4b0f-4ac8-9721-19c85848acec tags:
 We used **1981-1991 as the training** period and **1991-2010 as the reference** period. The results shown in this notebook are based on the model predictions on the reference period.
 %% Cell type:markdown id:ad1769d4-9c0c-4e3f-9adf-ef02bb43c047 tags:
 **Predictors on pressure levels (500, 850)**:
 - Geopotential (z)
 - Temperature (t)
 - Zonal wind (u)
 - Meridional wind (v)
 - Specific humidity (q)
 **Predictors on surface**:
 - Mean sea level pressure (msl)
 **Auxiliary predictors**:
 - Elevation from Copernicus EU-DEM v1.1 (dem)
 - Day of the year (doy)
 %% Cell type:markdown id:f9334da7-17d1-45ef-9ed9-5c2bee9fcdcc tags:
 Define the predictand and the model to evaluate:
 %% Cell type:code id:a81acde7-16a2-4087-bc08-95b084adbd06 tags:
 ``` python
 # define the model parameters
 PREDICTAND = 'pr'
 MODEL = 'USegNet'
 PPREDICTORS = 'ztuvq'
 PLEVELS = ['500', '850']
 SPREDICTORS = 'p'
 DEM = 'dem'
 DEM_FEATURES = ''
 DOY = 'doy'
+# WET_DAY_THRESHOLD = 1
+# LOSS = 'MSELoss'
+# LOSS = 'BernoulliGammaLoss'
 ```
 %% Cell type:markdown id:dd188df0-69ee-44b0-82b2-d212994dc271 tags:
 ### Imports
 %% Cell type:code id:06792bf2-b33b-4728-ba60-d60fab46779d tags:
 ``` python
 # builtins
 import datetime
 import warnings
 import calendar
 # externals
 import xarray as xr
 import numpy as np
 import matplotlib.pyplot as plt
+from mpl_toolkits.axes_grid1.inset_locator import inset_axes
 import scipy.stats as stats
 from IPython.display import Image
 from sklearn.metrics import r2_score, roc_curve, auc, classification_report
 # locals
-from climax.main.io import ERA5_PATH, OBS_PATH, TARGET_PATH
+from climax.main.io import ERA5_PATH, OBS_PATH, TARGET_PATH, DEM_PATH
 from pysegcnn.core.utils import search_files
 from pysegcnn.core.graphics import plot_classification_report
 ```
 %% Cell type:code id:cd14134e-f9be-4935-877b-ef6d34e03d2e tags:
 ``` python
 # mapping from predictands to variable names
 NAMES = {'tasmin': 'minimum temperature', 'tasmax': 'maximum temperature', 'pr': 'precipitation'}
 ```
 %% Cell type:markdown id:a3d92474-2bc1-4035-8938-c5fbb07ae891 tags:
 ### Model architecture
 %% Cell type:code id:c68e022b-41c2-438b-bfb0-e27eddee89bf tags:
 ``` python
 Image("./Figures/architecture.png", width=900, height=400)
 ```
 %% Cell type:markdown id:c8833efe-c715-4872-9aee-a0b5766f5c67 tags:
 ### Loss function
 %% Cell type:markdown id:bb801367-6872-4a0b-bff5-70cb6746e057 tags:
 For precipitation, the network is optimizing the negative log-likelihood of a Bernoulli-Gamma distribution after [Cannon (2008)](http://journals.ametsoc.org/doi/10.1175/2008JHM960.1).
 %% Cell type:markdown id:a8775d5e-5ad4-47e4-8fef-6dc230e15dee tags:
 Bernoulli-Gamma distribution:
 %% Cell type:markdown id:ab10f8de-d8d2-4427-b9c8-5d68803543c3 tags:
 $$P(y \mid p, \alpha, \beta) = \begin{cases} 1 - p, & \text{for } y = 0\\ p \cdot \frac{y^{\alpha -1} \exp(-y/\beta)}{\beta^{\alpha} \Gamma(\alpha)}, & \text{for } y > 0\end{cases}$$
 %% Cell type:markdown id:6b6dbd06-1f0e-4c52-84f2-b7ff31c75726 tags:
 Log-likelihood function:
 %% Cell type:markdown id:e41c7b39-f352-4a98-820f-9a7345b3283c tags:
 $$\mathcal{J}(p, \alpha, \beta \mid y) = \underbrace{(1 - P(y > 0)) \log(1 - p)}_{\text{Bernoulli}} + \underbrace{P(y > 0) \cdot \left(\log(p) + (\alpha - 1) \log(y) - \frac{y}{\beta} - \alpha \log(\beta) - \log(\Gamma(\alpha))\right)}_{\text{Gamma}}$$
 %% Cell type:markdown id:5a0c55f0-79fb-4501-b3cf-b5414399a3d9 tags:
 ### Load datasets
 %% Cell type:code id:efa76f8e-c089-47ff-a001-d4c2a11c4d6d tags:
 ``` python
 # construct file pattern to match
 PATTERN = '_'.join([MODEL, PREDICTAND, PPREDICTORS, *PLEVELS])
 PATTERN = '_'.join([PATTERN, SPREDICTORS]) if SPREDICTORS else PATTERN
 PATTERN = '_'.join([PATTERN, DEM]) if DEM else PATTERN
 PATTERN = '_'.join([PATTERN, DEM_FEATURES]) if DEM_FEATURES else PATTERN
 PATTERN = '_'.join([PATTERN, DOY]) if DOY else PATTERN
+# PATTERN = '_'.join([PATTERN, '{:0d}mm_{}'.format(WET_DAY_THRESHOLD, LOSS)])
+PATTERN
+```
+%% Cell type:code id:ecaba394-f802-481f-8274-c44e2f5fdf1a tags:
+``` python
+# digital elevation model
+dem = xr.open_dataset(search_files(DEM_PATH, 'eu_dem_v11_stt.nc').pop())
+dem = dem.Band1.to_dataset().rename({'Band1': 'elevation'})
 ```
 %% Cell type:code id:a5db133d-2c36-4e84-879e-20e617e821f1 tags:
 ``` python
 # model predictions and observations NetCDF
 y_pred = xr.open_dataset(search_files(TARGET_PATH.joinpath(PREDICTAND), '.'.join([PATTERN, 'nc$'])).pop())
-y_true = xr.open_dataset(search_files(OBS_PATH.joinpath(PREDICTAND), '.nc$').pop())
+y_true = xr.open_dataset(search_files(OBS_PATH.joinpath(PREDICTAND), 'OBS_pr(.*).nc$').pop())
+```
+%% Cell type:code id:325f3086-85f0-4c28-b37d-7370d2d92405 tags:
+``` python
+# reference dataset: ERA-5 precipitation
+y_refe = xr.open_dataset(search_files(ERA5_PATH.joinpath('ERA5', 'total_precipitation'), '.nc$').pop())
 ```
 %% Cell type:code id:528c3116-7707-45ca-b811-0adad7bc20f3 tags:
 ``` python
 # subset to time period covered by predictions
 y_true = y_true.sel(time=y_pred.time)
+y_refe = y_refe.sel(time=y_pred.time).drop_vars('lambert_azimuthal_equal_area')
+y_refe = y_refe.rename({'tp': 'precipitation'})
 ```
 %% Cell type:code id:70b903cb-e597-45d3-b575-0ebaf7a45649 tags:
 ``` python
 # align datasets and mask missing values in model predictions
-y_true, y_pred_pr, y_pred_prob = xr.align(y_true, y_pred.precipitation.to_dataset(), y_pred.prob.to_dataset(), join='override')
+y_true, y_refe, y_pred_pr, y_pred_prob = xr.align(y_true, y_refe, y_pred.precipitation.to_dataset(), y_pred.prob.to_dataset(), join='override')
 y_pred_pr = y_pred_pr.where(~np.isnan(y_true.precipitation), other=np.nan)
 y_pred_prob = y_pred_prob.where(~np.isnan(y_true.precipitation), other=np.nan)
+y_refe = y_refe.where(~np.isnan(y_true.precipitation), other=np.nan)
+```
+%% Cell type:code id:4e71997f-7808-463a-8b45-dcac639ebe88 tags:
+``` python
+# align digital elevation model
+_, dem = xr.align(y_true.precipitation.isel(time=0), dem, join='override')
+dem = dem.where(~np.isnan(y_true.precipitation.isel(time=0)), other=np.nan)
 ```
 %% Cell type:markdown id:b269a131-cf5b-4c6c-9f8e-a5408250aa83 tags:
 ## Model validation: precipitation amount
 %% Cell type:markdown id:0fa1fe82-0d6e-4676-b5b8-9eac2fd28ffb tags:
 ### Coefficient of determination: monthly mean
 %% Cell type:code id:4d11cee6-1ebd-4424-8ec6-92e5a196bac4 tags:
 ``` python
-# get predicted and observed values over entire time series and grid points
+# calculate monthly mean precipitation (mm / month)
-y_pred_values = y_pred_pr[NAMES[PREDICTAND]].groupby('time.month').mean(dim='time').values.flatten()
+y_pred_values = y_pred_pr[NAMES[PREDICTAND]].resample(time='1M').sum(skipna=False).groupby('time.month').mean(dim='time').values
-y_true_values = y_true[NAMES[PREDICTAND]].groupby('time.month').mean(dim='time').values.flatten()
+y_true_values = y_true[NAMES[PREDICTAND]].resample(time='1M').sum(skipna=False).groupby('time.month').mean(dim='time').values
 ```
 %% Cell type:code id:6e55cdd5-8adb-40c5-9742-46f4fc3d4be9 tags:
 ``` python
 # apply mask of valid pixels
 mask = (~np.isnan(y_pred_values) & ~np.isnan(y_true_values))
 y_pred_values = y_pred_values[mask]
 y_true_values = y_true_values[mask]
 ```
 %% Cell type:code id:13a9ff21-34ea-4db1-9c0a-bcb7ea1001f7 tags:
 ``` python
 # calculate coefficient of determination
 r2 = r2_score(y_true_values, y_pred_values)
+r2
+```
+%% Cell type:code id:a1b33431-9f2b-4e42-bbb0-f4fa258edd98 tags:
+``` python
+# group timeseries by month and calculate mean over time and space
+y_pred_ac = y_pred_pr.resample(time='1M').sum(skipna=False).groupby('time.month').mean(dim=('y', 'x', 'time'), skipna=True)
+y_true_ac = y_true.resample(time='1M').sum(skipna=False).groupby('time.month').mean(dim=('y', 'x', 'time'), skipna=True)
 ```
 %% Cell type:code id:c683858e-8b7f-4c76-a40f-6f68397b3479 tags:
 ``` python
 # scatter plot of observations vs. predictions
 fig, ax = plt.subplots(1, 1, figsize=(10, 10))
 # plot only a subset of data: otherwise plot is overloaded ...
 # subset = np.random.choice(np.arange(0, len(y_pred_values)), size=int(1e3), replace=False)
 # ax.plot(y_true_values[subset], y_pred_values[subset], 'o', alpha=.5, markeredgecolor='grey', markerfacecolor='none', markersize=3);
 # plot entire dataset
 ax.plot(y_true_values, y_pred_values, 'o', alpha=.5, markeredgecolor='grey', markerfacecolor='none', markersize=3);
 # plot 1:1 mapping line
-interval = np.arange(0, 11)
+interval = np.arange(0, 300, 50)
 ax.plot(interval, interval, color='k', lw=2, ls='--')
 # add coefficient of determination: calculated on entire dataset!
-ax.text(interval[-1], interval[0], s='Coefficient of determination R$^2$ = {:.2f}'.format(r2), ha='right', fontsize=14)
+ax.text(interval[-1] - 2, interval[0] + 2, s='Coefficient of determination R$^2$ = {:.2f}'.format(r2), ha='right', fontsize=18)
 # format axes
 ax.set_ylim(interval[0], interval[-1])
 ax.set_xlim(interval[0], interval[-1])
 ax.set_xticks(interval)
-ax.set_xticklabels(interval, fontsize=14)
+ax.set_xticklabels(interval, fontsize=16)
 ax.set_yticks(interval)
-ax.set_yticklabels(interval, fontsize=14)
+ax.set_yticklabels(interval, fontsize=16)
-ax.set_xlabel('Observed', fontsize=14)
+ax.set_xlabel('Observed', fontsize=18)
-ax.set_ylabel('Predicted', fontsize=14)
+ax.set_ylabel('Predicted', fontsize=18)
-ax.set_title('Monthly mean {} (mm / day): 1991 - 2010'.format(NAMES[PREDICTAND]), fontsize=16, pad=10);
+ax.set_title('Monthly mean {} (mm / month)'.format(NAMES[PREDICTAND]), fontsize=20, pad=10);
+# add axis for annual cycle
+axins = inset_axes(ax, width="30%", height="40%", loc=2, borderpad=0.25)
+axins.plot(y_pred_ac[NAMES[PREDICTAND]].values, ls='--', color='k', label='Predicted')
+axins.plot(y_true_ac[NAMES[PREDICTAND]].values, ls='-', color='k', label='Observed')
+axins.legend(frameon=False, fontsize=12, loc='lower center');
+axins.set_yticks(np.arange(0, 200, 50))
+axins.set_yticklabels(np.arange(0, 200, 50), fontsize=12)
+axins.yaxis.tick_right()
+axins.set_xticks(np.arange(0, 12))
+axins.set_xticklabels([calendar.month_name[i + 1] for i in np.arange(0, 12)], rotation=90, fontsize=12)
 # save figure
 fig.savefig('../Notebooks/Figures/{}_r2.png'.format(PREDICTAND), dpi=300, bbox_inches='tight')
 ```
 %% Cell type:markdown id:3538a109-4d3a-418e-9d4d-c3c120256ab2 tags:
 ### Bias
 %% Cell type:markdown id:43c922bd-9e9b-4812-b096-f3bde06fb249 tags:
 Calculate yearly average bias over entire reference period:
 %% Cell type:code id:52efc445-054e-4184-9667-4e761bc12a84 tags:
 ``` python
 # yearly average bias over reference period
 y_pred_yearly_avg = y_pred_pr.groupby('time.year').mean(dim='time')
+y_refe_yearly_avg = y_refe.groupby('time.year').mean(dim='time')
 y_true_yearly_avg = y_true.groupby('time.year').mean(dim='time')
 bias_yearly_avg = ((y_pred_yearly_avg - y_true_yearly_avg) / y_true_yearly_avg) * 100
+bias_yearly_avg_ref = ((y_refe_yearly_avg - y_true_yearly_avg) / y_true_yearly_avg) * 100
 for var in bias_yearly_avg:
-    print('Yearly average relative bias of {}: {:.2f}%'.format(var, bias_yearly_avg[var].mean().item()))
+    print('(Model) Yearly average relative bias of {}: {:.2f}%'.format(var, bias_yearly_avg[var].mean().item()))
+    print('(ERA-5) Yearly average relative bias of {}: {:.2f}%'.format(var, bias_yearly_avg_ref.mean().to_array().values.item()))
 ```
 %% Cell type:code id:92a094cb-2a88-4f4a-8c87-1025672d6fe7 tags:
 ``` python
 # mean absolute error over reference period
-mae_avg = np.abs(y_pred_yearly_avg - y_true_yearly_avg).mean()
+mae_avg = np.abs(y_pred_yearly_avg - y_true_yearly_avg)
+mae_avg_ref = np.abs(y_refe_yearly_avg - y_true_yearly_avg)
 for var in mae_avg:
-    print('Yearly average MAE of {}: {:.2f} '.format(var, mae_avg[var].item()) + 'mm / day')
+    print('(Model) Yearly average MAE of {}: {:.2f} mm'.format(var, mae_avg[var].mean().item()))
+    print('(ERA-5) Yearly average MAE of {}: {:.2f} mm'.format(var, mae_avg_ref.mean().to_array().values.item()))
 ```
 %% Cell type:code id:25d397e2-1b46-4f48-b39d-8632a7e56288 tags:
 ``` python
 # root mean squared error over reference period
 rmse_avg = ((y_pred_yearly_avg - y_true_yearly_avg) ** 2).mean()
+rmse_avg_ref = ((y_refe_yearly_avg - y_true_yearly_avg) **2).mean()
 for var in rmse_avg:
-    print('Yearly average RMSE of {}: {:.2f} '.format(var, rmse_avg[var].item()) + 'mm / day')
+    print('(Model) Yearly average RMSE of {}: {:.2f} mm / day'.format(var, rmse_avg[var].item()))
+    print('(ERA-5) Yearly average RMSE of {}: {:.2f} mm / day'.format(var, rmse_avg_ref.mean().to_array().values.item()))
 ```
 %% Cell type:code id:d6bbdcd6-3920-4856-b90a-d56f0e5ab2df tags:
 ``` python
 # Pearson's correlation coefficient over reference period
 # computed per variable: one spatial correlation per year, then averaged over years
 for var in y_pred_yearly_avg:
    correlations = []
    for year in y_pred_yearly_avg.year:
        y_p = y_pred_yearly_avg[var].sel(year=year).values
        y_t = y_true_yearly_avg[var].sel(year=year).values
        # use one joint mask: masking each array with its own NaN pattern can
        # misalign pixels or produce arrays of different length
        valid = ~np.isnan(y_p) & ~np.isnan(y_t)
        r, _ = stats.pearsonr(y_p[valid], y_t[valid])
        correlations.append(r)
    # average over all years (not only the last computed coefficient) and
    # report once per variable
    print('Yearly average Pearson correlation coefficient for {}: {:.2f}'.format(var, np.asarray(correlations).mean()))
 ```
+%% Cell type:code id:ca683581-6b3b-4abd-ad46-157ebded19c6 tags:
+``` python
+# plot yearly average MAE of reference vs. prediction
+vmin, vmax = 0, 5
+fig, axes = plt.subplots(1, 3, figsize=(24, 8), sharex=True, sharey=True)
+# plot bias of ERA-5 reference
+reference = bias_yearly_avg_ref.mean(dim='year').to_array().squeeze()
+im1 = axes[0].imshow(reference.values, origin='lower', cmap='RdBu_r', vmin=-40, vmax=40)
+axes[0].text(x=reference.shape[0] - 2, y=2, s='Average: {:.1f}%'.format(reference.mean().item()), fontsize=14, ha='right')
+# plot MAE of model
+prediction = bias_yearly_avg.mean(dim='year').to_array().squeeze()
+im2 = axes[1].imshow(prediction.values, origin='lower', cmap='RdBu_r', vmin=-40, vmax=40)
+axes[1].text(x=reference.shape[0] - 2, y=2, s='Average: {:.1f}%'.format(prediction.mean().item()), fontsize=14, ha='right')
+# plot topography
+im_dem = axes[2].imshow(dem['elevation'].values, origin='lower', cmap='terrain', vmin=0, vmax=4000)
+# set titles
+axes[0].set_title('ERA-5', fontsize=14, pad=10);
+axes[1].set_title('DCEDN', fontsize=14, pad=10);
+axes[2].set_title('Copernicus EU-DEM v1.1', fontsize=14, pad=10)
+# adjust axes
+for ax in axes.flat:
+    ax.axes.get_xaxis().set_ticklabels([])
+    ax.axes.get_xaxis().set_ticks([])
+    ax.axes.get_yaxis().set_ticklabels([])
+    ax.axes.get_yaxis().set_ticks([])
+    ax.axes.axis('tight')
+    ax.set_xlabel('')
+    ax.set_ylabel('')
+    ax.set_axis_off()
+# adjust figure
+# fig.suptitle('Average yearly mean absolute error: 1991 - 2010', fontsize=20);
+fig.subplots_adjust(hspace=0, wspace=0, top=0.85)
+# add colorbar for bias
+axes = axes.flatten()
+cbar_ax_bias = fig.add_axes([axes[-1].get_position().x1 + 0.01, axes[-1].get_position().y0,
+                             0.01, axes[-1].get_position().y1 - axes[-1].get_position().y0])
+cbar_bias = fig.colorbar(im_dem, cax=cbar_ax_bias)
+cbar_bias.set_label(label='Elevation (m)', fontsize=14)
+cbar_bias.ax.tick_params(labelsize=14, pad=10)
+# add colorbar for predictand
+cbar_ax_predictand = fig.add_axes([axes[0].get_position().x0, axes[0].get_position().y0 - 0.1,
+                                   axes[-1].get_position().x0 - axes[0].get_position().x0,
+                                   0.03])
+cbar_predictand = fig.colorbar(im1, cax=cbar_ax_predictand, orientation='horizontal')
+cbar_predictand.set_label(label='Relative mean error (%)', fontsize=14)
+cbar_predictand.ax.tick_params(labelsize=14, pad=10)
+# add metrics: MAE and RMSE
+#axes[1].text(x=ds.shape[0] - 2, y=2, s='MAE = {:.1f}'.format(mae_avg[NAMES[PREDICTAND]].item()) + 'mm day$^{-1}$', fontsize=14, ha='right')
+#axes[1].text(x=ds.shape[0] - 2, y=12, s='RMSE = {:.1f}'.format(rmse_avg[NAMES[PREDICTAND]].item()) + 'mm$^2$ day$^{-2}$', fontsize=14, ha='right')
+# save figure
+fig.savefig('../Notebooks/Figures/{}_rbias_ERA_vs_model.png'.format(PREDICTAND), dpi=300, bbox_inches='tight')
+```
 %% Cell type:code id:f022fcbc-077f-4f76-8330-47fa72a1fcec tags:
 ``` python
 # plot average of observation, prediction, and bias
 vmin, vmax = 0, 5
-fig, axes = plt.subplots(len(y_pred_yearly_avg.data_vars), 3, figsize=(24, len(y_pred_yearly_avg.data_vars) * 6),
+fig, axes = plt.subplots(len(y_pred_yearly_avg.data_vars), 3, figsize=(24, len(y_pred_yearly_avg.data_vars) * 8),
                         sharex=True, sharey=True)
 axes = axes.reshape(len(y_pred_yearly_avg.data_vars), -1)
 for i, var in enumerate(y_pred_yearly_avg):
    for ds, ax in zip([y_true_yearly_avg, y_pred_yearly_avg, bias_yearly_avg], axes[i, ...]):
        if ds is bias_yearly_avg:
            ds = ds[var].mean(dim='year')
            im2 = ax.imshow(ds.values, origin='lower', cmap='RdBu_r', vmin=-40, vmax=40)
            ax.text(x=ds.shape[0] - 2, y=2, s='Average: {:.1f}%'.format(ds.mean().item()), fontsize=14, ha='right')
        else:
            im1 = ax.imshow(ds[var].mean(dim='year').values, origin='lower', cmap='BuPu', vmin=vmin, vmax=vmax)
 # set titles
 axes[0, 0].set_title('Observed', fontsize=16, pad=10);
 axes[0, 1].set_title('Predicted', fontsize=16, pad=10);
 axes[0, 2].set_title('Bias', fontsize=16, pad=10);
 # adjust axes
 for ax in axes.flat:
    ax.axes.get_xaxis().set_ticklabels([])
    ax.axes.get_xaxis().set_ticks([])
    ax.axes.get_yaxis().set_ticklabels([])
    ax.axes.get_yaxis().set_ticks([])
    ax.axes.axis('tight')
    ax.set_xlabel('')
    ax.set_ylabel('')
 # adjust figure
 fig.suptitle('Average {}: 1991 - 2010'.format(NAMES[PREDICTAND]), fontsize=20);
 fig.subplots_adjust(hspace=0, wspace=0, top=0.85)
 # add colorbar for bias
 axes = axes.flatten()
 cbar_ax_bias = fig.add_axes([axes[-1].get_position().x1 + 0.01, axes[-1].get_position().y0,
                             0.01, axes[-1].get_position().y1 - axes[-1].get_position().y0])
 cbar_bias = fig.colorbar(im2, cax=cbar_ax_bias)
 cbar_bias.set_label(label='Relative bias / (%)', fontsize=16)
 cbar_bias.ax.tick_params(labelsize=14)
 # add colorbar for predictand
 cbar_ax_predictand = fig.add_axes([axes[0].get_position().x0, axes[0].get_position().y0 - 0.1,
                                   axes[-1].get_position().x0 - axes[0].get_position().x0,
                                   0.05])
 cbar_predictand = fig.colorbar(im1, cax=cbar_ax_predictand, orientation='horizontal')
 cbar_predictand.set_label(label='{} / '.format(NAMES[PREDICTAND].capitalize()) + '(mm day$^{-1}$)', fontsize=16)
 cbar_predictand.ax.tick_params(labelsize=14)
 # add metrics: MAE and RMSE
-axes[1].text(x=ds.shape[0] - 2, y=2, s='MAE = {:.1f}'.format(mae_avg[NAMES[PREDICTAND]].item()) + 'mm day$^{-1}$', fontsize=14, ha='right')
+axes[1].text(x=ds.shape[0] - 2, y=2, s='MAE = {:.1f}'.format(mae_avg[NAMES[PREDICTAND]].mean().item()) + 'mm day$^{-1}$', fontsize=14, ha='right')
-axes[1].text(x=ds.shape[0] - 2, y=12, s='RMSE = {:.1f}'.format(rmse_avg[NAMES[PREDICTAND]].item()) + 'mm$^2$ day$^{-2}$', fontsize=14, ha='right')
+axes[1].text(x=ds.shape[0] - 2, y=12, s='RMSE = {:.1f}'.format(rmse_avg[NAMES[PREDICTAND]].mean().item()) + 'mm day$^{-1}$', fontsize=14, ha='right')
 # save figure
 fig.savefig('../Notebooks/Figures/{}_average_bias.png'.format(PREDICTAND), dpi=300, bbox_inches='tight')
 ```
 %% Cell type:markdown id:f9eccfb4-c8f6-41f1-9636-9a46221cf53e tags:
 ### Seasonal bias
 %% Cell type:markdown id:fe07f855-a68a-4bdf-a923-ef334fb82ad3 tags:
 Calculate seasonal bias:
 %% Cell type:code id:65813f9f-094d-43c0-8261-3364294631f2 tags:
 ``` python
 # group data by season: (DJF, MAM, JJA, SON)
 y_true_snl = y_true.groupby('time.season').mean(dim='time')
 y_pred_snl = y_pred_pr.groupby('time.season').mean(dim='time')
+y_refe_snl = y_refe.groupby('time.season').mean(dim='time')
 bias_snl = ((y_pred_snl - y_true_snl) / y_true_snl) * 100
+bias_snl_ref = ((y_refe_snl - y_true_snl) / y_true_snl) * 100
+```
+%% Cell type:code id:2a70e6ac-54fb-47b8-ae76-a1b51d9d1f17 tags:
+``` python
+# print average bias per season: ERA-5
+for var in bias_snl_ref.data_vars:
+    for season in bias_snl_ref[NAMES[PREDICTAND]].season:
+        print('(ERA-5) Average bias of mean {} for season {}: {:.1f}%'.format(var, season.values.item(), bias_snl_ref[var].sel(season=season).mean().item()))
 ```
 %% Cell type:code id:40fa07e4-2df1-4ac9-b27f-cd902e16ed30 tags:
 ``` python
-# print average bias per season
+# print average bias per season: model
 for var in bias_snl.data_vars:
    for season in bias_snl[NAMES[PREDICTAND]].season:
-        print('Average bias of mean {} for season {}: {:.1f}%'.format(var, season.values.item(), bias_snl[var].sel(season=season).mean().item()))
+        print('(Model) Average bias of mean {} for season {}: {:.1f}%'.format(var, season.values.item(), bias_snl[var].sel(season=season).mean().item()))
 ```
 %% Cell type:markdown id:a73b3ed4-eb44-4f3e-b240-7f6fe44bedd3 tags:
 Plot seasonal differences, taken from the [xarray documentation](https://xarray.pydata.org/en/stable/examples/monthly-means.html).
 %% Cell type:code id:2b2390e4-8bf1-41bd-b7d1-33e92fe8bc65 tags:
 ``` python
 # plot seasonal differences: annual relative bias next to the selected seasons
 seasons = ('DJF', 'JJA')
 fig, axes = plt.subplots(nrows=1, ncols=len(seasons) + 1, figsize=(24,8), sharex=True, sharey=True)
 axes = axes.flatten()
 # plot annual average bias
 ds = bias_yearly_avg[NAMES[PREDICTAND]].mean(dim='year')
 # keep a handle on an image drawn in this figure: the colorbar below must not
 # depend on an image object left over from a previously executed cell
 im_snl = axes[0].imshow(ds.values, origin='lower', cmap='RdBu_r', vmin=-40, vmax=40)
 axes[0].set_title('Annual', fontsize=16);
 # imshow maps the last array axis (columns) to x: anchor the label at the right edge
 axes[0].text(x=ds.shape[-1] - 2, y=2, s='Average: {:.1f}%'.format(ds.mean().item()), fontsize=14, ha='right')
 # plot seasonal average bias: all panels share the same colormap and limits
 for ax, season in zip(axes[1:], seasons):
    ds = bias_snl[NAMES[PREDICTAND]].sel(season=season)
    ax.imshow(ds.values, origin='lower', cmap='RdBu_r', vmin=-40, vmax=40)
    ax.set_title(season, fontsize=16);
    ax.text(x=ds.shape[-1] - 2, y=2, s='Average: {:.1f}%'.format(ds.mean().item()), fontsize=14, ha='right')
 # adjust axes: remove ticks and labels, the panels are maps
 for ax in axes.flat:
    ax.axes.get_xaxis().set_ticklabels([])
    ax.axes.get_xaxis().set_ticks([])
    ax.axes.get_yaxis().set_ticklabels([])
    ax.axes.get_yaxis().set_ticks([])
    ax.axes.axis('tight')
    ax.set_xlabel('')
    ax.set_ylabel('')
 # adjust figure
 fig.suptitle('Average bias of {}: 1991 - 2010'.format(NAMES[PREDICTAND]), fontsize=20);
 fig.subplots_adjust(hspace=0, wspace=0, top=0.85)
 # add colorbar for bias: a thin axis to the right of the last panel
 cbar_ax = fig.add_axes([axes[-1].get_position().x1 + 0.01, axes[-1].get_position().y0,
                        0.01, axes[-1].get_position().y1 - axes[-1].get_position().y0])
 cbar = fig.colorbar(im_snl, cax=cbar_ax)
 cbar.set_label(label='Relative bias / (%)', fontsize=16)
 cbar.ax.tick_params(labelsize=14)
 # save figure
 fig.savefig('../Notebooks/Figures/{}_average_bias_seasonal.png'.format(PREDICTAND), dpi=300, bbox_inches='tight')
 %% Cell type:markdown id:ed9dee0e-9319-4ad5-a619-4ea30b116917 tags:
 ### Bias of extreme values
 %% Cell type:code id:92f0ce1d-2cd3-46f6-be1b-86cfe5c8e9d7 tags:
 ``` python
 # extreme quantile of interest
 quantile = 0.98
 ```
 %% Cell type:code id:bf98b3e0-7886-485f-a3bc-4bd64b7b2814 tags:
 ``` python
 # calculate extreme quantile for each year
 with warnings.catch_warnings():
    warnings.simplefilter('ignore', category=RuntimeWarning)
    y_pred_ex = y_pred_pr.groupby('time.year').quantile(quantile, dim='time')
    y_true_ex = y_true.groupby('time.year').quantile(quantile, dim='time')
+    y_refe_ex = y_refe.groupby('time.year').quantile(quantile, dim='time')
 ```
 %% Cell type:code id:89893df3-987a-4794-a6e9-0893c925218c tags:
 ``` python
 # calculate bias in extreme quantile for each year
 bias_ex = ((y_pred_ex - y_true_ex) / y_true_ex) * 100
+bias_ex_ref = ((y_refe_ex - y_true_ex) / y_true_ex) * 100
+```
+%% Cell type:code id:9a610a70-bb94-47e6-b470-e01bf4a295c0 tags:
+``` python
+# bias of extreme quantile: ERA-5
+for var in bias_ex_ref:
+    print('(ERA-5) Yearly average bias for P{:.0f} of {}: {:.1f}%'.format(quantile * 100, var, bias_ex_ref[var].mean().item()))
+```
+%% Cell type:code id:423962d7-453d-4c86-b93e-a4571bfec1c4 tags:
+``` python
+# bias of extreme quantile: Model
 for var in bias_ex:
-    print('Yearly average bias for P{:.0f} of {}: {:.1f}%'.format(quantile * 100, var, bias_ex[var].mean().item()))
+    print('(Model) Yearly average bias for P{:.0f} of {}: {:.1f}%'.format(quantile * 100, var, bias_ex[var].mean().item()))
 ```
 %% Cell type:code id:180b723a-49b0-4692-8249-b457eda48d44 tags:
 ``` python
 # mean absolute error in extreme quantile
 mae_ex = np.abs(y_pred_ex - y_true_ex).mean()
+mae_ex_ref = np.abs(y_refe_ex - y_true_ex).mean()
+```
+%% Cell type:code id:7331acdd-60bb-414e-a0e7-e81956c3a1bf tags:
+``` python
+# mae of extreme quantile: ERA-5
+for var in mae_ex_ref:
+    print('(ERA-5) Yearly average MAE for P{:.0f} of {}: {:.1f} mm / day'.format(quantile * 100, var, mae_ex_ref[var].item()))
+```
+%% Cell type:code id:d7bf1a6c-e111-4c72-8774-64a3939cbe50 tags:
+``` python
+# mae of extreme quantile: Model
 for var in mae_ex:
-    print('Yearly average MAE for P{:.0f} of {}: {:.1f} mm / day'.format(quantile * 100, var, mae_ex[var].item()))
+    print('(Model) Yearly average MAE for P{:.0f} of {}: {:.1f} mm / day'.format(quantile * 100, var, mae_ex[var].item()))
 ```
 %% Cell type:code id:e6309621-7d16-43b7-a9d4-c2857dbe8270 tags:
 ``` python
-# root mean squared error over reference period
+# root mean squared error in extreme quantile
+# NOTE: the square root is taken after averaging the squared errors, so the
+# value is an RMSE in the unit of the data, matching the 'mm / day' used in
+# the printed messages; without it the value is the mean squared error.
+# TODO(review): the figure annotation for this metric still labels it with
+# mm$^2$ day$^{-2}$; that label should read mm day$^{-1}$.
 rmse_ex = np.sqrt(((y_pred_ex - y_true_ex) ** 2).mean())
+rmse_ex_ref = np.sqrt(((y_refe_ex - y_true_ex) ** 2).mean())
+```
+%% Cell type:code id:712a2109-14b9-45a3-9194-e2b917c5ba3f tags:
+``` python
+# rmse of extreme quantile: ERA-5
+for var in rmse_ex_ref:
+    print('(ERA-5) Yearly average RMSE for P{:.0f} of {}: {:.1f} mm / day'.format(quantile * 100, var, rmse_ex_ref[var].item()))
+```
+%% Cell type:code id:1dfad687-c16f-4767-8ddd-96c3e56bd96a tags:
+``` python
+# rmse of extreme quantile: Model
 for var in rmse_ex:
-    print('Yearly average RMSE for P{:.0f} of {}: {:.1f} mm / day'.format(quantile * 100, var, rmse_ex[var].item()))
+    print('(Model) Yearly average RMSE for P{:.0f} of {}: {:.1f} mm / day'.format(quantile * 100, var, rmse_ex[var].item()))
 ```
 %% Cell type:code id:95338821-a78e-4a1c-ae73-25031ba7f6ac tags:
 ``` python
 # plot extremes of observation, prediction, and bias
 vmin, vmax = 10, 40
 fig, axes = plt.subplots(len(y_pred_ex.data_vars), 3, figsize=(24, len(y_pred_ex.data_vars) * 6),
                         sharex=True, sharey=True)
 axes = axes.reshape(len(y_pred_ex.data_vars), -1)
 for i, var in enumerate(y_pred_ex):
    for ds, ax in zip([y_true_ex, y_pred_ex, bias_ex], axes[i, ...]):
        if ds is bias_ex:
            ds = ds[var].mean(dim='year')
            im2 = ax.imshow(ds.values, origin='lower', cmap='RdBu_r', vmin=-40, vmax=40)
            ax.text(x=ds.shape[0] - 2, y=2, s='Average: {:.1f}%'.format(ds.mean().item()), fontsize=14, ha='right')
        else:
            im1 = ax.imshow(ds[var].mean(dim='year').values, origin='lower', cmap='BuPu', vmin=vmin, vmax=vmax)
 # set titles
 axes[0, 0].set_title('Observed', fontsize=16, pad=10);
 axes[0, 1].set_title('Predicted', fontsize=16, pad=10);
 axes[0, 2].set_title('Bias', fontsize=16, pad=10);
 # adjust axes
 for ax in axes.flat:
    ax.axes.get_xaxis().set_ticklabels([])
    ax.axes.get_xaxis().set_ticks([])
    ax.axes.get_yaxis().set_ticklabels([])
    ax.axes.get_yaxis().set_ticks([])
    ax.axes.axis('tight')
    ax.set_xlabel('')
    ax.set_ylabel('')
 # adjust figure
 fig.suptitle('Average P{:.0f} of {}: 1991 - 2010'.format(quantile * 100, NAMES[PREDICTAND]), fontsize=20);
 fig.subplots_adjust(hspace=0, wspace=0, top=0.85)
 # add colorbar for bias
 axes = axes.flatten()
 cbar_ax = fig.add_axes([axes[-1].get_position().x1 + 0.01, axes[-1].get_position().y0,
                        0.01, axes[-1].get_position().y1 - axes[-1].get_position().y0])
 cbar = fig.colorbar(im2, cax=cbar_ax)
 cbar.set_label(label='Relative bias / (%)', fontsize=16)
 cbar.ax.tick_params(labelsize=14)
 # add colorbar for predictand
 cbar_ax_predictand = fig.add_axes([axes[0].get_position().x0, axes[0].get_position().y0 - 0.1,
                                   axes[-1].get_position().x0 - axes[0].get_position().x0,
                                   0.05])
 cbar_predictand = fig.colorbar(im1, cax=cbar_ax_predictand, orientation='horizontal')
 cbar_predictand.set_label(label='{} / '.format(NAMES[PREDICTAND].capitalize()) + '(mm day$^{-1}$)', fontsize=16)
 cbar_predictand.ax.tick_params(labelsize=14)
 # add metrics: MAE and RMSE
 axes[1].text(x=ds.shape[0] - 2, y=2, s='MAE = {:.1f}'.format(mae_ex[NAMES[PREDICTAND]].item())  + 'mm day$^{-1}$', fontsize=14, ha='right')
 axes[1].text(x=ds.shape[0] - 2, y=12, s='RMSE = {:.1f}'.format(rmse_ex[NAMES[PREDICTAND]].item())  + 'mm$^2$ day$^{-2}$', fontsize=14, ha='right')
 # save figure
 fig.savefig('../Notebooks/Figures/{}_average_bias_p{:.0f}.png'.format(PREDICTAND, quantile * 100), dpi=300, bbox_inches='tight')
 ```
 %% Cell type:markdown id:f7758b71-e844-4a47-b741-25cc2d277814 tags:
 ### Bias of extremes: winter vs. summer
 %% Cell type:code id:de16b327-dc4b-4645-b3a0-abc8f72c4225 tags:
 ``` python
 # group data by season and compute extreme percentile
 with warnings.catch_warnings():
    warnings.simplefilter('ignore', category=RuntimeWarning)
    y_true_ex_snl = y_true.groupby('time.season').quantile(quantile, dim='time')
    y_pred_ex_snl = y_pred_pr.groupby('time.season').quantile(quantile, dim='time')
+    y_refe_ex_snl = y_refe.groupby('time.season').quantile(quantile, dim='time')
 ```
 %% Cell type:code id:185a375c-b7bc-42cf-a57d-08268e824f21 tags:
 ``` python
 # compute relative bias in seasonal extremes
 bias_ex_snl = ((y_pred_ex_snl - y_true_ex_snl) / y_true_ex_snl) * 100
+bias_ex_snl_ref = ((y_refe_ex_snl - y_true_ex_snl) / y_true_ex_snl) * 100
 ```
 %% Cell type:code id:e5f82b16-7ebf-4b73-80dd-0bc7e6a305a1 tags:
 ``` python
-# print average bias in extreme per season
+# print average bias in extreme per season: ERA-5
+for var in bias_ex_snl_ref.data_vars:
+    for season in bias_ex_snl_ref[NAMES[PREDICTAND]].season:
+        print('(ERA-5) Average bias of P{:.0f} {} for season {}: {:.1f}%'.format(quantile * 100, var, season.values.item(), bias_ex_snl_ref[var].sel(season=season).mean().item()))
+```
+%% Cell type:code id:0671b4f3-52c6-4167-b35b-03902dbe11a3 tags:
+``` python
+# print average bias in extreme per season: Model
 for var in bias_ex_snl.data_vars:
    for season in bias_ex_snl[NAMES[PREDICTAND]].season:
-        print('Average bias of P{:.0f} {} for season {}: {:.1f}%'.format(quantile * 100, var, season.values.item(), bias_ex_snl[var].sel(season=season).mean().item()))
+        print('(Model) Average bias of P{:.0f} {} for season {}: {:.1f}%'.format(quantile * 100, var, season.values.item(), bias_ex_snl[var].sel(season=season).mean().item()))
 ```
 %% Cell type:code id:322ee9c4-92db-4041-8a36-45aa8d2021b5 tags:
 ``` python
 # plot seasonal differences: annual relative bias of the extreme quantile
 # next to the selected seasons
 seasons = ('DJF', 'JJA')
 fig, axes = plt.subplots(nrows=1, ncols=len(seasons) + 1, figsize=(24,8), sharex=True, sharey=True)
 axes = axes.flatten()
 # plot annual average bias of extreme
 ds = bias_ex[NAMES[PREDICTAND]].mean(dim='year')
 # keep a handle on an image drawn in this figure: the colorbar below must not
 # depend on an image object left over from a previously executed cell
 im_ex_snl = axes[0].imshow(ds.values, origin='lower', cmap='RdBu_r', vmin=-40, vmax=40)
 axes[0].set_title('Annual', fontsize=16);
 # imshow maps the last array axis (columns) to x: anchor the label at the right edge
 axes[0].text(x=ds.shape[-1] - 2, y=2, s='Average: {:.1f}%'.format(ds.mean().item()), fontsize=14, ha='right')
 # plot seasonal average bias of extreme: all panels share the same colormap and limits
 for ax, season in zip(axes[1:], seasons):
    ds = bias_ex_snl[NAMES[PREDICTAND]].sel(season=season)
    ax.imshow(ds.values, origin='lower', cmap='RdBu_r', vmin=-40, vmax=40)
    ax.set_title(season, fontsize=16);
    ax.text(x=ds.shape[-1] - 2, y=2, s='Average: {:.1f}%'.format(ds.mean().item()), fontsize=14, ha='right')
 # adjust axes: remove ticks and labels, the panels are maps
 for ax in axes.flat:
    ax.axes.get_xaxis().set_ticklabels([])
    ax.axes.get_xaxis().set_ticks([])
    ax.axes.get_yaxis().set_ticklabels([])
    ax.axes.get_yaxis().set_ticks([])
    ax.axes.axis('tight')
    ax.set_xlabel('')
    ax.set_ylabel('')
 # adjust figure
 fig.suptitle('Average bias of P{:.0f} of {}: 1991 - 2010'.format(quantile * 100, NAMES[PREDICTAND]), fontsize=20);
 fig.subplots_adjust(hspace=0, wspace=0, top=0.85)
 # add colorbar for bias: a thin axis to the right of the last panel
 cbar_ax = fig.add_axes([axes[-1].get_position().x1 + 0.01, axes[-1].get_position().y0,
                        0.01, axes[-1].get_position().y1 - axes[-1].get_position().y0])
 cbar = fig.colorbar(im_ex_snl, cax=cbar_ax)
 cbar.set_label(label='Relative bias / (%)', fontsize=16)
 cbar.ax.tick_params(labelsize=14)
 # save figure
 fig.savefig('../Notebooks/Figures/{}_average_bias_seasonal_ex.png'.format(PREDICTAND), dpi=300, bbox_inches='tight')
 %% Cell type:markdown id:1f1a76c5-0bcb-4f79-832c-caf958e5703a tags:
 ### Frequency of wet days
 %% Cell type:code id:4491395e-f69a-4749-ac73-c4cbce60c3bc tags:
 ``` python
 # minimum precipitation (mm / day) defining a wet day
 WET_DAY_THRESHOLD = 1
 ```
 %% Cell type:code id:40676a79-26a2-4714-900e-d530fda32f8f tags:
 ``` python
 # true and predicted frequency of wet days
 mask = (~np.isnan(y_true)) & (~np.isnan(y_pred_pr))
 wet_days_true = (y_true >= WET_DAY_THRESHOLD).where(mask, other=np.nan).astype(np.float32)
 wet_days_pred = (y_pred_pr >= WET_DAY_THRESHOLD).where(mask, other=np.nan).astype(np.float32)
 ```
 %% Cell type:code id:1ad9ad08-ad1f-4a76-9020-c09a442385c9 tags:
 ``` python
 # number of wet days in reference period: annual
 n_wet_days_true = wet_days_true.sum(dim='time', skipna=False)
 n_wet_days_pred = wet_days_pred.sum(dim='time', skipna=False)
 ```
 %% Cell type:code id:54088572-1873-4949-9937-0ea099e9c2b6 tags:
 ``` python
 # frequency of wet days in reference period: annual
 f_wet_days_true = (n_wet_days_true / len(wet_days_true.time)) * 100
 f_wet_days_pred = (n_wet_days_pred / len(wet_days_pred.time)) * 100
 ```
 %% Cell type:code id:3534d1d9-f50d-40f3-b1f0-d34c4152a37c tags:
 ``` python
 # frequency of wet days in reference period: seasonal
 f_wet_days_true_snl = wet_days_true.groupby('time.season').mean(dim='time', skipna=False)
 f_wet_days_pred_snl = wet_days_pred.groupby('time.season').mean(dim='time', skipna=False)
 ```
 %% Cell type:code id:60ac0f93-f9ca-4f75-8786-e692efe3a556 tags:
 ``` python
 # relative bias of frequency of wet vs. dry days: annual
 bias_wet = ((f_wet_days_pred - f_wet_days_true) / f_wet_days_true) * 100
 # relative bias of frequency of wet vs. dry days: seasonal
 bias_wet_snl = ((f_wet_days_pred_snl - f_wet_days_true_snl) / f_wet_days_true_snl) * 100
 ```
 %% Cell type:code id:e8e9d30a-2fbc-4f29-bc82-bfbc155430a0 tags:
 ``` python
 # plot relative bias of the frequency of wet days: annual and per season
 fig, axes = plt.subplots(2, 3, figsize=(24, 12), sharex=True, sharey=True)
 axes = axes.flatten()
 # plot annual relative bias of wet day frequency
 ds = bias_wet[NAMES[PREDICTAND]]
 im = axes[0].imshow(ds.values, origin='lower', cmap='RdBu_r', vmin=-40, vmax=40)
 axes[0].set_title('Annual', fontsize=16);
 axes[0].text(x=ds.shape[0] - 2, y=2, s='Average: {:.1f}%'.format(ds.mean().item()), fontsize=14, ha='right')
 # plot seasonal relative bias of wet day frequency: one panel per season
 for ax, season in zip(axes[1:], bias_wet_snl.season):
    ds = bias_wet_snl[NAMES[PREDICTAND]].sel(season=season)
    ax.imshow(ds.values, origin='lower', cmap='RdBu_r', vmin=-40, vmax=40)
    ax.set_title(season.item(), fontsize=16);
    ax.text(x=ds.shape[0] - 2, y=2, s='Average: {:.1f}%'.format(ds.mean().item()), fontsize=14, ha='right')
 # adjust axes
 for ax in axes.flat:
    ax.axes.get_xaxis().set_ticklabels([])
    ax.axes.get_xaxis().set_ticks([])
    ax.axes.get_yaxis().set_ticklabels([])
    ax.axes.get_yaxis().set_ticks([])
    ax.axes.axis('tight')
    ax.set_xlabel('')
    ax.set_ylabel('')
 # turn off last axis
 axes[-1].set_visible(False)
 # adjust figure
 fig.suptitle('Frequency of wet days (>= {:.1f} mm): 1991 - 2010'.format(WET_DAY_THRESHOLD), fontsize=20);
 fig.subplots_adjust(hspace=0.1, wspace=0, top=0.925)
 # add colorbar
 cbar_ax_predictand = fig.add_axes([axes[-1].get_position().x1 + 0.01, axes[-1].get_position().y0,
                                   0.01, axes[0].get_position().y1 - axes[-1].get_position().y0])
 cbar_predictand = fig.colorbar(im, cax=cbar_ax_predictand)
 cbar_predictand.set_label(label='Relative bias / (%)', fontsize=16)
 cbar_predictand.ax.tick_params(labelsize=14)
 # save figure
 fig.savefig('../Notebooks/Figures/{}_bias_wet_days.png'.format(PREDICTAND), dpi=300, bbox_inches='tight')
 ```
 %% Cell type:markdown id:fde67674-8bed-45b2-b4ca-4a507084b5a8 tags:
 ### Mean wet day precipitation
 %% Cell type:code id:aa2d2b5a-e192-4c34-975c-d4e61c969a15 tags:
 ``` python
 # calculate mean wet day precipitation
 dii_true = (y_true * wet_days_true).sum(dim='time', skipna=False) / n_wet_days_true
 dii_pred = (y_pred_pr * wet_days_pred).sum(dim='time', skipna=False) / n_wet_days_pred
 ```
 %% Cell type:code id:d6331bb6-afe8-4e62-9fa8-60bce9af42ec tags:
 ``` python
 # calculate relative bias of mean wet day precipitation
 bias_dii = ((dii_pred - dii_true) / dii_true) * 100
 ```
 %% Cell type:code id:36e3cbac-233d-4892-9756-941d91981534 tags:
 ``` python
 # plot average of observation, prediction, and bias
 fig, axes = plt.subplots(1, 3, figsize=(24, 6), sharex=True, sharey=True)
 for i, var in enumerate(dii_true):
    for ds, ax in zip([dii_true, dii_pred, bias_dii], axes):
        if ds is bias_dii:
            im2 = ax.imshow(ds[var].values, origin='lower', cmap='RdBu_r', vmin=-40, vmax=40)
            ax.text(x=ds[var].shape[0] - 2, y=2, s='Average: {:.1f}%'.format(ds[var].mean().item()), fontsize=14, ha='right')
        else:
            im1 = ax.imshow(ds[var].values, origin='lower', cmap='BuPu', vmin=0, vmax=15)
 # set titles
 axes[0].set_title('Observed', fontsize=16, pad=10);
 axes[1].set_title('Predicted', fontsize=16, pad=10);
 axes[2].set_title('Bias', fontsize=16, pad=10);
 # adjust axes
 for ax in axes.flat:
    ax.axes.get_xaxis().set_ticklabels([])
    ax.axes.get_xaxis().set_ticks([])
    ax.axes.get_yaxis().set_ticklabels([])
    ax.axes.get_yaxis().set_ticks([])
    ax.axes.axis('tight')
    ax.set_xlabel('')
    ax.set_ylabel('')
 # adjust figure
 fig.suptitle('Mean wet day (>= {:.1f} mm) precipitation: 1991 - 2010'.format(WET_DAY_THRESHOLD), fontsize=20);
 fig.subplots_adjust(hspace=0, wspace=0, top=0.85)
 # add colorbar for bias
 axes = axes.flatten()
 cbar_ax_bias = fig.add_axes([axes[-1].get_position().x1 + 0.01, axes[-1].get_position().y0,
                             0.01, axes[-1].get_position().y1 - axes[-1].get_position().y0])
 cbar_bias = fig.colorbar(im2, cax=cbar_ax_bias)
 cbar_bias.set_label(label='Relative bias / (%)', fontsize=16)
 cbar_bias.ax.tick_params(labelsize=14)
 # add colorbar for predictand
 cbar_ax_predictand = fig.add_axes([axes[0].get_position().x0, axes[0].get_position().y0 - 0.1,
                                   axes[-1].get_position().x0 - axes[0].get_position().x0,
                                   0.05])
 cbar_predictand = fig.colorbar(im1, cax=cbar_ax_predictand, orientation='horizontal')
 cbar_predictand.set_label(label='Mean wet day precipitation / (mm day$^{-1}$)', fontsize=16)
 cbar_predictand.ax.tick_params(labelsize=14)
 # save figure
 fig.savefig('../Notebooks/Figures/{}_bias_wet_days_p.png'.format(PREDICTAND), dpi=300, bbox_inches='tight')
 ```
 %% Cell type:markdown id:359e6d22-5f7f-4203-bb2a-fa51e731d867 tags:
 ## Model validation: precipitation probability
 %% Cell type:markdown id:5bd5c551-d426-45d7-9338-5b5003ca676e tags:
 ### ROC: Receiver operating characteristics
 %% Cell type:code id:1bff2faf-c894-4917-8dcf-310106c153ad tags:
 ``` python
 # true and predicted probability of precipitation
 # a plain comparison turns missing observations into False (NaN > 0 is False),
 # which would count them as dry days in the ROC; keep them as NaN instead so
 # that a subsequent NaN mask can drop them
 y_obs = y_true[NAMES[PREDICTAND]]
 p_true = (y_obs > 0).where(~np.isnan(y_obs), other=np.nan).astype(np.float32).values.flatten()
 p_pred = y_pred_prob.prob.values.flatten()
 ```
 %% Cell type:code id:6c4a7097-26af-4497-bf52-43601038be41 tags:
 ``` python
 # apply mask of valid pixels
 mask = (~np.isnan(p_true) & ~np.isnan(p_pred))
 p_pred = p_pred[mask]
 p_true = p_true[mask].astype(float)
 ```
 %% Cell type:code id:e4c35894-e31f-4879-806e-0b3935412730 tags:
 ``` python
 # calculate ROC: false positive rate vs. true positive rate
 fpr, tpr, _ = roc_curve(p_true, p_pred)
 area = auc(fpr, tpr) # area under ROC curve
 rocss = 2 * area - 1 # ROC skill score (cf. https://journals.ametsoc.org/view/journals/clim/16/24/1520-0442_2003_016_4145_otrsop_2.0.co_2.xml)
 ```
 %% Cell type:code id:ac418718-44bf-4378-a1da-7fb75e45b3a8 tags:
 ``` python
 # plot ROC curve
 fig, ax = plt.subplots(1, 1, figsize=(10, 10))
 ax.plot(fpr, tpr, lw=2, label='Area={:.2f}, ROCSS={:.2f}'.format(area, rocss), color='k')
 # plot classifier with no skill
 interval = np.arange(-0.05, 1.1, 0.05)
 ax.plot([0, 1], [0, 1], lw=2, linestyle='--', color='k')
 ax.text(0.95, 0.975, 'Random Classifier', ha='right', va='top', rotation=45, fontsize=12)
 # plot perfect classifier
 ax.plot(0, 1, '-o', markersize=5, markerfacecolor='k', markeredgecolor='none')
 ax.text(0.02, 1, 'Perfect classifier', va='center', fontsize=12)
 # plot direction of increase / decrease
 ax.arrow(np.median(interval), np.median(interval), 0.1, -0.1, head_width=0.01, facecolor='k')
 ax.arrow(np.median(interval), np.median(interval), -0.1, 0.1, head_width=0.01, facecolor='k')
 ax.text(np.median(interval) + 0.05, np.median(interval) - 0.05, s='Worse', rotation=45, ha='left', fontsize=12)
 ax.text(np.median(interval) - 0.05, np.median(interval) + 0.05, s='Better', rotation=45, ha='left', fontsize=12)
 # adjust axes
 ax.set_xticks(np.arange(0, 1.1, 0.1))
 ax.set_xticklabels(['{:.2f}'.format(i) for i in np.arange(0, 1.1, 0.1)], fontsize=12)
 ax.set_yticks(np.arange(0, 1.1, 0.1))
 ax.set_yticklabels(['{:.2f}'.format(i) for i in np.arange(0, 1.1, 0.1)], fontsize=12)
 ax.set_xlim(interval[0], interval[-1])
 ax.set_ylim(interval[0], interval[-1])
 ax.set_xlabel('False Positive Rate', fontsize=14)
 ax.set_ylabel('True Positive Rate', fontsize=14)
 ax.set_title('ROC of precipitation probability: 1991 - 2010', fontsize=14, pad=10)
 ax.legend(frameon=False, loc='lower right', fontsize=14);
 # save figure
 fig.savefig('../Notebooks/Figures/{}_ROC.png'.format(PREDICTAND), dpi=300, bbox_inches='tight')
 ```