{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 112,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import os\n",
    "from glob import glob\n",
    "import xarray as xr\n",
    "import numpy as np"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 82,
   "metadata": {},
   "outputs": [],
   "source": [
    "fdir = '/home/www/oggm/cmip5-ng'\n",
    "# fl is initialised here but is not filled in this cell\n",
    "fl = []\n",
    "fl_2100 = []\n",
    "fl_2300 = []\n",
    "# Visit every directory below fdir and collect the NetCDF files it contains.\n",
    "for dirpath, _subdirs, _files in os.walk(fdir):\n",
    "    for nc_path in glob(os.path.join(dirpath, '*.nc')):\n",
    "        # exclude the redundant folder!\n",
    "        if 'redundant' in nc_path:\n",
    "            continue\n",
    "        # the GCMs until 2300 are kept separately in 2300/ subfolders:\n",
    "        # any path containing '2300' goes to fl_2300, everything else to fl_2100\n",
    "        target = fl_2300 if '2300' in nc_path else fl_2100\n",
    "        target.append(nc_path)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 83,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Wrap each file list in a one-column DataFrame; the column is named 'path'\n",
    "# directly by the constructor.\n",
    "df_2100, df_2300 = [\n",
    "    pd.DataFrame(file_list, columns=['path'])\n",
    "    for file_list in (fl_2100, fl_2300)\n",
    "]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 84,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Columns derived from the file name, in the order they are added to the frames.\n",
    "NAME_COLUMNS = ['fname', 'var', 'gcm', 'rcp', 'rea']\n",
    "\n",
    "\n",
    "def parse_fname(fname, n_parts):\n",
    "    \"\"\"Split a NetCDF file name into its underscore-separated fields.\n",
    "\n",
    "    The extension is removed before splitting, so the realisation is always\n",
    "    the fifth field, whether or not a further field (such as the ``g025``\n",
    "    grid tag) follows it.\n",
    "\n",
    "    Parameters\n",
    "    ----------\n",
    "    fname : str\n",
    "        File name without directory, e.g. ``<var>_mon_<gcm>_<rcp>_<rea>.nc``.\n",
    "    n_parts : int\n",
    "        Exact number of underscore-separated fields the name must have.\n",
    "\n",
    "    Returns\n",
    "    -------\n",
    "    dict\n",
    "        One entry per name in ``NAME_COLUMNS``.\n",
    "\n",
    "    Raises\n",
    "    ------\n",
    "    AssertionError\n",
    "        If the number of fields differs from ``n_parts`` or the second field\n",
    "        is not ``'mon'``.\n",
    "    \"\"\"\n",
    "    stem = os.path.splitext(fname)[0]\n",
    "    parts = stem.split('_')\n",
    "    assert len(parts) == n_parts, f'expected {n_parts} fields in {fname!r}'\n",
    "    assert parts[1] == 'mon', f'expected a monthly (mon) file, got {fname!r}'\n",
    "    return {'fname': fname, 'var': parts[0], 'gcm': parts[2],\n",
    "            'rcp': parts[3], 'rea': parts[4]}\n",
    "\n",
    "\n",
    "def add_name_columns(df, n_parts):\n",
    "    \"\"\"Add the ``NAME_COLUMNS`` parsed from ``df['path']`` to ``df`` in place.\n",
    "\n",
    "    All file names are parsed first and the columns are assigned afterwards,\n",
    "    so a malformed name leaves ``df`` untouched, and an empty ``df`` still\n",
    "    receives the (empty) columns. Returns None.\n",
    "    \"\"\"\n",
    "    records = [parse_fname(os.path.basename(path), n_parts)\n",
    "               for path in df['path']]\n",
    "    parsed = pd.DataFrame(records, index=df.index, columns=NAME_COLUMNS)\n",
    "    for col in NAME_COLUMNS:\n",
    "        df[col] = parsed[col]\n",
    "\n",
    "\n",
    "# 2100 files carry a sixth field after the realisation (the grid tag)\n",
    "add_name_columns(df_2100, n_parts=6)\n",
    "# there is no _g025 in the 2300 GCM names\n",
    "add_name_columns(df_2300, n_parts=5)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "**Note that the more recently downloaded 2300 GCMs are on a different grid than the 2100 GCMs, which are bilinearly interpolated to 2.5° (and are thus named `_g025.nc`).**\n",
    "Therefore, for the 2100 simulations we use the `_g025.nc` files where possible. There is just one GCM running until 2300 that did not previously exist among the 2100 GCMs. We will add that one to `all_gcm_list_2100.csv`."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 123,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div><svg style=\"position: absolute; width: 0; height: 0; overflow: hidden\">\n",
       "<defs>\n",
       "<symbol id=\"icon-database\" viewBox=\"0 0 32 32\">\n",
       "<path d=\"M16 0c-8.837 0-16 2.239-16 5v4c0 2.761 7.163 5 16 5s16-2.239 16-5v-4c0-2.761-7.163-5-16-5z\"></path>\n",
       "<path d=\"M16 17c-8.837 0-16-2.239-16-5v6c0 2.761 7.163 5 16 5s16-2.239 16-5v-6c0 2.761-7.163 5-16 5z\"></path>\n",
       "<path d=\"M16 26c-8.837 0-16-2.239-16-5v6c0 2.761 7.163 5 16 5s16-2.239 16-5v-6c0 2.761-7.163 5-16 5z\"></path>\n",
       "</symbol>\n",
       "<symbol id=\"icon-file-text2\" viewBox=\"0 0 32 32\">\n",
       "<path d=\"M28.681 7.159c-0.694-0.947-1.662-2.053-2.724-3.116s-2.169-2.030-3.116-2.724c-1.612-1.182-2.393-1.319-2.841-1.319h-15.5c-1.378 0-2.5 1.121-2.5 2.5v27c0 1.378 1.122 2.5 2.5 2.5h23c1.378 0 2.5-1.122 2.5-2.5v-19.5c0-0.448-0.137-1.23-1.319-2.841zM24.543 5.457c0.959 0.959 1.712 1.825 2.268 2.543h-4.811v-4.811c0.718 0.556 1.584 1.309 2.543 2.268zM28 29.5c0 0.271-0.229 0.5-0.5 0.5h-23c-0.271 0-0.5-0.229-0.5-0.5v-27c0-0.271 0.229-0.5 0.5-0.5 0 0 15.499-0 15.5 0v7c0 0.552 0.448 1 1 1h7v19.5z\"></path>\n",
       "<path d=\"M23 26h-14c-0.552 0-1-0.448-1-1s0.448-1 1-1h14c0.552 0 1 0.448 1 1s-0.448 1-1 1z\"></path>\n",
       "<path d=\"M23 22h-14c-0.552 0-1-0.448-1-1s0.448-1 1-1h14c0.552 0 1 0.448 1 1s-0.448 1-1 1z\"></path>\n",
       "<path d=\"M23 18h-14c-0.552 0-1-0.448-1-1s0.448-1 1-1h14c0.552 0 1 0.448 1 1s-0.448 1-1 1z\"></path>\n",
       "</symbol>\n",
       "</defs>\n",
       "</svg>\n",
       "<style>/* CSS stylesheet for displaying xarray objects in jupyterlab.\n",
       " *\n",
       " */\n",
       "\n",
       ":root {\n",
       "  --xr-font-color0: var(--jp-content-font-color0, rgba(0, 0, 0, 1));\n",
       "  --xr-font-color2: var(--jp-content-font-color2, rgba(0, 0, 0, 0.54));\n",
       "  --xr-font-color3: var(--jp-content-font-color3, rgba(0, 0, 0, 0.38));\n",
       "  --xr-border-color: var(--jp-border-color2, #e0e0e0);\n",
       "  --xr-disabled-color: var(--jp-layout-color3, #bdbdbd);\n",
       "  --xr-background-color: var(--jp-layout-color0, white);\n",
       "  --xr-background-color-row-even: var(--jp-layout-color1, white);\n",
       "  --xr-background-color-row-odd: var(--jp-layout-color2, #eeeeee);\n",
       "}\n",
       "\n",
       "html[theme=dark],\n",
       "body.vscode-dark {\n",
       "  --xr-font-color0: rgba(255, 255, 255, 1);\n",
       "  --xr-font-color2: rgba(255, 255, 255, 0.54);\n",
       "  --xr-font-color3: rgba(255, 255, 255, 0.38);\n",
       "  --xr-border-color: #1F1F1F;\n",
       "  --xr-disabled-color: #515151;\n",
       "  --xr-background-color: #111111;\n",
       "  --xr-background-color-row-even: #111111;\n",
       "  --xr-background-color-row-odd: #313131;\n",
       "}\n",
       "\n",
       ".xr-wrap {\n",
       "  display: block !important;\n",
       "  min-width: 300px;\n",
       "  max-width: 700px;\n",
       "}\n",
       "\n",
       ".xr-text-repr-fallback {\n",
       "  /* fallback to plain text repr when CSS is not injected (untrusted notebook) */\n",
       "  display: none;\n",
       "}\n",
       "\n",
       ".xr-header {\n",
       "  padding-top: 6px;\n",
       "  padding-bottom: 6px;\n",
       "  margin-bottom: 4px;\n",
       "  border-bottom: solid 1px var(--xr-border-color);\n",
       "}\n",
       "\n",
       ".xr-header > div,\n",
       ".xr-header > ul {\n",
       "  display: inline;\n",
       "  margin-top: 0;\n",
       "  margin-bottom: 0;\n",
       "}\n",
       "\n",
       ".xr-obj-type,\n",
       ".xr-array-name {\n",
       "  margin-left: 2px;\n",
       "  margin-right: 10px;\n",
       "}\n",
       "\n",
       ".xr-obj-type {\n",
       "  color: var(--xr-font-color2);\n",
       "}\n",
       "\n",
       ".xr-sections {\n",
       "  padding-left: 0 !important;\n",
       "  display: grid;\n",
       "  grid-template-columns: 150px auto auto 1fr 20px 20px;\n",
       "}\n",
       "\n",
       ".xr-section-item {\n",
       "  display: contents;\n",
       "}\n",
       "\n",
       ".xr-section-item input {\n",
       "  display: none;\n",
       "}\n",
       "\n",
       ".xr-section-item input + label {\n",
       "  color: var(--xr-disabled-color);\n",
       "}\n",
       "\n",
       ".xr-section-item input:enabled + label {\n",
       "  cursor: pointer;\n",
       "  color: var(--xr-font-color2);\n",
       "}\n",
       "\n",
       ".xr-section-item input:enabled + label:hover {\n",
       "  color: var(--xr-font-color0);\n",
       "}\n",
       "\n",
       ".xr-section-summary {\n",
       "  grid-column: 1;\n",
       "  color: var(--xr-font-color2);\n",
       "  font-weight: 500;\n",
       "}\n",
       "\n",
       ".xr-section-summary > span {\n",
       "  display: inline-block;\n",
       "  padding-left: 0.5em;\n",
       "}\n",
       "\n",
       ".xr-section-summary-in:disabled + label {\n",
       "  color: var(--xr-font-color2);\n",
       "}\n",
       "\n",
       ".xr-section-summary-in + label:before {\n",
       "  display: inline-block;\n",
       "  content: '►';\n",
       "  font-size: 11px;\n",
       "  width: 15px;\n",
       "  text-align: center;\n",
       "}\n",
       "\n",
       ".xr-section-summary-in:disabled + label:before {\n",
       "  color: var(--xr-disabled-color);\n",
       "}\n",
       "\n",
       ".xr-section-summary-in:checked + label:before {\n",
       "  content: '▼';\n",
       "}\n",
       "\n",
       ".xr-section-summary-in:checked + label > span {\n",
       "  display: none;\n",
       "}\n",
       "\n",
       ".xr-section-summary,\n",
       ".xr-section-inline-details {\n",
       "  padding-top: 4px;\n",
       "  padding-bottom: 4px;\n",
       "}\n",
       "\n",
       ".xr-section-inline-details {\n",
       "  grid-column: 2 / -1;\n",
       "}\n",
       "\n",
       ".xr-section-details {\n",
       "  display: none;\n",
       "  grid-column: 1 / -1;\n",
       "  margin-bottom: 5px;\n",
       "}\n",
       "\n",
       ".xr-section-summary-in:checked ~ .xr-section-details {\n",
       "  display: contents;\n",
       "}\n",
       "\n",
       ".xr-array-wrap {\n",
       "  grid-column: 1 / -1;\n",
       "  display: grid;\n",
       "  grid-template-columns: 20px auto;\n",
       "}\n",
       "\n",
       ".xr-array-wrap > label {\n",
       "  grid-column: 1;\n",
       "  vertical-align: top;\n",
       "}\n",
       "\n",
       ".xr-preview {\n",
       "  color: var(--xr-font-color3);\n",
       "}\n",
       "\n",
       ".xr-array-preview,\n",
       ".xr-array-data {\n",
       "  padding: 0 5px !important;\n",
       "  grid-column: 2;\n",
       "}\n",
       "\n",
       ".xr-array-data,\n",
       ".xr-array-in:checked ~ .xr-array-preview {\n",
       "  display: none;\n",
       "}\n",
       "\n",
       ".xr-array-in:checked ~ .xr-array-data,\n",
       ".xr-array-preview {\n",
       "  display: inline-block;\n",
       "}\n",
       "\n",
       ".xr-dim-list {\n",
       "  display: inline-block !important;\n",
       "  list-style: none;\n",
       "  padding: 0 !important;\n",
       "  margin: 0;\n",
       "}\n",
       "\n",
       ".xr-dim-list li {\n",
       "  display: inline-block;\n",
       "  padding: 0;\n",
       "  margin: 0;\n",
       "}\n",
       "\n",
       ".xr-dim-list:before {\n",
       "  content: '(';\n",
       "}\n",
       "\n",
       ".xr-dim-list:after {\n",
       "  content: ')';\n",
       "}\n",
       "\n",
       ".xr-dim-list li:not(:last-child):after {\n",
       "  content: ',';\n",
       "  padding-right: 5px;\n",
       "}\n",
       "\n",
       ".xr-has-index {\n",
       "  font-weight: bold;\n",
       "}\n",
       "\n",
       ".xr-var-list,\n",
       ".xr-var-item {\n",
       "  display: contents;\n",
       "}\n",
       "\n",
       ".xr-var-item > div,\n",
       ".xr-var-item label,\n",
       ".xr-var-item > .xr-var-name span {\n",
       "  background-color: var(--xr-background-color-row-even);\n",
       "  margin-bottom: 0;\n",
       "}\n",
       "\n",
       ".xr-var-item > .xr-var-name:hover span {\n",
       "  padding-right: 5px;\n",
       "}\n",
       "\n",
       ".xr-var-list > li:nth-child(odd) > div,\n",
       ".xr-var-list > li:nth-child(odd) > label,\n",
       ".xr-var-list > li:nth-child(odd) > .xr-var-name span {\n",
       "  background-color: var(--xr-background-color-row-odd);\n",
       "}\n",
       "\n",
       ".xr-var-name {\n",
       "  grid-column: 1;\n",
       "}\n",
       "\n",
       ".xr-var-dims {\n",
       "  grid-column: 2;\n",
       "}\n",
       "\n",
       ".xr-var-dtype {\n",
       "  grid-column: 3;\n",
       "  text-align: right;\n",
       "  color: var(--xr-font-color2);\n",
       "}\n",
       "\n",
       ".xr-var-preview {\n",
       "  grid-column: 4;\n",
       "}\n",
       "\n",
       ".xr-var-name,\n",
       ".xr-var-dims,\n",
       ".xr-var-dtype,\n",
       ".xr-preview,\n",
       ".xr-attrs dt {\n",
       "  white-space: nowrap;\n",
       "  overflow: hidden;\n",
       "  text-overflow: ellipsis;\n",
       "  padding-right: 10px;\n",
       "}\n",
       "\n",
       ".xr-var-name:hover,\n",
       ".xr-var-dims:hover,\n",
       ".xr-var-dtype:hover,\n",
       ".xr-attrs dt:hover {\n",
       "  overflow: visible;\n",
       "  width: auto;\n",
       "  z-index: 1;\n",
       "}\n",
       "\n",
       ".xr-var-attrs,\n",
       ".xr-var-data {\n",
       "  display: none;\n",
       "  background-color: var(--xr-background-color) !important;\n",
       "  padding-bottom: 5px !important;\n",
       "}\n",
       "\n",
       ".xr-var-attrs-in:checked ~ .xr-var-attrs,\n",
       ".xr-var-data-in:checked ~ .xr-var-data {\n",
       "  display: block;\n",
       "}\n",
       "\n",
       ".xr-var-data > table {\n",
       "  float: right;\n",
       "}\n",
       "\n",
       ".xr-var-name span,\n",
       ".xr-var-data,\n",
       ".xr-attrs {\n",
       "  padding-left: 25px !important;\n",
       "}\n",
       "\n",
       ".xr-attrs,\n",
       ".xr-var-attrs,\n",
       ".xr-var-data {\n",
       "  grid-column: 1 / -1;\n",
       "}\n",
       "\n",
       "dl.xr-attrs {\n",
       "  padding: 0;\n",
       "  margin: 0;\n",
       "  display: grid;\n",
       "  grid-template-columns: 125px auto;\n",
       "}\n",
       "\n",
       ".xr-attrs dt,\n",
       ".xr-attrs dd {\n",
       "  padding: 0;\n",
       "  margin: 0;\n",
       "  float: left;\n",
       "  padding-right: 10px;\n",
       "  width: auto;\n",
       "}\n",
       "\n",
       ".xr-attrs dt {\n",
       "  font-weight: normal;\n",
       "  grid-column: 1;\n",
       "}\n",
       "\n",
       ".xr-attrs dt:hover span {\n",
       "  display: inline-block;\n",
       "  background: var(--xr-background-color);\n",
       "  padding-right: 10px;\n",
       "}\n",
       "\n",
       ".xr-attrs dd {\n",
       "  grid-column: 2;\n",
       "  white-space: pre-wrap;\n",
       "  word-break: break-all;\n",
       "}\n",
       "\n",
       ".xr-icon-database,\n",
       ".xr-icon-file-text2 {\n",
       "  display: inline-block;\n",
       "  vertical-align: middle;\n",
       "  width: 1em;\n",
       "  height: 1.5em !important;\n",
       "  stroke-width: 0;\n",
       "  stroke: currentColor;\n",
       "  fill: currentColor;\n",
       "}\n",
       "</style><pre class='xr-text-repr-fallback'>&lt;xarray.Dataset&gt;\n",
       "Dimensions:    (time: 5412, bnds: 2, lat: 96, lon: 144)\n",
       "Coordinates:\n",
       "  * time       (time) object 1850-01-16 12:00:00 ... 2300-12-16 12:00:00\n",
       "  * lat        (lat) float64 -90.0 -88.11 -86.21 -84.32 ... 86.21 88.11 90.0\n",
       "  * lon        (lon) float64 0.0 2.5 5.0 7.5 10.0 ... 350.0 352.5 355.0 357.5\n",
       "Dimensions without coordinates: bnds\n",
       "Data variables:\n",
       "    time_bnds  (time, bnds) object 1850-01-01 00:00:00 ... 2301-01-01 00:00:00\n",
       "    lat_bnds   (lat, bnds) float64 -90.0 -89.05 -89.05 ... 89.05 89.05 90.0\n",
       "    lon_bnds   (lon, bnds) float64 -1.25 1.25 1.25 3.75 ... 356.2 356.2 358.8\n",
       "    pr         (time, lat, lon) float32 ...\n",
       "Attributes: (12/27)\n",
       "    institution:            Norwegian Climate Centre\n",
       "    institute_id:           NCC\n",
       "    experiment_id:          rcp45\n",
       "    source:                 NorESM1-M 2011  atmosphere: CAM-Oslo (CAM4-Oslo-n...\n",
       "    model_id:               NorESM1-M\n",
       "    forcing:                GHG, SA, Oz, Sl, Vl, BC, OC\n",
       "    ...                     ...\n",
       "    title:                  NorESM1-M model output prepared for CMIP5 RCP4.5\n",
       "    parent_experiment:      pre-industrial control\n",
       "    modeling_realm:         atmos\n",
       "    realization:            1\n",
       "    cmor_version:           2.6.0\n",
       "    modification:           Downloaded from Copernicus (Copernicus Climate Ch...</pre><div class='xr-wrap' style='display:none'><div class='xr-header'><div class='xr-obj-type'>xarray.Dataset</div></div><ul class='xr-sections'><li class='xr-section-item'><input id='section-51009ee7-a8e9-43f1-bec3-cdc9e12cda52' class='xr-section-summary-in' type='checkbox' disabled ><label for='section-51009ee7-a8e9-43f1-bec3-cdc9e12cda52' class='xr-section-summary'  title='Expand/collapse section'>Dimensions:</label><div class='xr-section-inline-details'><ul class='xr-dim-list'><li><span class='xr-has-index'>time</span>: 5412</li><li><span>bnds</span>: 2</li><li><span class='xr-has-index'>lat</span>: 96</li><li><span class='xr-has-index'>lon</span>: 144</li></ul></div><div class='xr-section-details'></div></li><li class='xr-section-item'><input id='section-729f4aaa-f3a3-4d1c-90e9-159b0b4642a1' class='xr-section-summary-in' type='checkbox'  checked><label for='section-729f4aaa-f3a3-4d1c-90e9-159b0b4642a1' class='xr-section-summary' >Coordinates: <span>(3)</span></label><div class='xr-section-inline-details'></div><div class='xr-section-details'><ul class='xr-var-list'><li class='xr-var-item'><div class='xr-var-name'><span class='xr-has-index'>time</span></div><div class='xr-var-dims'>(time)</div><div class='xr-var-dtype'>object</div><div class='xr-var-preview xr-preview'>1850-01-16 12:00:00 ... 
2300-12-...</div><input id='attrs-b9916744-a7ad-4909-869a-5c745ac91d34' class='xr-var-attrs-in' type='checkbox' ><label for='attrs-b9916744-a7ad-4909-869a-5c745ac91d34' title='Show/Hide attributes'><svg class='icon xr-icon-file-text2'><use xlink:href='#icon-file-text2'></use></svg></label><input id='data-40801ae9-8543-4d40-ae84-64ee1dbd1fd6' class='xr-var-data-in' type='checkbox'><label for='data-40801ae9-8543-4d40-ae84-64ee1dbd1fd6' title='Show/Hide data repr'><svg class='icon xr-icon-database'><use xlink:href='#icon-database'></use></svg></label><div class='xr-var-attrs'><dl class='xr-attrs'><dt><span>bounds :</span></dt><dd>time_bnds</dd><dt><span>axis :</span></dt><dd>T</dd><dt><span>long_name :</span></dt><dd>time</dd><dt><span>standard_name :</span></dt><dd>time</dd></dl></div><div class='xr-var-data'><pre>array([cftime.DatetimeNoLeap(1850, 1, 16, 12, 0, 0, 0, has_year_zero=True),\n",
       "       cftime.DatetimeNoLeap(1850, 2, 15, 0, 0, 0, 0, has_year_zero=True),\n",
       "       cftime.DatetimeNoLeap(1850, 3, 16, 12, 0, 0, 0, has_year_zero=True),\n",
       "       ...,\n",
       "       cftime.DatetimeNoLeap(2300, 10, 16, 12, 0, 0, 0, has_year_zero=True),\n",
       "       cftime.DatetimeNoLeap(2300, 11, 16, 0, 0, 0, 0, has_year_zero=True),\n",
       "       cftime.DatetimeNoLeap(2300, 12, 16, 12, 0, 0, 0, has_year_zero=True)],\n",
       "      dtype=object)</pre></div></li><li class='xr-var-item'><div class='xr-var-name'><span class='xr-has-index'>lat</span></div><div class='xr-var-dims'>(lat)</div><div class='xr-var-dtype'>float64</div><div class='xr-var-preview xr-preview'>-90.0 -88.11 -86.21 ... 88.11 90.0</div><input id='attrs-88f7a6bd-02bc-437b-aa89-3bf12e6cf8f6' class='xr-var-attrs-in' type='checkbox' ><label for='attrs-88f7a6bd-02bc-437b-aa89-3bf12e6cf8f6' title='Show/Hide attributes'><svg class='icon xr-icon-file-text2'><use xlink:href='#icon-file-text2'></use></svg></label><input id='data-30d7d659-04d2-4497-a41b-a15926d81773' class='xr-var-data-in' type='checkbox'><label for='data-30d7d659-04d2-4497-a41b-a15926d81773' title='Show/Hide data repr'><svg class='icon xr-icon-database'><use xlink:href='#icon-database'></use></svg></label><div class='xr-var-attrs'><dl class='xr-attrs'><dt><span>bounds :</span></dt><dd>lat_bnds</dd><dt><span>units :</span></dt><dd>degrees_north</dd><dt><span>axis :</span></dt><dd>Y</dd><dt><span>long_name :</span></dt><dd>latitude</dd><dt><span>standard_name :</span></dt><dd>latitude</dd></dl></div><div class='xr-var-data'><pre>array([-90.      , -88.105263, -86.210526, -84.315789, -82.421053, -80.526316,\n",
       "       -78.631579, -76.736842, -74.842105, -72.947368, -71.052632, -69.157895,\n",
       "       -67.263158, -65.368421, -63.473684, -61.578947, -59.684211, -57.789474,\n",
       "       -55.894737, -54.      , -52.105263, -50.210526, -48.315789, -46.421053,\n",
       "       -44.526316, -42.631579, -40.736842, -38.842105, -36.947368, -35.052632,\n",
       "       -33.157895, -31.263158, -29.368421, -27.473684, -25.578947, -23.684211,\n",
       "       -21.789474, -19.894737, -18.      , -16.105263, -14.210526, -12.315789,\n",
       "       -10.421053,  -8.526316,  -6.631579,  -4.736842,  -2.842105,  -0.947368,\n",
       "         0.947368,   2.842105,   4.736842,   6.631579,   8.526316,  10.421053,\n",
       "        12.315789,  14.210526,  16.105263,  18.      ,  19.894737,  21.789474,\n",
       "        23.684211,  25.578947,  27.473684,  29.368421,  31.263158,  33.157895,\n",
       "        35.052632,  36.947368,  38.842105,  40.736842,  42.631579,  44.526316,\n",
       "        46.421053,  48.315789,  50.210526,  52.105263,  54.      ,  55.894737,\n",
       "        57.789474,  59.684211,  61.578947,  63.473684,  65.368421,  67.263158,\n",
       "        69.157895,  71.052632,  72.947368,  74.842105,  76.736842,  78.631579,\n",
       "        80.526316,  82.421053,  84.315789,  86.210526,  88.105263,  90.      ])</pre></div></li><li class='xr-var-item'><div class='xr-var-name'><span class='xr-has-index'>lon</span></div><div class='xr-var-dims'>(lon)</div><div class='xr-var-dtype'>float64</div><div class='xr-var-preview xr-preview'>0.0 2.5 5.0 ... 352.5 355.0 357.5</div><input id='attrs-3c52b075-0124-41c9-8160-e64d56ad43e0' class='xr-var-attrs-in' type='checkbox' ><label for='attrs-3c52b075-0124-41c9-8160-e64d56ad43e0' title='Show/Hide attributes'><svg class='icon xr-icon-file-text2'><use xlink:href='#icon-file-text2'></use></svg></label><input id='data-830e1125-193d-41f5-ba16-44c38ab20ebc' class='xr-var-data-in' type='checkbox'><label for='data-830e1125-193d-41f5-ba16-44c38ab20ebc' title='Show/Hide data repr'><svg class='icon xr-icon-database'><use xlink:href='#icon-database'></use></svg></label><div class='xr-var-attrs'><dl class='xr-attrs'><dt><span>bounds :</span></dt><dd>lon_bnds</dd><dt><span>units :</span></dt><dd>degrees_east</dd><dt><span>axis :</span></dt><dd>X</dd><dt><span>long_name :</span></dt><dd>longitude</dd><dt><span>standard_name :</span></dt><dd>longitude</dd></dl></div><div class='xr-var-data'><pre>array([  0. ,   2.5,   5. ,   7.5,  10. ,  12.5,  15. ,  17.5,  20. ,  22.5,\n",
       "        25. ,  27.5,  30. ,  32.5,  35. ,  37.5,  40. ,  42.5,  45. ,  47.5,\n",
       "        50. ,  52.5,  55. ,  57.5,  60. ,  62.5,  65. ,  67.5,  70. ,  72.5,\n",
       "        75. ,  77.5,  80. ,  82.5,  85. ,  87.5,  90. ,  92.5,  95. ,  97.5,\n",
       "       100. , 102.5, 105. , 107.5, 110. , 112.5, 115. , 117.5, 120. , 122.5,\n",
       "       125. , 127.5, 130. , 132.5, 135. , 137.5, 140. , 142.5, 145. , 147.5,\n",
       "       150. , 152.5, 155. , 157.5, 160. , 162.5, 165. , 167.5, 170. , 172.5,\n",
       "       175. , 177.5, 180. , 182.5, 185. , 187.5, 190. , 192.5, 195. , 197.5,\n",
       "       200. , 202.5, 205. , 207.5, 210. , 212.5, 215. , 217.5, 220. , 222.5,\n",
       "       225. , 227.5, 230. , 232.5, 235. , 237.5, 240. , 242.5, 245. , 247.5,\n",
       "       250. , 252.5, 255. , 257.5, 260. , 262.5, 265. , 267.5, 270. , 272.5,\n",
       "       275. , 277.5, 280. , 282.5, 285. , 287.5, 290. , 292.5, 295. , 297.5,\n",
       "       300. , 302.5, 305. , 307.5, 310. , 312.5, 315. , 317.5, 320. , 322.5,\n",
       "       325. , 327.5, 330. , 332.5, 335. , 337.5, 340. , 342.5, 345. , 347.5,\n",
       "       350. , 352.5, 355. , 357.5])</pre></div></li></ul></div></li><li class='xr-section-item'><input id='section-a3f3224a-b19c-40b3-a758-4cbb6b62b1f0' class='xr-section-summary-in' type='checkbox'  checked><label for='section-a3f3224a-b19c-40b3-a758-4cbb6b62b1f0' class='xr-section-summary' >Data variables: <span>(4)</span></label><div class='xr-section-inline-details'></div><div class='xr-section-details'><ul class='xr-var-list'><li class='xr-var-item'><div class='xr-var-name'><span>time_bnds</span></div><div class='xr-var-dims'>(time, bnds)</div><div class='xr-var-dtype'>object</div><div class='xr-var-preview xr-preview'>...</div><input id='attrs-abed9d93-b7e7-4a0c-9e8c-079f7c801455' class='xr-var-attrs-in' type='checkbox' disabled><label for='attrs-abed9d93-b7e7-4a0c-9e8c-079f7c801455' title='Show/Hide attributes'><svg class='icon xr-icon-file-text2'><use xlink:href='#icon-file-text2'></use></svg></label><input id='data-2c08b324-b234-4279-8a09-b0297e339351' class='xr-var-data-in' type='checkbox'><label for='data-2c08b324-b234-4279-8a09-b0297e339351' title='Show/Hide data repr'><svg class='icon xr-icon-database'><use xlink:href='#icon-database'></use></svg></label><div class='xr-var-attrs'><dl class='xr-attrs'></dl></div><div class='xr-var-data'><pre>array([[cftime.DatetimeNoLeap(1850, 1, 1, 0, 0, 0, 0, has_year_zero=True),\n",
       "        cftime.DatetimeNoLeap(1850, 2, 1, 0, 0, 0, 0, has_year_zero=True)],\n",
       "       [cftime.DatetimeNoLeap(1850, 2, 1, 0, 0, 0, 0, has_year_zero=True),\n",
       "        cftime.DatetimeNoLeap(1850, 3, 1, 0, 0, 0, 0, has_year_zero=True)],\n",
       "       [cftime.DatetimeNoLeap(1850, 3, 1, 0, 0, 0, 0, has_year_zero=True),\n",
       "        cftime.DatetimeNoLeap(1850, 4, 1, 0, 0, 0, 0, has_year_zero=True)],\n",
       "       ...,\n",
       "       [cftime.DatetimeNoLeap(2300, 10, 1, 0, 0, 0, 0, has_year_zero=True),\n",
       "        cftime.DatetimeNoLeap(2300, 11, 1, 0, 0, 0, 0, has_year_zero=True)],\n",
       "       [cftime.DatetimeNoLeap(2300, 11, 1, 0, 0, 0, 0, has_year_zero=True),\n",
       "        cftime.DatetimeNoLeap(2300, 12, 1, 0, 0, 0, 0, has_year_zero=True)],\n",
       "       [cftime.DatetimeNoLeap(2300, 12, 1, 0, 0, 0, 0, has_year_zero=True),\n",
       "        cftime.DatetimeNoLeap(2301, 1, 1, 0, 0, 0, 0, has_year_zero=True)]],\n",
       "      dtype=object)</pre></div></li><li class='xr-var-item'><div class='xr-var-name'><span>lat_bnds</span></div><div class='xr-var-dims'>(lat, bnds)</div><div class='xr-var-dtype'>float64</div><div class='xr-var-preview xr-preview'>...</div><input id='attrs-6e9ad836-2968-48b9-92cc-ae4cd76dc87f' class='xr-var-attrs-in' type='checkbox' disabled><label for='attrs-6e9ad836-2968-48b9-92cc-ae4cd76dc87f' title='Show/Hide attributes'><svg class='icon xr-icon-file-text2'><use xlink:href='#icon-file-text2'></use></svg></label><input id='data-72a2e7d0-931a-44d0-b9ba-27ed50998677' class='xr-var-data-in' type='checkbox'><label for='data-72a2e7d0-931a-44d0-b9ba-27ed50998677' title='Show/Hide data repr'><svg class='icon xr-icon-database'><use xlink:href='#icon-database'></use></svg></label><div class='xr-var-attrs'><dl class='xr-attrs'></dl></div><div class='xr-var-data'><pre>array([[-90.      , -89.052632],\n",
       "       [-89.052632, -87.157895],\n",
       "       [-87.157895, -85.263158],\n",
       "       [-85.263158, -83.368421],\n",
       "       [-83.368421, -81.473684],\n",
       "       [-81.473684, -79.578947],\n",
       "       [-79.578947, -77.684211],\n",
       "       [-77.684211, -75.789474],\n",
       "       [-75.789474, -73.894737],\n",
       "       [-73.894737, -72.      ],\n",
       "       [-72.      , -70.105263],\n",
       "       [-70.105263, -68.210526],\n",
       "       [-68.210526, -66.315789],\n",
       "       [-66.315789, -64.421053],\n",
       "       [-64.421053, -62.526316],\n",
       "       [-62.526316, -60.631579],\n",
       "       [-60.631579, -58.736842],\n",
       "       [-58.736842, -56.842105],\n",
       "       [-56.842105, -54.947368],\n",
       "       [-54.947368, -53.052632],\n",
       "       [-53.052632, -51.157895],\n",
       "       [-51.157895, -49.263158],\n",
       "       [-49.263158, -47.368421],\n",
       "       [-47.368421, -45.473684],\n",
       "       [-45.473684, -43.578947],\n",
       "       [-43.578947, -41.684211],\n",
       "       [-41.684211, -39.789474],\n",
       "       [-39.789474, -37.894737],\n",
       "       [-37.894737, -36.      ],\n",
       "       [-36.      , -34.105263],\n",
       "       [-34.105263, -32.210526],\n",
       "       [-32.210526, -30.315789],\n",
       "       [-30.315789, -28.421053],\n",
       "       [-28.421053, -26.526316],\n",
       "       [-26.526316, -24.631579],\n",
       "       [-24.631579, -22.736842],\n",
       "       [-22.736842, -20.842105],\n",
       "       [-20.842105, -18.947368],\n",
       "       [-18.947368, -17.052632],\n",
       "       [-17.052632, -15.157895],\n",
       "       [-15.157895, -13.263158],\n",
       "       [-13.263158, -11.368421],\n",
       "       [-11.368421,  -9.473684],\n",
       "       [ -9.473684,  -7.578947],\n",
       "       [ -7.578947,  -5.684211],\n",
       "       [ -5.684211,  -3.789474],\n",
       "       [ -3.789474,  -1.894737],\n",
       "       [ -1.894737,   0.      ],\n",
       "       [  0.      ,   1.894737],\n",
       "       [  1.894737,   3.789474],\n",
       "       [  3.789474,   5.684211],\n",
       "       [  5.684211,   7.578947],\n",
       "       [  7.578947,   9.473684],\n",
       "       [  9.473684,  11.368421],\n",
       "       [ 11.368421,  13.263158],\n",
       "       [ 13.263158,  15.157895],\n",
       "       [ 15.157895,  17.052632],\n",
       "       [ 17.052632,  18.947368],\n",
       "       [ 18.947368,  20.842105],\n",
       "       [ 20.842105,  22.736842],\n",
       "       [ 22.736842,  24.631579],\n",
       "       [ 24.631579,  26.526316],\n",
       "       [ 26.526316,  28.421053],\n",
       "       [ 28.421053,  30.315789],\n",
       "       [ 30.315789,  32.210526],\n",
       "       [ 32.210526,  34.105263],\n",
       "       [ 34.105263,  36.      ],\n",
       "       [ 36.      ,  37.894737],\n",
       "       [ 37.894737,  39.789474],\n",
       "       [ 39.789474,  41.684211],\n",
       "       [ 41.684211,  43.578947],\n",
       "       [ 43.578947,  45.473684],\n",
       "       [ 45.473684,  47.368421],\n",
       "       [ 47.368421,  49.263158],\n",
       "       [ 49.263158,  51.157895],\n",
       "       [ 51.157895,  53.052632],\n",
       "       [ 53.052632,  54.947368],\n",
       "       [ 54.947368,  56.842105],\n",
       "       [ 56.842105,  58.736842],\n",
       "       [ 58.736842,  60.631579],\n",
       "       [ 60.631579,  62.526316],\n",
       "       [ 62.526316,  64.421053],\n",
       "       [ 64.421053,  66.315789],\n",
       "       [ 66.315789,  68.210526],\n",
       "       [ 68.210526,  70.105263],\n",
       "       [ 70.105263,  72.      ],\n",
       "       [ 72.      ,  73.894737],\n",
       "       [ 73.894737,  75.789474],\n",
       "       [ 75.789474,  77.684211],\n",
       "       [ 77.684211,  79.578947],\n",
       "       [ 79.578947,  81.473684],\n",
       "       [ 81.473684,  83.368421],\n",
       "       [ 83.368421,  85.263158],\n",
       "       [ 85.263158,  87.157895],\n",
       "       [ 87.157895,  89.052632],\n",
       "       [ 89.052632,  90.      ]])</pre></div></li><li class='xr-var-item'><div class='xr-var-name'><span>lon_bnds</span></div><div class='xr-var-dims'>(lon, bnds)</div><div class='xr-var-dtype'>float64</div><div class='xr-var-preview xr-preview'>...</div><input id='attrs-382a0ca9-1c77-4eff-852c-4b4386bea30d' class='xr-var-attrs-in' type='checkbox' disabled><label for='attrs-382a0ca9-1c77-4eff-852c-4b4386bea30d' title='Show/Hide attributes'><svg class='icon xr-icon-file-text2'><use xlink:href='#icon-file-text2'></use></svg></label><input id='data-3159dbf4-5ef2-435d-b961-e45177286c7a' class='xr-var-data-in' type='checkbox'><label for='data-3159dbf4-5ef2-435d-b961-e45177286c7a' title='Show/Hide data repr'><svg class='icon xr-icon-database'><use xlink:href='#icon-database'></use></svg></label><div class='xr-var-attrs'><dl class='xr-attrs'></dl></div><div class='xr-var-data'><pre>array([[ -1.25,   1.25],\n",
       "       [  1.25,   3.75],\n",
       "       [  3.75,   6.25],\n",
       "       ...,\n",
       "       [351.25, 353.75],\n",
       "       [353.75, 356.25],\n",
       "       [356.25, 358.75]])</pre></div></li><li class='xr-var-item'><div class='xr-var-name'><span>pr</span></div><div class='xr-var-dims'>(time, lat, lon)</div><div class='xr-var-dtype'>float32</div><div class='xr-var-preview xr-preview'>...</div><input id='attrs-3b6ae73f-0f94-4056-b2e8-d5877386b090' class='xr-var-attrs-in' type='checkbox' ><label for='attrs-3b6ae73f-0f94-4056-b2e8-d5877386b090' title='Show/Hide attributes'><svg class='icon xr-icon-file-text2'><use xlink:href='#icon-file-text2'></use></svg></label><input id='data-e36ddf12-194e-4aa1-a266-508edb9bcc54' class='xr-var-data-in' type='checkbox'><label for='data-e36ddf12-194e-4aa1-a266-508edb9bcc54' title='Show/Hide data repr'><svg class='icon xr-icon-database'><use xlink:href='#icon-database'></use></svg></label><div class='xr-var-attrs'><dl class='xr-attrs'><dt><span>standard_name :</span></dt><dd>precipitation_flux</dd><dt><span>long_name :</span></dt><dd>Precipitation</dd><dt><span>comment :</span></dt><dd>at surface; includes both liquid and solid phases from all types of clouds (both large-scale and convective)</dd><dt><span>units :</span></dt><dd>kg m-2 s-1</dd><dt><span>original_name :</span></dt><dd>PRECT</dd><dt><span>cell_methods :</span></dt><dd>time: mean</dd><dt><span>cell_measures :</span></dt><dd>area: areacella</dd><dt><span>history :</span></dt><dd>2011-06-01T05:45:35Z altered by CMOR: Converted type from &#x27;d&#x27; to &#x27;f&#x27;.</dd><dt><span>associated_files :</span></dt><dd>baseURL: http://cmip-pcmdi.llnl.gov/CMIP5/dataLocation gridspecFile: gridspec_atmos_fx_NorESM1-M_historical_r0i0p0.nc areacella: areacella_fx_NorESM1-M_historical_r0i0p0.nc</dd></dl></div><div class='xr-var-data'><pre>[74815488 values with dtype=float32]</pre></div></li></ul></div></li><li class='xr-section-item'><input id='section-1af5d7d2-5823-448d-b84b-b46d869890a9' class='xr-section-summary-in' type='checkbox'  ><label for='section-1af5d7d2-5823-448d-b84b-b46d869890a9' class='xr-section-summary' 
>Attributes: <span>(27)</span></label><div class='xr-section-inline-details'></div><div class='xr-section-details'><dl class='xr-attrs'><dt><span>institution :</span></dt><dd>Norwegian Climate Centre</dd><dt><span>institute_id :</span></dt><dd>NCC</dd><dt><span>experiment_id :</span></dt><dd>rcp45</dd><dt><span>source :</span></dt><dd>NorESM1-M 2011  atmosphere: CAM-Oslo (CAM4-Oslo-noresm-ver1_cmip5-r112, f19L26);  ocean: MICOM (MICOM-noresm-ver1_cmip5-r112, gx1v6L53);  sea ice: CICE (CICE4-noresm-ver1_cmip5-r112);  land: CLM (CLM4-noresm-ver1_cmip5-r112)</dd><dt><span>model_id :</span></dt><dd>NorESM1-M</dd><dt><span>forcing :</span></dt><dd>GHG, SA, Oz, Sl, Vl, BC, OC</dd><dt><span>parent_experiment_id :</span></dt><dd>piControl</dd><dt><span>parent_experiment_rip :</span></dt><dd>r1i1p1</dd><dt><span>branch_time :</span></dt><dd>255135.0</dd><dt><span>contact :</span></dt><dd>Please send any requests or bug reports to noresm-ncc@met.no.</dd><dt><span>initialization_method :</span></dt><dd>1</dd><dt><span>physics_version :</span></dt><dd>1</dd><dt><span>tracking_id :</span></dt><dd>5ccde64e-cfe8-47f6-9de8-9ea1621e7781</dd><dt><span>product :</span></dt><dd>output</dd><dt><span>experiment :</span></dt><dd>historical</dd><dt><span>frequency :</span></dt><dd>mon</dd><dt><span>creation_date :</span></dt><dd>2011-06-01T05:45:35Z</dd><dt><span>history :</span></dt><dd>2011-06-01T05:45:35Z CMOR rewrote data to comply with CF standards and CMIP5 requirements.</dd><dt><span>Conventions :</span></dt><dd>CF-1.4</dd><dt><span>project_id :</span></dt><dd>CMIP5</dd><dt><span>table_id :</span></dt><dd>Table Amon (27 April 2011) a5a1c518f52ae340313ba0aada03f862</dd><dt><span>title :</span></dt><dd>NorESM1-M model output prepared for CMIP5 RCP4.5</dd><dt><span>parent_experiment :</span></dt><dd>pre-industrial control</dd><dt><span>modeling_realm :</span></dt><dd>atmos</dd><dt><span>realization :</span></dt><dd>1</dd><dt><span>cmor_version 
:</span></dt><dd>2.6.0</dd><dt><span>modification :</span></dt><dd>Downloaded from Copernicus (Copernicus Climate Change Service, Climate Data Store, (2018): CMIP5 monthly data on single levels. Copernicus Climate Change Service (C3S) Climate Data Store (CDS). DOI: 10.24381/cds.9d44a987 (Accessed on 10-08-2023)) and concatenated/formatted in single time series 1850-2300 for oggm research by R. Chizzola</dd></dl></div></li></ul></div></div>"
      ],
      "text/plain": [
       "<xarray.Dataset>\n",
       "Dimensions:    (time: 5412, bnds: 2, lat: 96, lon: 144)\n",
       "Coordinates:\n",
       "  * time       (time) object 1850-01-16 12:00:00 ... 2300-12-16 12:00:00\n",
       "  * lat        (lat) float64 -90.0 -88.11 -86.21 -84.32 ... 86.21 88.11 90.0\n",
       "  * lon        (lon) float64 0.0 2.5 5.0 7.5 10.0 ... 350.0 352.5 355.0 357.5\n",
       "Dimensions without coordinates: bnds\n",
       "Data variables:\n",
       "    time_bnds  (time, bnds) object ...\n",
       "    lat_bnds   (lat, bnds) float64 ...\n",
       "    lon_bnds   (lon, bnds) float64 ...\n",
       "    pr         (time, lat, lon) float32 ...\n",
       "Attributes: (12/27)\n",
       "    institution:            Norwegian Climate Centre\n",
       "    institute_id:           NCC\n",
       "    experiment_id:          rcp45\n",
       "    source:                 NorESM1-M 2011  atmosphere: CAM-Oslo (CAM4-Oslo-n...\n",
       "    model_id:               NorESM1-M\n",
       "    forcing:                GHG, SA, Oz, Sl, Vl, BC, OC\n",
       "    ...                     ...\n",
       "    title:                  NorESM1-M model output prepared for CMIP5 RCP4.5\n",
       "    parent_experiment:      pre-industrial control\n",
       "    modeling_realm:         atmos\n",
       "    realization:            1\n",
       "    cmor_version:           2.6.0\n",
       "    modification:           Downloaded from Copernicus (Copernicus Climate Ch..."
      ]
     },
     "execution_count": 123,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# open the first NorESM1-M file of the 2300 list to look at its content\n",
    "noresm_2300_path = df_2300.loc[df_2300.gcm == 'NorESM1-M', 'path'].iloc[0]\n",
    "xr.open_dataset(noresm_2300_path)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 87,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2300 files: \n",
      "[-90.         -88.10526316 -86.21052632 -84.31578947 -82.42105263\n",
      " -80.52631579 -78.63157895 -76.73684211 -74.84210526 -72.94736842]\n",
      "_g025.nc files: \n",
      "[-88.75 -86.25 -83.75 -81.25 -78.75 -76.25 -73.75 -71.25 -68.75 -66.25]\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "(None, None)"
      ]
     },
     "execution_count": 87,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# here you see the different grids: the first ten latitudes of the first\n",
    "# NorESM1-M file of each list are printed\n",
    "for label, frame in (('2300 files: ', df_2300), ('_g025.nc files: ', df_2100)):\n",
    "    print(label)\n",
    "    # the context manager closes the file again once the latitudes are read\n",
    "    with xr.open_dataset(frame.loc[frame.gcm == 'NorESM1-M'].iloc[0].path) as ds:\n",
    "        print(ds.lat[:10].values)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 91,
   "metadata": {},
   "outputs": [],
   "source": [
    "df_2100['interpolation'] = '_g025'  # bilinear latitude-longitude grid\n",
    "df_2300['interpolation'] = 'regular' # \"Regular latitude-longitude grid\"\n",
    "\n",
    "\n",
    "def add_time_and_grid_info(df):\n",
    "    \"\"\"Add the 'y0', 'y1' and 'lon_resolution' columns to ``df`` in place.\n",
    "\n",
    "    Every file listed in ``df['path']`` is opened once. 'y0' and 'y1' are the\n",
    "    first and last year of its time axis (stored as strings), and\n",
    "    'lon_resolution' is the difference between the first two longitudes,\n",
    "    formatted with two decimals.\n",
    "\n",
    "    Raises an AssertionError (naming the file) if the time axis does not\n",
    "    start in January or does not end in December.\n",
    "    \"\"\"\n",
    "    for i, row in df.iterrows():\n",
    "        path = row['path']\n",
    "        with xr.open_dataset(path, use_cftime=True) as ds:\n",
    "            df.loc[i, 'y0'] = str(ds['time.year'][0].data)\n",
    "            assert str(ds['time.month'][0].data) == '1', f'{path} does not start in January'\n",
    "            df.loc[i, 'y1'] = str(ds['time.year'][-1].data)\n",
    "            assert str(ds['time.month'][-1].data) == '12', f'{path} does not end in December'\n",
    "            df.loc[i, 'lon_resolution'] = '{:.2f}'.format(float(ds.lon[1] - ds.lon[0]))\n",
    "\n",
    "\n",
    "# same treatment for both file lists\n",
    "for file_list in (df_2100, df_2300):\n",
    "    add_time_and_grid_info(file_list)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 92,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "CESM1-CAM5rcp26\n",
      "CESM1-CAM5rcp45\n",
      "CESM1-CAM5rcp60\n"
     ]
    }
   ],
   "source": [
    "# gcm+rcp labels of the 2100 list, built once instead of on every loop iteration\n",
    "gcm_rcp_2100 = set(df_2100['gcm'] + df_2100['rcp'])\n",
    "# print every gcm+rcp combination of the 2300 list that the 2100 list lacks\n",
    "for gcm_rcp in (df_2300['gcm'] + df_2300['rcp']).unique():\n",
    "    if gcm_rcp not in gcm_rcp_2100:\n",
    "        print(gcm_rcp)\n",
    "# CESM1-CAM5 is missing in the GCMs until 2100, so its 2300 files are appended\n",
    "df_2100x = pd.concat([df_2100, df_2300.loc[df_2300.gcm == 'CESM1-CAM5']])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 93,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(array(['r1i1p1'], dtype=object), array(['r1i1p1'], dtype=object))"
      ]
     },
     "execution_count": 93,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# realizations present in the extended 2100 list and in the 2300 list\n",
    "tuple(frame['rea'].unique() for frame in (df_2100x, df_2300))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 94,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(array(['rcp45', 'historicalGHG', 'rcp60', 'historicalNat', 'rcp26',\n",
       "        'rcp85'], dtype=object),\n",
       " array(['rcp26', 'rcp85', 'rcp45', 'rcp60'], dtype=object))"
      ]
     },
     "execution_count": 94,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# scenarios present in the extended 2100 list and in the 2300 list\n",
    "tuple(frame['rcp'].unique() for frame in (df_2100x, df_2300))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 95,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(array(['pr', 'tas'], dtype=object), array(['pr', 'tas'], dtype=object))"
      ]
     },
     "execution_count": 95,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# variables present in the extended 2100 list and in the 2300 list\n",
    "tuple(frame['var'].unique() for frame in (df_2100x, df_2300))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 96,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array(['NorESM1-M', 'CanESM2', 'CCSM4', 'IPSL-CM5A-LR', 'CNRM-CM5',\n",
       "       'CSIRO-Mk3-6-0', 'GISS-E2-R', 'MPI-ESM-LR', 'GFDL-CM3',\n",
       "       'GFDL-ESM2G', 'CESM1-CAM5'], dtype=object)"
      ]
     },
     "execution_count": 96,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# GCMs present in the extended 2100 list\n",
    "df_2100x['gcm'].unique()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 97,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array(['CanESM2', 'MPI-ESM-LR', 'CESM1-CAM5', 'CSIRO-Mk3-6-0',\n",
       "       'NorESM1-M', 'CCSM4'], dtype=object)"
      ]
     },
     "execution_count": 97,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# GCMs present in the 2300 list\n",
    "df_2300['gcm'].unique()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 114,
   "metadata": {},
   "outputs": [],
   "source": [
    "# every file of the 2300 list has to end in the year 2300\n",
    "assert (df_2300['y1'] == '2300').all()\n",
    "# files whose time axis ends in 2005 are dropped from the extended 2100 list\n",
    "ends_after_2005 = df_2100x['y1'] != '2005'\n",
    "df_2100x = df_2100x.loc[ends_after_2005]\n",
    "for frame, csv_name in ((df_2100x, 'all_gcm_list_2100.csv'),\n",
    "                        (df_2300, 'all_gcm_list_2300.csv')):\n",
    "    frame.to_csv(os.path.join(fdir, csv_name))\n",
    "# the combined list keeps every file of both (unfiltered) lists\n",
    "df = pd.concat([df_2100, df_2300])\n",
    "df.to_csv(os.path.join(fdir, 'all_gcm_list.csv'))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 115,
   "metadata": {},
   "outputs": [],
   "source": [
    "# columns written to the HTML overview, in display order\n",
    "table_columns = ['fname', 'gcm', 'rcp', 'rea', 'var', 'interpolation', 'lon_resolution', 'y0', 'y1']\n",
    "df = df.sort_values(by=['fname', 'var'], ascending=True)\n",
    "table_path = os.path.join(fdir, 'all_gcm_table.html')\n",
    "with open(table_path, 'w') as fo:\n",
    "    df.to_html(fo, columns=table_columns)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 120,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "2100\n",
      "              rcp26 rcp45 rcp60 rcp85\n",
      "CCSM4             X     X     X     X\n",
      "CESM1-CAM5        X     X     X      \n",
      "CNRM-CM5          X     X           X\n",
      "CSIRO-Mk3-6-0     X     X     X     X\n",
      "CanESM2           X     X           X\n",
      "GFDL-CM3          X     X     X     X\n",
      "GFDL-ESM2G        X     X     X     X\n",
      "GISS-E2-R         X     X     X     X\n",
      "IPSL-CM5A-LR      X     X     X     X\n",
      "MPI-ESM-LR        X     X           X\n",
      "NorESM1-M         X     X     X     X\n",
      "\n",
      "\n",
      "2300\n",
      "              rcp26 rcp45 rcp60 rcp85\n",
      "CCSM4                         X     X\n",
      "CESM1-CAM5        X     X     X      \n",
      "CSIRO-Mk3-6-0           X           X\n",
      "CanESM2           X                  \n",
      "MPI-ESM-LR        X     X           X\n",
      "NorESM1-M               X            \n",
      "\n",
      "\n"
     ]
    }
   ],
   "source": [
    "# one GCM x RCP availability table per file list, written as HTML and printed\n",
    "for _df, endyr in [(df_2100x, '2100'), (df_2300, '2300')]:\n",
    "    # availability[gcm][rcp] = 'X' for every combination found in the list\n",
    "    availability = {}\n",
    "    for (gcm, rcp), ss in _df.groupby(['gcm', 'rcp']):\n",
    "        # each combination needs exactly one file per variable; the comparison is\n",
    "        # exact because a substring test would also count e.g. 'prsn' as 'pr'\n",
    "        for var in ('pr', 'tas'):\n",
    "            n_files = (ss['var'] == var).sum()\n",
    "            assert n_files == 1, f'{gcm} {rcp}: expected one {var} file, found {n_files}'\n",
    "        availability.setdefault(gcm, {})[rcp] = 'X'\n",
    "    # build the table in one go instead of enlarging an empty frame cell by cell\n",
    "    odf = pd.DataFrame.from_dict(availability, orient='index')\n",
    "    odf = odf[sorted(odf.columns)]\n",
    "    odf = odf.fillna('')\n",
    "    odf = odf.sort_index()\n",
    "    with open(os.path.join(fdir, f'gcm_table_{endyr}.html'), 'w') as fo:\n",
    "        odf.to_html(fo)\n",
    "    print(endyr)\n",
    "    print(odf)\n",
    "    print('\\n')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3 (ipykernel)",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.12"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}