Climate Adaptation Digital Twin: winter temperature in Germany and Heating Degree Days in Darmstadt
This notebook will guide you through accessing and using the https://cacheb.dcms.destine.eu/d1-climate-dt/ScenarioMIP-SSP3-7.0-IFS-NEMO-0001-high-sfc-v0.zarr dataset. Access to this dataset is restricted to authorized users only, via the Data Cache Management service.
To access the Data Cache Management service you need to instruct your tools (e.g. Xarray, Zarr...) to authenticate with the appropriate access token. This can be done by running the code snippets below.
First, make sure you have an account on the Destination Earth platform. Then run the following cell, filling in your Destination Earth username and password when asked:
%%capture cap
%run ../cacheb/cacheb-authentication.py
from pathlib import Path
with open(Path.home() / ".netrc", "a") as fp:
    fp.write(cap.stdout)
⚠ NOTE: the generated password is valid for a limited period of time, and needs to be regenerated and reconfigured periodically by running the cells above.
Goal of this tutorial
The first goal of this tutorial is to plot the average winter 2 metre temperature in Germany for the years 2020-2039.
The second goal is to calculate the Heating Degree Days (HDD) in Darmstadt over the same period.
What you will learn:
- how to access the dataset
- how to select and reduce the data
- how to plot the results
Working with EDH data
Datasets on EDH are typically very large and remotely hosted. Typical use implies a selection of the data, followed by one or more reduction steps performed in a local or distributed Dask environment.
The structure of a workflow that uses EDH data typically looks like this:
- data access
- data selection
- (optional) data reduction
- data download
- further operations and visualization
Xarray and Dask work together following a lazy principle. This means that when you access and manipulate a Zarr store, the data is not immediately downloaded and loaded into memory. Instead, Dask constructs a task graph that represents the operations to be performed.
A smart user will first reduce the amount of data that needs to be downloaded, and only then explicitly call compute() on it. Once the compute() operation is complete, the data is loaded into memory and available for subsequent fast processing.
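To see the lazy principle in action, here is a minimal sketch using a small synthetic Dask array (not EDH data):
import dask.array as da

arr = da.ones((1000, 1000), chunks=(100, 100))  # no data in memory yet
result = (arr * 2).mean()  # only builds a task graph, nothing is computed
print(result)            # still a lazy dask.array
print(result.compute())  # 2.0 -- now the graph runs and the value is in memory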
1. Data access
import xarray as xr
url = "https://cacheb.dcms.destine.eu/d1-climate-dt/ScenarioMIP-SSP3-7.0-IFS-NEMO-0001-high-sfc-v0.zarr"
ds = xr.open_dataset(
    url,
    chunks={},  # lazy loading: use the dataset's own (Zarr) chunking via Dask
    engine="zarr",
    storage_options={"client_kwargs": {"trust_env": True}},  # pick up the access token from ~/.netrc
)
ds
<xarray.Dataset> Size: 188TB
Dimensions:    (time: 175320, latitude: 4096, longitude: 8193)
Coordinates:
  * latitude   (latitude) float64 33kB -90.0 -89.96 -89.91 ... 89.91 89.96 90.0
  * longitude  (longitude) float64 66kB -180.0 -180.0 -179.9 ... 180.0 180.0
    step       timedelta64[ns] 8B ...
    surface    float64 8B ...
  * time       (time) datetime64[ns] 1MB 2020-01-01 ... 2039-12-31T23:00:00
Data variables:
    d2m        (time, latitude, longitude) float32 24TB dask.array<chunksize=(48, 512, 512), meta=np.ndarray>
    sd         (time, latitude, longitude) float32 24TB dask.array<chunksize=(48, 512, 512), meta=np.ndarray>
    ssr        (time, latitude, longitude) float32 24TB dask.array<chunksize=(48, 512, 512), meta=np.ndarray>
    str        (time, latitude, longitude) float32 24TB dask.array<chunksize=(48, 512, 512), meta=np.ndarray>
    t2m        (time, latitude, longitude) float32 24TB dask.array<chunksize=(48, 512, 512), meta=np.ndarray>
    tprate     (time, latitude, longitude) float32 24TB dask.array<chunksize=(48, 512, 512), meta=np.ndarray>
    u10        (time, latitude, longitude) float32 24TB dask.array<chunksize=(48, 512, 512), meta=np.ndarray>
    v10        (time, latitude, longitude) float32 24TB dask.array<chunksize=(48, 512, 512), meta=np.ndarray>
Attributes:
    Conventions:             CF-1.7
    GRIB_centre:             ecmf
    GRIB_centreDescription:  European Centre for Medium-Range Weather Forecasts
    GRIB_edition:            2
    GRIB_subCentre:          1003
    history:                 2024-06-06T16:50 GRIB to CDM+CF via cfgrib-0.9.1...
    institution:             European Centre for Medium-Range Weather Forecasts
⚠ At this point, no data has been downloaded yet, nor loaded into memory.
2. Data selection
We first select the 2 metre temperature and convert it from kelvin to degrees Celsius.
xr.set_options(keep_attrs=True)  # keep variable attributes through arithmetic operations

t2m = ds.t2m - 273.15  # K -> °C
t2m.attrs["units"] = "°C"
t2m
<xarray.DataArray 't2m' (time: 175320, latitude: 4096, longitude: 8193)> Size: 24TB
dask.array<sub, shape=(175320, 4096, 8193), dtype=float32, chunksize=(48, 512, 512), chunktype=numpy.ndarray>
Coordinates:
  * latitude   (latitude) float64 33kB -90.0 -89.96 -89.91 ... 89.91 89.96 90.0
  * longitude  (longitude) float64 66kB -180.0 -180.0 -179.9 ... 180.0 180.0
    step       timedelta64[ns] 8B ...
    surface    float64 8B ...
  * time       (time) datetime64[ns] 1MB 2020-01-01 ... 2039-12-31T23:00:00
Attributes: (12/19)
    GRIB_NV:                         0
    GRIB_cfName:                     air_temperature
    GRIB_cfVarName:                  t2m
    GRIB_dataType:                   fc
    GRIB_gridDefinitionDescription:  150
    GRIB_gridType:                   healpix
    ...                              ...
    GRIB_typeOfLevel:                heightAboveGround
    GRIB_units:                      K
    last_restart_dim_updated:        175320
    long_name:                       2 metre temperature
    standard_name:                   air_temperature
    units:                           °C
As xarray shows, the size of the t2m DataArray is around 24 TB. We will now narrow down the selection as much as possible.
We select only the area of Germany and the meteorological winter months (December, January, February).
germany = {'latitude': slice(46, 56), 'longitude': slice(5, 16)}
t2m_germany = t2m.sel(**germany)
t2m_germany_winter = t2m_germany[t2m_germany.time.dt.month.isin([12, 1, 2])]
t2m_germany_winter
<xarray.DataArray 't2m' (time: 43320, latitude: 228, longitude: 251)> Size: 10GB
dask.array<getitem, shape=(43320, 228, 251), dtype=float32, chunksize=(47, 228, 251), chunktype=numpy.ndarray>
Coordinates:
  * latitude   (latitude) float64 2kB 46.0 46.04 46.09 ... 55.89 55.93 55.98
  * longitude  (longitude) float64 2kB 5.01 5.054 5.098 ... 15.91 15.95 16.0
    step       timedelta64[ns] 8B ...
    surface    float64 8B ...
  * time       (time) datetime64[ns] 347kB 2020-01-01 ... 2039-12-31T23:00:00
Attributes: (12/19)
    GRIB_NV:                         0
    GRIB_cfName:                     air_temperature
    GRIB_cfVarName:                  t2m
    GRIB_dataType:                   fc
    GRIB_gridDefinitionDescription:  150
    GRIB_gridType:                   healpix
    ...                              ...
    GRIB_typeOfLevel:                heightAboveGround
    GRIB_units:                      K
    last_restart_dim_updated:        175320
    long_name:                       2 metre temperature
    standard_name:                   air_temperature
    units:                           °C
Notice that the size of the array dropped to around 10 GB (in memory). However, due to the chunked structure of the DataArray, xarray must download every chunk that contains a portion of the selected data.
To estimate the size of the download, we can use the costing.py module. This estimate must be made before we apply any reduction operation.
import costing
costing.estimate_download_size(t2m, t2m_germany_winter)
estimated_needed_chunks: 922
estimated_memory_size: 46.406 GB
estimated_download_size: 4.641 GB
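For intuition only, the sketch below shows a back-of-the-envelope version of such an estimate. It assumes a contiguous, chunk-aligned selection and a fixed compression ratio of 10; the actual costing.py implementation may differ:
import math

def rough_download_estimate(full, subset, compression_ratio=10):
    # every store chunk that overlaps the selection must be downloaded in full
    chunk_shape = dict(zip(full.dims, (c[0] for c in full.data.chunks)))
    n_chunks = 1
    for dim, size in subset.sizes.items():
        n_chunks *= math.ceil(size / chunk_shape[dim])
    chunk_bytes = math.prod(chunk_shape.values()) * full.dtype.itemsize
    memory_size = n_chunks * chunk_bytes  # uncompressed bytes to fetch
    print(f"chunks: {n_chunks}, memory: {memory_size / 1e9:.3f} GB, "
          f"download: {memory_size / compression_ratio / 1e9:.3f} GB")

rough_download_estimate(t2m, t2m_germany_winter)
With the selection above this yields roughly 900 chunks and about 45 GB in memory, in the same ballpark as the costing.py figures.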
3. Data reduction
We average the 2 metre temperature quarterly, starting on December 1st: resampling with QS-DEC puts each December-January-February winter into a single quarter labelled by its December 1st. This is also a lazy operation.
t2m_germany_winter_mean = t2m_germany_winter.resample(time='QS-DEC').mean(dim="time")
t2m_germany_winter_mean
<xarray.DataArray 't2m' (time: 81, latitude: 228, longitude: 251)> Size: 19MB
dask.array<transpose, shape=(81, 228, 251), dtype=float32, chunksize=(1, 228, 251), chunktype=numpy.ndarray>
Coordinates:
  * latitude   (latitude) float64 2kB 46.0 46.04 46.09 ... 55.89 55.93 55.98
  * longitude  (longitude) float64 2kB 5.01 5.054 5.098 ... 15.91 15.95 16.0
    step       timedelta64[ns] 8B ...
    surface    float64 8B ...
  * time       (time) datetime64[ns] 648B 2019-12-01 2020-03-01 ... 2039-12-01
Attributes: (12/19)
    GRIB_NV:                         0
    GRIB_cfName:                     air_temperature
    GRIB_cfVarName:                  t2m
    GRIB_dataType:                   fc
    GRIB_gridDefinitionDescription:  150
    GRIB_gridType:                   healpix
    ...                              ...
    GRIB_typeOfLevel:                heightAboveGround
    GRIB_units:                      K
    last_restart_dim_updated:        175320
    long_name:                       2 metre temperature
    standard_name:                   air_temperature
    units:                           °C
4. Data download
This is the phase where we explicitly trigger the download of the data. Remember to assign the return value of compute() to a new variable, so that the data is kept in memory.
%%time
t2m_germany_winter_mean_computed = t2m_germany_winter_mean.compute()
CPU times: user 3min 53s, sys: 1min 21s, total: 5min 14s
Wall time: 1min 48s
The QS-DEC resampling also creates quarters that contain no winter months; their means are all-NaN, so we drop them.
t2m_germany_winter_mean_computed = t2m_germany_winter_mean_computed.dropna("time")
5. Visualization
We will now create and display an animation of the average winter 2 metre temperature in Germany for the years 2020-2039.
import pandas as pd
import matplotlib.pyplot as plt
import cartopy.crs as ccrs
import cartopy.feature as cfeature
from matplotlib.animation import FuncAnimation
from IPython.display import HTML
fig, ax = plt.subplots(subplot_kw={'projection': ccrs.PlateCarree()})
ax.add_feature(cfeature.COASTLINE, linewidth=0.5)
ax.add_feature(cfeature.BORDERS, linestyle=':', linewidth=0.5)
ax.add_feature(cfeature.OCEAN, facecolor='lightblue', zorder=2)
ax.gridlines(draw_labels=True, zorder=3, color="white", alpha=0.5)
# initial frame; fix vmin/vmax so the colorbar stays consistent across animation frames
t2m_germany_winter_mean_computed.isel(time=0).plot(
    ax=ax,
    transform=ccrs.PlateCarree(),
    cmap='RdBu_r',
    vmin=-25,
    vmax=25,
    add_colorbar=True,
    cbar_kwargs={'orientation': 'vertical', 'shrink': 0.9, 'pad': 0.15},
)
# function to update the plot for each frame (each timestep)
def update(frame):
    data = t2m_germany_winter_mean_computed.isel(time=frame)
    plot = data.plot(
        ax=ax,
        transform=ccrs.PlateCarree(),
        cmap='RdBu_r',
        vmin=-25,
        vmax=25,
        add_colorbar=False
    )
    ax.set_title(f"Time: {pd.Timestamp(data['time'].values).strftime('%Y-%m-%d')}")
    return plot
anim = FuncAnimation(fig, update, frames=len(t2m_germany_winter_mean_computed['time']), repeat=True) # Create the animation
plt.close() # close the static plot to avoid duplicate display
HTML(anim.to_jshtml()) # display the animation in the notebook
Heating Degree Days (HDD) in Darmstadt
Let us now investigate the Heating Degree Days in Darmstadt. We start again from the 2 metre temperature.
t2m
<xarray.DataArray 't2m' (time: 175320, latitude: 4096, longitude: 8193)> Size: 24TB
dask.array<sub, shape=(175320, 4096, 8193), dtype=float32, chunksize=(48, 512, 512), chunktype=numpy.ndarray>
Coordinates:
  * latitude   (latitude) float64 33kB -90.0 -89.96 -89.91 ... 89.91 89.96 90.0
  * longitude  (longitude) float64 66kB -180.0 -180.0 -179.9 ... 180.0 180.0
    step       timedelta64[ns] 8B ...
    surface    float64 8B ...
  * time       (time) datetime64[ns] 1MB 2020-01-01 ... 2039-12-31T23:00:00
Attributes: (12/19)
    GRIB_NV:                         0
    GRIB_cfName:                     air_temperature
    GRIB_cfVarName:                  t2m
    GRIB_dataType:                   fc
    GRIB_gridDefinitionDescription:  150
    GRIB_gridType:                   healpix
    ...                              ...
    GRIB_typeOfLevel:                heightAboveGround
    GRIB_units:                      K
    last_restart_dim_updated:        175320
    long_name:                       2 metre temperature
    standard_name:                   air_temperature
    units:                           °C
We narrow down the selection to the grid point closest to Darmstadt.
darmstadt = {"latitude": 49.88, "longitude": 8.65}
base_temperature = 15 #[°C]
t2m_darmstadt = t2m.sel(darmstadt, method="nearest")
t2m_darmstadt
<xarray.DataArray 't2m' (time: 175320)> Size: 701kB
dask.array<getitem, shape=(175320,), dtype=float32, chunksize=(48,), chunktype=numpy.ndarray>
Coordinates:
    latitude   float64 8B 49.87
    longitude  float64 8B 8.657
    step       timedelta64[ns] 8B ...
    surface    float64 8B ...
  * time       (time) datetime64[ns] 1MB 2020-01-01 ... 2039-12-31T23:00:00
Attributes: (12/19)
    GRIB_NV:                         0
    GRIB_cfName:                     air_temperature
    GRIB_cfVarName:                  t2m
    GRIB_dataType:                   fc
    GRIB_gridDefinitionDescription:  150
    GRIB_gridType:                   healpix
    ...                              ...
    GRIB_typeOfLevel:                heightAboveGround
    GRIB_units:                      K
    last_restart_dim_updated:        175320
    long_name:                       2 metre temperature
    standard_name:                   air_temperature
    units:                           °C
We estimate the cost of the download with the costing.py module.
costing.estimate_download_size(t2m, t2m_darmstadt)
estimated_needed_chunks: 3653
estimated_memory_size: 183.862 GB
estimated_download_size: 18.386 GB
We compute the HDD in Darmstadt with a very simplified formula: each day contributes the amount (in °C) by which its daily mean temperature falls below the base temperature:
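$$\mathrm{HDD}_{\mathrm{year}} = \sum_{d \,\in\, \mathrm{year}} \max\left(0,\ T_{\mathrm{base}} - \bar{T}_d\right)$$
where $\bar{T}_d$ is the daily mean 2 metre temperature and $T_{\mathrm{base}} = 15$ °C, matching the code below.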
t2m_darmstadt_daily_mean = t2m_darmstadt.resample(time='1D').mean(dim='time')  # daily mean temperature
diff = base_temperature - t2m_darmstadt_daily_mean
hdd = diff.where(diff > 0).groupby("time.year").sum()  # only days below the base temperature contribute
We explicitly trigger the download of the data. Remember to assign the return value of compute() to a new variable, so that the data is kept in memory.
%%time
hdd_computed = hdd.compute()
CPU times: user 8min 48s, sys: 4min 53s, total: 13min 41s
Wall time: 3min 43s
We can finally visualize the HDD in Darmstadt.
plt.style.use("seaborn-v0_8-darkgrid")

fig, ax = plt.subplots()
plt.bar(hdd_computed.year, hdd_computed.values, color='#ff0000', alpha=0.7)  # use the computed (in-memory) data
plt.xlabel('time')
plt.ylabel('HDD [°C]')
plt.grid(axis='y', alpha=0.75)
plt.title('Heating Degree Days in Darmstadt')
plt.xticks(hdd_computed.year[::2]);