How to work with the 'Essential Climate Variables for assessment of climate variability from 1979 to present' dataset on Earth Data Hub: analysis of worldwide temperature change since the pre-industrial period¶
Earth Data Hub (EDH) provides innovative access to Earth-related data. This notebook will guide you through accessing and using the https://data.earthdatahub.destine.eu/more-era5/ecv-for-climate-change-1981-2010-anomaly-v0.zarr dataset.
Goal of this tutorial¶
The goal of this tutorial is to answer the following question:
Is the global average temperature changing compared to the pre-industrial period?
To answer this question we will compute the global temperature anomaly with respect to the 1981-2010 reference period and adjust it by the estimated temperature increase since the pre-industrial period (1850-1900).
What you will learn:¶
- how to access the data
- how to select and average the data
- how to plot the results
To access datasets on Earth Data Hub you need to instruct your tools (xarray, Zarr, etc.) to use your EDH personal access token when downloading the data.
To obtain a personal access token you first need to register on the Destination Earth platform. Then, go to the Earth Data Hub account settings, where you can find your default personal access token or create new ones. After retrieving your personal access token, paste it below: ⤵
PAT = "your_personal_access_token"
# e.g. PAT="edh_pat_44bbb7e9192a4c6bb47ddf07d07564eee5d17de8dfc48f7118f88e3bc4a4157f8fe2403f5aa0a2d53441b6922ea9a33a"
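If you prefer not to hard-code the token in the notebook, a minimal alternative sketch is to read it from an environment variable (EDH_PAT is an assumed name, use whatever variable you exported):
import os

# Read the personal access token from an environment variable
# (EDH_PAT is a hypothetical name; adjust it to the one you exported).
PAT = os.environ["EDH_PAT"]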
Working with EDH data¶
Datasets on EDH are often very large and remotely hosted. Typical use implies selecting a portion of the data, followed by one or more reduction steps performed in a local or distributed Dask environment.
The structure of a workflow that uses EDH data typically looks like this:
- data access
- data selection
- (optional) data reduction
- data download
- further operations and visualization
Xarray and Dask work together following a lazy principle. This means that when you access and manipulate a Zarr store, the data is not immediately downloaded and loaded into memory. Instead, Dask constructs a task graph that represents the operations to be performed.
A smart user will first reduce the amount of data that needs to be downloaded and only then explicitly call compute() on it. Once the compute() operation is complete, the data is loaded into memory and available for fast subsequent processing.
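As a minimal illustration of this lazy behaviour (using a small random Dask array rather than EDH data, purely as a sketch):
import dask.array as da

lazy_mean = da.random.random((1000, 1000), chunks=(250, 250)).mean()  # only builds a task graph
value = lazy_mean.compute()  # the work runs here and the result is loaded into memory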
1. Data access¶
To preview the data, only the dataset metadata needs to be downloaded. Xarray does this automatically when you open a Zarr dataset:
import xarray as xr
ds = xr.open_dataset(
f"https://edh:{PAT}@data.earthdatahub.destine.eu/more-era5/ecv-for-climate-change-1981-2010-anomaly-v0",
chunks={},
engine="zarr",
)
ds
<xarray.Dataset> Size: 9GB Dimensions: (latitude: 721, longitude: 1440, valid_time: 548) Coordinates: * latitude (latitude) float64 6kB 90.0 89.75 89.5 ... -89.5 -89.75 -90.0 * longitude (longitude) float64 12kB 0.0 0.25 0.5 0.75 ... 359.2 359.5 359.8 number int64 8B ... surface float64 8B ... * valid_time (valid_time) datetime64[ns] 4kB 1979-01-01 ... 2024-08-01 Data variables: r (valid_time, latitude, longitude) float32 2GB dask.array<chunksize=(120, 256, 256), meta=np.ndarray> siconc (valid_time, latitude, longitude) float32 2GB dask.array<chunksize=(120, 256, 256), meta=np.ndarray> t2m (valid_time, latitude, longitude) float32 2GB dask.array<chunksize=(120, 256, 256), meta=np.ndarray> tp (valid_time, latitude, longitude) float32 2GB dask.array<chunksize=(120, 256, 256), meta=np.ndarray> Attributes: Conventions: CF-1.7 GRIB_centre: ecmf GRIB_centreDescription: European Centre for Medium-Range Weather Forecasts GRIB_edition: 1 GRIB_subCentre: 0 history: 2024-10-03T17:07 GRIB to CDM+CF via cfgrib-0.9.1... institution: European Centre for Medium-Range Weather Forecasts
At this point, no data has been downloaded yet, nor loaded into memory.
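Before selecting anything, you can get a feel for how large the variables are and how they are chunked by inspecting the lazy arrays directly (a quick sketch):
print(ds.t2m.nbytes / 1e9, "GB")  # in-memory size of the full 2 metre temperature variable
print(ds.t2m.chunks)              # Dask chunk layout along (valid_time, latitude, longitude)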
2. Data selection¶
First, we select the 2 metre temperature anomaly from the dataset:
xr.set_options(keep_attrs=True)
t2m_anomaly = ds.t2m
t2m_anomaly.attrs["units"] = "°C"
t2m_anomaly.attrs["long_name"] = "Temperature variation"
t2m_anomaly
<xarray.DataArray 't2m' (valid_time: 548, latitude: 721, longitude: 1440)> Size: 2GB dask.array<open_dataset-t2m, shape=(548, 721, 1440), dtype=float32, chunksize=(120, 256, 256), chunktype=numpy.ndarray> Coordinates: * latitude (latitude) float64 6kB 90.0 89.75 89.5 ... -89.5 -89.75 -90.0 * longitude (longitude) float64 12kB 0.0 0.25 0.5 0.75 ... 359.2 359.5 359.8 number int64 8B ... surface float64 8B ... * valid_time (valid_time) datetime64[ns] 4kB 1979-01-01 ... 2024-08-01 Attributes: (12/31) GRIB_NV: 0 GRIB_Nx: 1440 GRIB_Ny: 721 GRIB_cfName: unknown GRIB_cfVarName: t2m GRIB_dataType: an ... ... GRIB_typeOfLevel: surface GRIB_units: K GRIB_uvRelativeToGrid: 0 long_name: Temperature variation standard_name: unknown units: °C
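If you only need part of the dataset, you can narrow the selection before any reduction. As an illustrative sketch (the time and space bounds below are arbitrary and not required by this tutorial), restricting the anomaly to the 1981-2010 reference period and to a European window would look like:
t2m_anomaly_subset = t2m_anomaly.sel(
    valid_time=slice("1981-01-01", "2010-12-31"),
    latitude=slice(72, 30),   # latitude is stored in decreasing order
    longitude=slice(0, 45),
)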
3. Data reduction¶
We want to compute the worldwide average of the 2 metre temperature anomaly (referenced to 1981-2010). This is easy in Xarray. However, because the data lies on a regular latitude-longitude grid, grid points near the poles cover much smaller areas than points near the equator, so we use an appropriately weighted average based on the cosine of the latitude:
import numpy as np
xr.set_options(keep_attrs=True)
weight = np.pi / 2 * np.cos(np.deg2rad(t2m_anomaly.latitude))  # cosine-of-latitude weights, scaled so their mean is ~1
t2m_anomaly_global_1981_2010 = (t2m_anomaly * weight).mean(["latitude", "longitude"])
t2m_anomaly_global_1981_2010
<xarray.DataArray (valid_time: 548)> Size: 4kB dask.array<mean_agg-aggregate, shape=(548,), dtype=float64, chunksize=(120,), chunktype=numpy.ndarray> Coordinates: number int64 8B 0 surface float64 8B 0.0 * valid_time (valid_time) datetime64[ns] 4kB 1979-01-01 ... 2024-08-01 Attributes: (12/31) GRIB_NV: 0 GRIB_Nx: 1440 GRIB_Ny: 721 GRIB_cfName: unknown GRIB_cfVarName: t2m GRIB_dataType: an ... ... GRIB_typeOfLevel: surface GRIB_units: K GRIB_uvRelativeToGrid: 0 long_name: Temperature variation standard_name: unknown units: °C
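The π/2 factor rescales the cosine weights so that their average over the latitude grid is approximately 1, which lets the plain mean above approximate an area-weighted mean. An equivalent and arguably more explicit alternative is xarray's built-in weighted aggregation (a sketch; the variable names are illustrative):
weights = np.cos(np.deg2rad(t2m_anomaly.latitude))
t2m_anomaly_global_weighted = t2m_anomaly.weighted(weights).mean(["latitude", "longitude"])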
4. Data download¶
This is the phase where we explicitly trigger the download of the data. To do so, we call compute() on the previously averaged temperature. The result will be small enough to easily fit into memory. Remember to assign the return value of compute() to a new variable, so that the data is kept in memory.
We can measure the time it takes:
%%time
t2m_anomaly_global_1981_2010_computed = t2m_anomaly_global_1981_2010.compute()
CPU times: user 16.6 s, sys: 6.28 s, total: 22.9 s Wall time: 14 s
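If you would like feedback while the data is being fetched, you can run the same compute() inside Dask's local progress bar (a sketch using dask.diagnostics, shipped with Dask):
from dask.diagnostics import ProgressBar

with ProgressBar():
    t2m_anomaly_global_1981_2010_computed = t2m_anomaly_global_1981_2010.compute()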
5. Visualization¶
This is the 2 metre temperature anomaly with respect to the 1981-2010 reference period:
import matplotlib.pyplot as plt
t2m_anomaly_global_1981_2010_computed.plot()
plt.title("2 meters temperature anomaly with respect to 1981-2010 reference period")
Text(0.5, 1.0, '2 meters temperature anomaly with respect to 1981-2010 reference period')
To obtain the 2 metre temperature anomaly with respect to the 1850-1900 reference period, we must add the global temperature increase of the 1981-2010 period over the pre-industrial era. This is estimated to be 0.63°C, as explained in the Copernicus Climate Bulletin.
t2m_anomaly_global_pre_industrial = 0.63 + t2m_anomaly_global_1981_2010_computed
Finally, we can visualize the 2 metre temperature anomaly with respect to the pre-industrial period:
t2m_anomaly_global_pre_industrial.plot()
plt.title("2 meters temperature anomaly with respect to the pre-industrial period")
Text(0.5, 1.0, '2 meters temperature anomaly with respect to the pre-industrial period')
We can also take a look at the 12-month running average:
t2m_anomaly_global_pre_industrial_12_month = t2m_anomaly_global_pre_industrial.rolling(valid_time=12).mean()
t2m_anomaly_global_pre_industrial_12_month.plot()
plt.title("2 meters temperature anomaly with respect to the pre-industrial period, 12 months rolling average")
Text(0.5, 1.0, '2 meters temperature anomaly with respect to the pre-industrial period, 12 months rolling average')
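Another common way to smooth the monthly signal is to aggregate it to annual means. As a short complementary sketch using xarray's resample (the variable name is illustrative; the last, incomplete year is averaged over the available months only):
t2m_anomaly_global_pre_industrial_annual = t2m_anomaly_global_pre_industrial.resample(valid_time="1YS").mean()
t2m_anomaly_global_pre_industrial_annual.plot()
plt.title("2 meters temperature anomaly with respect to the pre-industrial period, annual mean")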