"""Datasets for models
"""
# Any commits made to this module between 2015-05-01 and 2017-03-01
# by Gerrit Holl are developed for the EC project “Fidelity and
# Uncertainty in Climate Data Records from Earth Observations (FIDUCEO)”.
# Grant agreement: 638822
# 
# All those contributions are dual-licensed under the MIT license for use
# in typhon, and the GNU General Public License version 3.
import datetime
import numpy
from . import dataset
[docs]
class ERAInterim(dataset.NetCDFDataset, dataset.MultiFileDataset):
    # example path:
    # /badc/ecmwf-era-interim/data/gg/as/2015/01/01/ggas201501011200.nc
    name = section = "era_interim"
    subdir = "data/{AA:s}/{B:s}{C:s}/{year:04d}/{month:02d}/{day:02d}"
    re = (r"(?P<AA>[a-z]{2})(?P<B>[a-z])(?P<C>[a-z])"
          r"(?P<year>\d{4})(?P<month>\d{2})(?P<day>\d{2})"
          r"(?P<hour>\d{2})(?P<minute>\d{2})\.nc")
    start_date = datetime.datetime(1979, 1, 1, 0, 0, 0)
    end_date = datetime.datetime(2016, 1, 1, 0, 0, 0)
    granule_duration = datetime.timedelta(hours=6)
    def _read(self, f, *args, **kwargs):
        # may need to convert, but I currently need gg/as which on CEMS is
        # already in converted format, so will assume NetCDF
        (M, extra) = super()._read(f, *args,
                          pseudo_fields={"time": self._get_time_from_ds},
                          prim="t",
                          **kwargs)
        return (M, extra)
    @staticmethod
    def _get_time_from_ds(ds):
        epoch = datetime.datetime.strptime(ds["t"].time_origin,
                                           "%d-%b-%Y:%H:%M:%S")
        return numpy.datetime64(epoch) + ds["t"][:].astype("timedelta64[D]")