# Source code for typhon.files.handlers.common

from collections import defaultdict
from copy import copy
from datetime import datetime
from functools import wraps
import glob
from inspect import signature, ismethod
import os
import pickle
import warnings

import netCDF4
import pandas as pd
import xarray as xr
import numpy as np

from fsspec.implementations.local import LocalFileSystem

# The HDF4 file handler needs pyhdf, this might be very tricky to install if
# you cannot use anaconda. Hence, I do not want it to be a hard dependency:
pyhdf_is_installed = False
try:
    from pyhdf import HDF, VS, V
    from pyhdf.SD import SD, SDC
    pyhdf_is_installed = True
except ImportError:
    pass

# The HDF5 file handler needs h5py, this might be very tricky to install if
# you cannot use anaconda. Hence, I do not want it to be a hard dependency:
h5py_is_installed = False
try:
    import h5py
    h5py_is_installed = True
except ImportError:
    pass

# Names exported by a star-import of this module. The commented-out entries
# refer to handlers that only exist as commented-out code further down in
# this module.
# NOTE(review): FSNetCDF is defined in this module but not listed here -
# confirm whether that is intentional.
__all__ = [
    'CSV',
    'FileHandler',
    'FileInfo',
    'HDF4',
    'HDF5',
    'NetCDF4',
    'Plotter',
    'expects_file_info',
    # 'Numpy',
    # 'Pickle',
    # 'XML'
]


def parametrized(dec):
    """Turn a decorator that needs extra arguments into a decorator factory

    The wrapped decorator *dec* must take the function to decorate as its
    first argument, followed by its own parameters. After applying
    ``parametrized`` it is used as ``@dec(*args, **kwargs)``; the decorated
    function is then replaced by ``dec(function, *args, **kwargs)``.
    See also https://stackoverflow.com/a/26151604

    Args:
        dec: A decorator function

    Returns:
        A function that accepts the decorator's parameters and returns the
        actual (one-argument) decorator.
    """
    def layer(*dec_args, **dec_kwargs):
        # The returned callable receives the function that is decorated and
        # forwards it together with the stored decorator parameters.
        return lambda func: dec(func, *dec_args, **dec_kwargs)
    return layer


@parametrized
def expects_file_info(method, pos=None, key=None):
    """Convert a method argument to a :class:`FileInfo` object

    This is a decorator function that can take parameters.

    If the argument is already a FileInfo object, nothing happens. The
    argument is converted regardless of whether the caller passes it
    positionally or as keyword argument. If it is not passed at all, the
    decorated method is called unchanged (and reports the missing argument
    itself).

    Args:
        method: Method object that should be decorated.
        pos: The index of the file info in the positional argument list.
            Default is 1 (assumes to decorate a method). If the argument is
            not found at this position, the name of the parameter at this
            position is looked up in the keyword arguments instead.
        key: The key of the file info in the key word argument dict.

    Returns:
        The return value of the decorated method.

    Examples:

        .. code-block:: python

            @expects_file_info(pos=0)
            def read(file, *args, **kwargs):
                # file is a FileInfo object now with the attribute path
                # containing "path/to/file.txt"
                ...

            read("path/to/file.txt")

    """

    if pos is None and key is None:
        pos = 1

    # Name under which the file argument may show up in the keyword
    # arguments. If no explicit key is given, it is derived from the
    # signature of the decorated method.
    keyword = key
    if keyword is None:
        try:
            param_names = list(signature(method).parameters)
        except (TypeError, ValueError):
            # Not every callable can be introspected.
            param_names = []
        if 0 <= pos < len(param_names):
            keyword = param_names[pos]

    @wraps(method)
    def wrapper(*args, **kwargs):
        args = list(args)
        if pos is not None and -len(args) <= pos < len(args):
            if not isinstance(args[pos], FileInfo):
                args[pos] = FileInfo(args[pos])
        elif keyword is not None and keyword in kwargs:
            if not isinstance(kwargs[keyword], FileInfo):
                kwargs[keyword] = FileInfo(kwargs[keyword])

        return method(*args, **kwargs)
    return wrapper


def _xarray_rename_fields(dataset, mapping):
    if mapping is not None:
        # Maybe some variables should be renamed that are not in the
        # dataset any longer?
        names = set(dataset.dims.keys()) | set(dataset.variables.keys())

        mapping = {
            old_name: new_name
            for old_name, new_name in mapping.items()
            if old_name in names
        }

        dataset = dataset.rename(mapping)

    return dataset



class FileHandler:
    """Base file handler class.

    This can be used alone or with the :class:`~typhon.files.fileset.FileSet`
    classes. You can either initialize specific *reader*, *info* or *writer*
    functions or you can inherit from this class and override its methods. If
    you need a very specialised and reusable file handler class, you should
    consider following the second approach.
    """

    def __init__(
            self, reader=None, info=None, writer=None, **kwargs):
        """Initialize a file handler object.

        Args:
            reader: Reference to a function that defines how to read a given
                file and returns an object with the read data. The function
                must accept a :class:`FileInfo` object as first parameter.
            info: Reference to a function that returns a :class:`FileInfo`
                object with information about the given file. You cannot use
                the :meth:`get_info` without setting this parameter. The
                function must accept a filename as string as first parameter.
            writer: Reference to a function that defines how to write the data
                to a file. The function must accept the data object as first
                and a :class:`FileInfo` object as second parameter.
            **kwargs: Accepted but not used by this base class.
        """

        self.reader = reader
        self.info = info
        self.writer = writer

        # If you want to ravel / flat the data coming from this file handler
        # (e.g., this is necessary for collocation routines), you need the
        # dimension names that you can stack on top each other.
        self.stack_dims = {}

    @staticmethod
    def _takes_more_than(func, number_args):
        """Check whether *func* declares more than *number_args* parameters

        `inspect.signature` already leaves out the bound `self` / `cls`
        parameter of bound methods, hence plain functions and bound methods
        are treated alike.
        """
        return len(signature(func).parameters) > number_args

    @expects_file_info()
    def get_info(self, filename, **kwargs):
        """Return a :class:`FileInfo` object with parameters about the
        file content.

        Notes:
            This is the base class method. It only delegates to the *info*
            function given during initialisation.

        Args:
            filename: A string containing path and name or a :class:`FileInfo`
                object of the file of which to get the information about.
            **kwargs: Additional keyword arguments. They are only passed on
                if the *info* function declares more than one parameter.

        Returns:
            A :class:`FileInfo` object.

        Raises:
            NotImplementedError: If no *info* function was set.
        """
        if self.info is None:
            raise NotImplementedError(
                "This file handler does not support getting information "
                "about a file. You should use a different file handler.")

        # Some functions do not accept additional key word arguments (via
        # kwargs).
        if self._takes_more_than(self.info, 1):
            return self.info(filename, **kwargs)
        return self.info(filename)

    @expects_file_info()
    def read(self, filename, **kwargs):
        """Open a file by its name, read its content and return it

        Notes:
            This is the base class method. It only delegates to the *reader*
            function given during initialisation.

        Args:
            filename: A string containing path and name or a :class:`FileInfo`
                object of the file from which to read.
            **kwargs: Additional key word arguments. They are only passed on
                if the *reader* function declares more than one parameter.

        Returns:
            An object containing the file's content (e.g. numpy array, etc.).

        Raises:
            NotImplementedError: If no *reader* function was set.
        """
        if self.reader is None:
            raise NotImplementedError(
                "This file handler does not support reading data from a file. "
                "You should use a different file handler.")

        # Some functions do not accept additional key word arguments (via
        # kwargs).
        if self._takes_more_than(self.reader, 1):
            return self.reader(filename, **kwargs)
        return self.reader(filename)

    @expects_file_info(pos=2)
    def write(self, data, filename, **kwargs):
        """Store a data object to a file.

        Notes:
            This is the base class method. It only delegates to the *writer*
            function given during initialisation.

        Args:
            data: Object with data (e.g. numpy array, etc.).
            filename: A string containing path and name or a :class:`FileInfo`
                object to which to store the data. Existing files will be
                overwritten.
            **kwargs: Additional key word arguments. They are only passed on
                if the *writer* function declares more than two parameters.

        Returns:
            None

        Raises:
            NotImplementedError: If no *writer* function was set.
        """
        if self.writer is None:
            raise NotImplementedError(
                "This file handler does not support writing data to a file. "
                "You should use a different file handler.")

        if self._takes_more_than(self.writer, 2):
            self.writer(data, filename, **kwargs)
        else:
            self.writer(data, filename)

        return None

    def _ensure_local_filesystem(self, file_info):
        """Raise NotImplementedError if *file_info* is not on a local file
        system."""
        if not isinstance(file_info.file_system, LocalFileSystem):
            raise NotImplementedError(
                    f"File handler {type(self).__name__:s} can only "
                    "read from local file system, not from "
                    f"{str(type(file_info.file_system).__name__)}")



class FileInfo(os.PathLike):
    """Container of information about a file (time coverage, etc.)

    This is a simple object that holds the path and name, time coverage and
    further attributes of a file. It fulfills the os.PathLike protocol, i.e.
    you can use it as filename argument for the most python functions.

    See this Example:

    .. code-block:: python

        # Initialise a FileInfo object that points to a file
        file_info = FileInfo(
            path="path/to/a/file.txt",
            # The time coverage of the file (needed by Dataset classes)
            times=[datetime(2018, 1, 1), datetime(2018, 1, 10)],
            # Additional attributes:
            attr={},
        )

        with open(file_info) as file:
            ...

        # If you need to access the path or other attributes directly, you can
        # do it like this:
        file_info.path   # "path/to/a/file.txt"
        file_info.times  # [datetime(2018, 1, 1), datetime(2018, 1, 10)]
        file_info.attr   # {}
    """

    # Layout of the timestamps used by to_json_dict() and from_json_dict()
    _JSON_TIME_FORMAT = "%Y-%m-%dT%H:%M:%S.%f"

    def __init__(self, path=None, times=None, attr=None, fs=None):
        """Initialise a FileInfo object.

        Args:
            path: Absolute path to a file.
            times: A list or tuple of two datetime objects indicating start and
                end time of the file.
            attr: A dictionary with further attributes.
            fs: Implementation of fsspec file system. If not given, a
                LocalFileSystem object is used.
        """
        super(FileInfo, self).__init__()

        self._path = None
        self.path = path

        self._times = None
        self.times = times

        if attr is None:
            self.attr = {}
        else:
            self.attr = attr

        self.file_system = fs or LocalFileSystem()

    def __eq__(self, other):
        return (isinstance(other, type(self))
                and self.path == other.path
                and self.times == other.times)

    def __fspath__(self):
        return self.path

    def __hash__(self):
        # With this we can use this FileInfo object also as a key in a
        # dictionary
        return hash(self.path)

    def __repr__(self):
        return f"FileInfo(\n  '{self.path}',\n" \
               f"  times={self.times},\n" \
               f"  attr={self.attr},\n" \
               f"  fs={self.file_system})"

    def __str__(self):
        return self.path

    def copy(self):
        """Return a shallow copy of this object."""
        return copy(self)

    @classmethod
    def from_json_dict(cls, json_dict):
        """Create a FileInfo object from a dictionary as returned by
        :meth:`to_json_dict`.

        Args:
            json_dict: A dictionary with the keys *path*, *times* and *attr*.
                *times* must hold two entries, each either None or a
                timestamp string in the format `%Y-%m-%dT%H:%M:%S.%f`.

        Returns:
            A new object of this class.
        """
        times = []
        for i in range(2):
            stamp = json_dict["times"][i]
            if stamp is None:
                # An unknown time stays None (and is not wrapped in a list)
                times.append(None)
            else:
                times.append(
                    datetime.strptime(stamp, cls._JSON_TIME_FORMAT))

        return cls(json_dict["path"], times, json_dict["attr"])

    @property
    def path(self):
        return self._path

    @path.setter
    def path(self, value):
        if isinstance(value, FileInfo):
            raise ValueError("You cannot set path to a FileInfo object.")
        self._path = value

    @property
    def times(self):
        return self._times

    @times.setter
    def times(self, value):
        if value is None:
            self._times = [None, None]
        else:
            self._times = list(value)
            if len(self._times) != 2:
                raise ValueError("FileInfo.times can only be a list of two "
                                 "timestamps!")

    def update(self, other_info, ignore_none_time=True):
        """Update this object with another FileInfo object.

        Args:
            other_info: A FileInfo object.
            ignore_none_time: If the start time or end time of *other_info* is
                set to None, it does not overwrite the corresponding time of
                this object.

        Returns:
            None
        """
        # Passing the dictionary itself (instead of unpacking it as keyword
        # arguments) also allows attribute keys that are not strings.
        self.attr.update(other_info.attr)

        if other_info.times[0] is not None or not ignore_none_time:
            self.times[0] = other_info.times[0]
        if other_info.times[1] is not None or not ignore_none_time:
            self.times[1] = other_info.times[1]

    def to_json_dict(self):
        """Return path, times and attributes as dictionary.

        The times are converted to strings in the format
        `%Y-%m-%dT%H:%M:%S.%f`; a time that is None stays None. The result
        can be converted back with :meth:`from_json_dict`.
        """
        return {
            "path": self.path,
            "times": [
                None if stamp is None
                else stamp.strftime(self._JSON_TIME_FORMAT)
                for stamp in self.times
            ],
            "attr": self.attr,
        }





class CSV(FileHandler):
    """File handler that can read / write data from / to a CSV file

    A CSV file is file containing data separated by commas (or by any other
    delimiter).
    """

    def __init__(self, info=None):
        """Initializes a CSV file handler class.

        Args:
            info: A function that returns a :class:`FileInfo` object of a
                given file.
        """
        # Call the base class initializer
        super().__init__(info=info)

    @expects_file_info()
    def read(self, file_info, fields=None, **kwargs):
        """Read a CSV file and return an xarray.Dataset with its content

        The file is opened in text mode via the file system of *file_info*.

        Args:
            file_info: Path and name of the file as string or FileInfo object.
            fields: Field that you want to extract from the file. If not given,
                all fields are going to be extracted.
            **kwargs: Additional keyword arguments for the pandas function
                `pandas.read_csv`. See for more details:
                https://pandas.pydata.org/pandas-docs/stable/generated/pandas.read_csv.html

        Returns:
            A xarray.Dataset object.
        """

        with file_info.file_system.open(file_info.path, "rt") as fp:
            data = pd.read_csv(fp, **kwargs).to_xarray()

        if fields is None:
            return data
        return data[fields]

    @expects_file_info(pos=2)
    def write(self, data, file_info, **kwargs):
        """Write a xarray.Dataset to a CSV file.

        Args:
            data: The xarray.Dataset object that should be saved.
            file_info: Path and name of the file as string or FileInfo object.
            **kwargs: Additional keyword arguments for
                `pandas.Dataframe.to_csv`. See for more details:
                https://pandas.pydata.org/pandas-docs/stable/generated/pandas.DataFrame.to_csv.html

        Returns:
            None
        """
        # NOTE(review): unlike read(), this hands the plain path to pandas
        # and does not go through file_info.file_system - confirm whether
        # writing to non-local file systems is meant to be supported.
        data.to_dataframe().to_csv(file_info.path, **kwargs)





class HDF4(FileHandler):
    """File handler that can read data from a HDF4 file
    """

    def __init__(self, info=None):
        """Initializes a HDF4 file handler class.

        Args:
            info: A function that returns a :class:`FileInfo` object of a
                given file.

        Raises:
            ImportError: If pyhdf could not be imported.
        """
        if not pyhdf_is_installed:
            raise ImportError("Could not import pyhdf, which is necessary for "
                              "reading HDF4 files!")

        # Call the base class initializer
        super().__init__(info=info)

    @expects_file_info()
    def read(self, file_info, fields=None, mapping=None):
        """Read and parse HDF4 files and load them to a xarray.Dataset

        Args:
            file_info: Path and name of the file as string or FileInfo object.
            fields: Field names that you want to extract from this file as a
                list. This is mandatory, loading the complete file is not
                implemented.
            mapping: A dictionary that maps old field names to new field names.
                If given, `fields` must contain the old field names.

        Returns:
            A xarray.Dataset object.

        Raises:
            NotImplementedError: If *fields* is None or the file is not on a
                local file system.
        """

        self._ensure_local_filesystem(file_info)
        if fields is None:
            raise NotImplementedError(
                "You have to set field names. Loading the complete file is not"
                " yet implemented!"
            )

        dataset = xr.Dataset()

        # Files in HDF4 format are not very pretty. This code is taken from
        # http://hdfeos.org/zoo/OTHER/2010128055614_21420_CS_2B-GEOPROF_GRANULE_P_R04_E03.hdf.py
        # and adapted by John Mrziglod.

        file = HDF.HDF(file_info.path)

        # Errors are simply passed on to the caller, but the file is closed
        # in any case.
        try:
            vs = file.vstart()

            for field in fields:
                # Add the field data to the dataset.
                dataset[field] = self._get_field(vs, field)
        finally:
            file.close()

        return _xarray_rename_fields(dataset, mapping)

    @staticmethod
    def _get_field(vs, field):
        """Read all records of one vdata and return them as xarray.DataArray

        Args:
            vs: The object returned by the `vstart` method of the opened file.
            field: Name of the vdata.

        Returns:
            A xarray.DataArray with the records; dimensions of length one are
            squeezed.
        """
        field_id = vs.find(field)

        if field_id == 0:
            # Field was not found.
            warnings.warn(
                "Field '{0}' was not found!".format(field), RuntimeWarning
            )

        vdata = vs.attach(field_id)
        try:
            nrecs, _, _, _, _ = vdata.inquire()
            raw_data = vdata.read(nRec=nrecs)
            return xr.DataArray(raw_data).squeeze()
        finally:
            # Release the vdata even if reading failed.
            vdata.detach()



class HDF5(FileHandler):
    """File handler for SEVIRI level 1.5 HDF files
    """

    def __init__(self, **kwargs):
        """Initialize a HDF5 file handler object.

        Args:
            **kwargs: Additional key word arguments for base class.

        Raises:
            ImportError: If h5py could not be imported.
        """
        if not h5py_is_installed:
            raise ImportError("Could not import h5py, which is necessary for "
                              "reading HDF5 files!")

        # Call the base class initializer
        super().__init__(**kwargs)

    @expects_file_info()
    def read(self, file_info, fields=None, mapping=None, **kwargs):
        """Read SEVIRI HDF5 files and load them to a xarray.Dataset

        Args:
            file_info: Path and name of the file as string or FileInfo object.
            fields: Names of the fields that should be read. This is
                mandatory, loading the complete file is not implemented.
            mapping: A dictionary that maps old field names to new field
                names. The renaming is done after reading, i.e. `fields` must
                contain the old field names.
            **kwargs: Additional keyword arguments for
                :func:`xarray.decode_cf`.

        Returns:
            A xarray.Dataset object.

        Raises:
            NotImplementedError: If *fields* is None or the file is not on a
                local file system.
            KeyError: If one of *fields* is not in the file.
        """

        self._ensure_local_filesystem(file_info)
        if fields is None:
            raise NotImplementedError(
                "Loading complete HDF5 files without giving explicit field "
                "names is not yet implemented!"
            )

        # keys are dimension size, values are dimension names
        # NOTE(review): axes of equal length share one dimension name, also
        # within a single field (e.g. a square array) - confirm that this is
        # intended.
        dim_dict = {}

        # Load the dataset from the file:
        with h5py.File(file_info.path, 'r') as file:
            dataset = xr.Dataset()

            for field in fields:
                if field not in file:
                    raise KeyError(f"No field named '{field}'!")

                dims = []
                for dim_size in file[field].shape:
                    dim_name = dim_dict.get(dim_size)
                    if dim_name is None:
                        dim_name = f"dim_{len(dim_dict)}"
                        dim_dict[dim_size] = dim_name

                    dims.append(dim_name)

                dataset[field] = xr.DataArray(
                    file[field], dims=dims,
                    # Currently, some attributes may contain byte-strings that
                    # are not nice for further processing
                    attrs={},  # dict(file[field].attrs)
                )

            # decode_cf returns a new dataset instead of changing the given
            # one, so the result has to be kept.
            dataset = xr.decode_cf(dataset, **kwargs)
            # Load the data into memory while the file is still open.
            dataset.load()

        return _xarray_rename_fields(dataset, mapping)



class NetCDF4(FileHandler):
    """File handler that can load / store xarray.Dataset from / to NetCDF4

    This file handler can also handle pseudo groups in :class:`xarray.Dataset`
    objects.
    """

    def __init__(self, **kwargs):
        """Initialize a NetCDF4 file handler class

        Args:
            **kwargs: Keyword arguments for the base class, e.g. *info*: You
                cannot use the :meth:`get_info` without giving a function
                here that returns a FileInfo object.
        """
        # Call the base class initializer
        super().__init__(**kwargs)

    @expects_file_info()
    def read(self, file_info, fields=None, mapping=None, **kwargs):
        """Read and parse NetCDF files and load them to a xarray.Dataset

        Args:
            file_info: Path and name of the file as string or FileInfo object.
            fields: List of field names that should be read. The other fields
                will be ignored. Variables in groups are addressed by their
                full name (e.g. `group/variable`).
            mapping: A dictionary which is used for renaming the fields. The
                renaming is done after reading, i.e. if given, `fields` must
                contain the old field names.
            **kwargs: Additional keyword arguments for
                :func:`xarray.decode_cf` such as `mask_and_scale`, etc.

        Returns:
            A xarray.Dataset object.

        Examples:

            .. code-block:: python

                from typhon.files import NetCDF4

                fh = NetCDF4()
                data = fh.read("filename.nc")

                # OR if you want to load only some fields:
                data = fh.read("filename.nc", fields=["temp", "lat", "lon"])

        """
        self._ensure_local_filesystem(file_info)
        # xr.open_dataset does still not support loading all groups from a
        # file except a very cumbersome (and expensive) way by using the
        # parameter `group`. To avoid this, we load all groups and their
        # variables by using the netCDF4 directly and load them later into a
        # xarray dataset.

        with netCDF4.Dataset(file_info.path, "r") as root:
            # xarray decode_cf scales, don't do it twice!
            root.set_auto_scale(False)
            dataset = xr.Dataset()
            self._load_group(dataset, None, root, fields)

            dataset = xr.decode_cf(dataset, **kwargs)

        return _xarray_rename_fields(dataset, mapping)

    @staticmethod
    def _get_dimension_name(ds, group, path, dim):
        """Return the name that the dimension *dim* of *group* gets in *ds*

        Args:
            ds: The xarray.Dataset that has been filled so far.
            group: The netCDF4 group that is currently loaded.
            path: Path of *group* with trailing slash (empty string for the
                root group).
            dim: Name of the dimension inside *group*.

        Returns:
            Either `path + dim` or the name of a dimension of an ancestor
            group that is already in *ds* and has the same size.
        """
        # If the dimension is defined in the subgroup, use NOT the one of the
        # parent group:
        if dim in group.variables or path == "":
            # use the subgroup dimension!
            return path + dim

        # Go through all ancestor groups (start with the parent, then
        # grandparent, etc.) and check whether there is a dimension that suits:
        ancestor_groups = [None] + path[:-1].split("/")[:-1]

        for i, ancestor_group in enumerate(reversed(ancestor_groups)):
            if ancestor_group is None:
                # The root group has no prefix
                ancestor_dim = dim
            else:
                ancestor_dim = "/".join(
                    ancestor_groups[1:len(ancestor_groups) - i] + [dim])

            # `sizes` is the mapping from dimension names to their lengths
            ancestor_size = ds.sizes.get(ancestor_dim, None)

            if ancestor_size is not None \
                    and group.dimensions[dim].size == ancestor_size:
                # use the ancestor dimension:
                return ancestor_dim

        # use the subgroup dimension!
        return path + dim

    @staticmethod
    def _load_group(ds, path, group, fields):
        """Load the variables of *group* and all its sub groups into *ds*

        Args:
            ds: The xarray.Dataset that is filled in place.
            path: Path of *group* without trailing slash or None for the root
                group.
            group: The netCDF4 group to load.
            fields: Full names of the variables that should be loaded or None
                for loading all.

        Raises:
            KeyError: If loading a variable raised a RuntimeError.
        """
        if path is None:
            # The current group is the root group
            path = ""
            ds.attrs = dict(group.__dict__)
        else:
            path += "/"

        # Dimension (coordinate) mapping: A dimension might be defined in a
        # group, then it is valid for this group only. Otherwise, the
        # dimension from the parent group is taken (if it suits with name and
        # size)
        dim_map = {
            dim: NetCDF4._get_dimension_name(ds, group, path, dim)
            for dim in group.dimensions
        }

        # Load variables:
        for var_name, var in group.variables.items():
            full_name = path + var_name
            if fields is not None and full_name not in fields:
                continue

            try:
                dims = [dim_map[dim] for dim in var.dimensions]
                # Read the data only once
                values = var[:]
                if len(dims) == 0 and values is np.ma.masked:
                    # A masked scalar is stored as NaN
                    values = np.nan
                ds[full_name] = dims, values, dict(var.__dict__)
            except RuntimeError as err:
                raise KeyError(
                    f"Could not load the variable {full_name}!") from err

        # Do the same for all sub groups:
        for sub_group_name, sub_group in group.groups.items():
            NetCDF4._load_group(
                ds, path + sub_group_name, sub_group, fields
            )

    @expects_file_info(pos=2)
    def write(self, data, filename, **kwargs):
        """Save a xarray.Dataset to a NetCDF4 file

        Args:
            data: A xarray.Dataset object. It may contain 'pseudo' groups (i.e.
                variables with */* in their names). Those variables will be
                saved in subgroups.
            filename: A string or a :class:`FileInfo` object with the path
                where the data should be stored.
            **kwargs: Additional keyword arguments for
                `xarray.Dataset.to_netcdf`. *mode* (default is "w") is only
                used for the first group that is written, the others are
                appended.

        Returns:
            None

        Examples:

            .. code-block:: python

                from typhon.files import NetCDF4
                import xarray as xr

                fh = NetCDF4()
                data = xr.Dataset({
                    "data/temperature": ("time", [0, 1]),
                    "lat": ("time", [0, 1]),
                    "lon": ("time", [0, 1]),
                }, coords={
                    "time": ("time", [0, 1]),
                })

                # Save the dataset:
                fh.write(data, "filename.nc")
        """
        group_vars = defaultdict(list)

        # Get the variables for the different groups:
        for full_name in data.variables:
            group, _ = NetCDF4._split_path(full_name)
            group_vars[group].append(full_name)

        # If we are writing out multiple groups, we do not want to overwrite
        # the last file:
        user_mode = kwargs.pop("mode", "w")
        already_opened = False
        for group, variables in group_vars.items():
            ds = data[variables]

            # We do not want to store global coordinates in each subgroup.
            # Hence, we drop them before saving the group:
            coords_to_drop = [
                coord
                for coord in ds.coords.keys()
                if NetCDF4._split_path(coord)[0] != group
            ]
            ds = ds.drop_vars(coords_to_drop)

            # Remove the group name from all variables (incl. dimensions):
            mapping = {
                full: NetCDF4._split_path(full)[1]
                for full in ds.data_vars
            }
            ds = ds.rename(mapping)
            mapping = {
                full: NetCDF4._split_path(full)[1]
                for full in ds.coords
            }
            ds = ds.rename(mapping)
            mapping = {
                dim: NetCDF4._split_path(dim)[1]
                for dim in ds.dims
            }
            ds = ds.rename(mapping)

            ds.to_netcdf(
                filename.path, group=group,
                mode="a" if already_opened else user_mode,
                **kwargs
            )
            already_opened = True

    @staticmethod
    def _split_path(path):
        """Split a full variable name into group path and variable name

        The group is None if *path* does not contain a slash.
        """
        if "/" not in path:
            return None, path
        return path.rsplit("/", 1)

    def _ensure_local_filesystem(self, file_info):
        """Raise NotImplementedError if *file_info* is not on a local file
        system."""
        if not isinstance(file_info.file_system, LocalFileSystem):
            raise NotImplementedError(
                    f"File handler {type(self).__name__:s} can only "
                    "read from local file system, not from "
                    f"{str(type(file_info.file_system).__name__)}. "
                    "Use FSNetCDF instead.")



class FSNetCDF(FileHandler):
    """File handler for reading NetCDF files via alternate file systems.

    Alternative to the NetCDF file handler for reading files from
    alternative file systems, such as remote file systems.  Does not
    support writing or multi-group files.

    The datasets returned by :meth:`read` stay open until :meth:`close_all`
    is called or this object is deleted.

    Usage example with fileset::

        fs = FileSet(
                path=(
                    "noaa-goes16/GLM-L2-LCFA/{year}/{doy}/{hour}/"
                    "OR_GLM-L2-LCFA_G16_s{year}{doy}{hour}{minute}{second}*_"
                    "e{end_year}{end_doy}{end_hour}{end_minute}{end_second}*_c*.nc"),
                fs=s3fs.S3FileSystem(anon=True),
                handler=FSNetCDF())

        finf = fs.find_closest(datetime.datetime(2021, 11, 10, 10))
        fs.read(finf)
    """

    def __init__(self, *args, **kwargs):
        """Initialize the handler, all arguments are passed to the base
        class."""
        super().__init__(*args, **kwargs)
        # Datasets returned by read() that have not been closed yet
        self._open = []
        # The file objects those datasets read from
        self._open_files = []

    @expects_file_info()
    def read(self, file_info, fields=None, mapping=None, **kwargs):
        """Read possibly remote NetCDF file.

        Args:
            file_info: Path and name of the file as string or FileInfo object.
                The file is opened via its file system.
            fields: Not used by this handler.
            mapping: Not used by this handler.
            **kwargs: Not used by this handler.

        Returns:
            A xarray.Dataset object, opened with the h5netcdf engine.
        """
        fp = file_info.file_system.open(file_info.path)
        try:
            ds = xr.open_dataset(fp, engine="h5netcdf")
        except Exception:
            # Do not leave the file object behind if it cannot be read
            fp.close()
            raise

        self._open.append(ds)
        self._open_files.append(fp)
        return ds

    def close_all(self):
        """Close all open files."""
        # getattr: the lists do not exist if __init__ did not complete
        datasets = getattr(self, "_open", [])
        while datasets:
            datasets.pop(0).close()

        # Closing a dataset does not necessarily close the file object that
        # was handed to xarray, so close those explicitly.
        files = getattr(self, "_open_files", [])
        while files:
            files.pop(0).close()

    def __del__(self):
        self.close_all()



class Plotter(FileHandler):
    """File handler that can save matplotlib.figure objects to a file.

    This is a specialised file handler object that can just store
    matplotlib.figure objects. It cannot read from a file nor get the time
    coverage from one. This is designed for having a simple plot dataset as
    output.
    """

    def __init__(self, fig_args=None, **kwargs):
        """Initializes a Plotter file handler class.

        Args:
            fig_args: A dictionary of additional keyword arguments for the
                fig.savefig method.
            **kwargs: Additional keyword arguments for the base class.
        """
        # Call the base class initializer
        super().__init__(**kwargs)

        if fig_args is None:
            self.fig_args = {}
        else:
            self.fig_args = fig_args

    @expects_file_info(pos=2)
    def write(self, figure, filename, fig_args=None):
        """ Saves a matplotlib.figure object to a file.

        Args:
            figure: A matplotlib.figure object.
            filename: Path and name of the file as string or FileInfo object.
            fig_args: A dictionary of additional keyword arguments for the
                fig.savefig method. This updates the *fig_args* given during
                initialisation (for this call only).

        Returns:
            The return value of `figure.savefig`.
        """

        # Work on a copy so that the defaults of this object stay untouched
        params = self.fig_args.copy()
        if fig_args is not None:
            params.update(fig_args)

        return figure.savefig(filename.path, **params)




# class Numpy(handlers.FileHandler):
#     def __init__(self, **kwargs):
#         # Call the base class initializer
#         super().__init__(**kwargs)
#
#     def get_info(self, filename):
#         # Get info parameters from a file (time coverage, etc)
#         ...
#
#     def read(self, filename, fields=None):
#         """ Reads and parses files with numpy arrays and load them to a xarray.
#
#         See the base class for further documentation.
#         """
#         numpy_data = np.load(filename)
#         print(numpy_data.keys())
#         data = xarray.Dataset.from_dict(numpy_data)
#
#         return data
#
#     def write(self, filename, data):
#         """ Writes a xarray to a NetCDF file.
#
#         See the base class for further documentation.
#         """
#
#         # Data must be a xarray object!
#         data_dict = data.to_dict()
#         np.save(filename, data_dict)
#
#
# class Pickle(handlers.FileHandler):
#     def __init__(self, **kwargs):
#         # Call the base class initializer
#         super().__init__(**kwargs)
#
#     def get_info(self, filename):
#         # Get info parameters from a file (time coverage, etc)
#         ...
#
#     def read(self, filename, fields=None):
#         """ Reads and parses files with numpy arrays and load them to a xarray.
#
#         See the base class for further documentation.
#         """
#
#         with open(filename, 'rb') as file:
#             return pickle.load(file)
#
#     def write(self, filename, data):
#         """ Writes a xarray to a NetCDF file.
#
#         See the base class for further documentation.
#         """
#
#         with open(filename, 'wb') as file:
#             pickle.dump(data, file)
#
#
# class XML(handlers.FileHandler):
#     def __init__(self, **kwargs):
#         # Call the base class initializer
#         super().__init__(**kwargs)
#
#     def get_info(self, filename):
#         # Get info parameters from a file (time coverage, etc)
#         ...
#
#     def read(self, filename, fields=None):
#         """ Reads and parses NetCDF files and load them to a xarray.
#
#         See the parent class for further documentation.
#         """
#         #
#         return typhon.arts.xml.load(filename)
#
#     def write(self, filename, data):
#         """ Writes a xarray to a NetCDF file.
#
#         See the base class for further documentation.
#         """
#
#         # Data must be a xarray object!
#         typhon.arts.xml.save(data, filename)