Source code for my_code_base.stats.xarray_utils

# %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
# Author: Markus Ritschel
# eMail:  git@markusritschel.de
# Date:   2024-06-19
# %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
#
import logging
import xarray as xr
from multipledispatch import dispatch
from .timeseries import extend_annual_series, weighted_annual_mean


log = logging.getLogger(__name__)



[docs]
@xr.register_dataset_accessor("stats")
@xr.register_dataarray_accessor("stats")
class StatsAccessor:
    """
    This class provides statistical operations on xarray data.

    Parameters
    ----------
    obj : xarray.Dataset or xarray.DataArray
        The xarray object on which statistical operations will be performed.

    Methods
    -------
    weighted_mean(dim)
        Calculate the weighted mean based on the given dimension.
    """

    def __init__(self, obj):
        self._obj = obj

    @dispatch(str)
    def weighted_mean(self, dim):
        """
        Calculate the weighted annual mean (taking days of months into account).

        Parameters
        ----------
        dim : str
            The dimension along which to calculate the weighted mean.

        Returns
        -------
        weighted_mean : xarray.Dataset or xarray.DataArray
            The weighted annual mean.

        """
        log.debug(f"Identified single dimension {dim}. Building weighted annual mean.")
        return weighted_annual_mean(self._obj)

    def _is_annual(self):
        """
        Check if the xarray object has a 'year' dimension.

        Returns
        -------
        bool
            True if the xarray object has a 'year' dimension, False otherwise.
        """
        return 'year' in self._obj.dims


[docs]
    def fill_months_with_annual_value(self):
        """
        Fill the xarray object with annual values for each month.

        Returns
        -------
        xarray.Dataset or xarray.DataArray
            The xarray object with extended annual series.

        Raises
        ------
        ValueError
            If the time series is not of yearly frequency.
        """
        ds = self._obj
        if not self._is_annual():
            raise ValueError("Time series is not of yearly frequency.")
        return extend_annual_series(ds)