timemean.py 10.9 KB
Newer Older
"""Time mean diagnostics"""
import iris
import iris.coord_categorisation
import iris.analysis
import iris.exceptions

import numpy as np
from bscearth.utils.log import Log
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
from earthdiagnostics.diagnostic import (
    Diagnostic,
    DiagnosticOption,
    DiagnosticDomainOption,
    DiagnosticFrequencyOption,
    DiagnosticVariableOption,
)
from earthdiagnostics.frequency import Frequencies
from earthdiagnostics.utils import TempFile, Utils


class TimeMean(Diagnostic):
    """
    Base class for all time mean diagnostics

    :param data_manager: data management object
    :type data_manager: DataManager
    :param startdate: startdate
    :type startdate: str
    :param member: member number
    :type member: int
    :param chunk: chunk's number
    :type chunk: int
    :param variable: variable's name
    :type variable: str
    :param domain: variable's domain
    :type domain: ModelingRealm
    :param frequency: original frequency
    :type frequency: str
    :param grid: original data grid
    :type grid: str
    """

Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
    def __init__(
        self,
        data_manager,
        startdate,
        member,
        chunk,
        domain,
        variable,
        frequency,
        grid,
    ):
        Diagnostic.__init__(self, data_manager)
        self.startdate = startdate
        self.member = member
        self.chunk = chunk
        self.variable = variable
        self.domain = domain
        self.frequency = frequency
        self.grid = grid
        self._target_frequency = None
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed

        self.variable_file = None
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
        return (
            "Calculate {0._target_frequency} mean "
            "Startdate: {0.startdate} Member: {0.member} Chunk: {0.chunk} "
            "Variable: {0.domain}:{0.variable} "
            "Original frequency: {0.frequency} Grid: {0.grid}".format(self)
        )
        if self._different_type(other):
            return False
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
        return (
            self.startdate == other.startdate
            and self.member == other.member
            and self.chunk == other.chunk
            and self.domain == other.domain
            and self.variable == other.variable
            and self.frequency == other.frequency
            and self.grid == other.grid
            and self._target_frequency == other._target_frequency
        )

    @classmethod
    def _process_options(cls, diags, options):
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
        options_available = (
            DiagnosticDomainOption(),
            DiagnosticVariableOption(diags.data_manager.config.var_manager),
            DiagnosticFrequencyOption(),
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
            DiagnosticOption("grid", ""),
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
        )
        options = cls.process_options(options, options_available)
        return options

    @classmethod
    def generate_jobs(cls, diags, options):
        """
        Create a job for each chunk to compute the diagnostic

        :param diags: Diagnostics manager class
        :type diags: Diags
        :param options: variable, domain, frequency=day, grid=''
        :type options: list[str]
        :return:
        """
        options = cls._process_options(diags, options)
        job_list = list()
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
        chunk_list = diags.config.experiment.get_chunk_list()
        for startdate, member, chunk in chunk_list:
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
            job_list.append(
                cls(
                    diags.data_manager,
                    startdate,
                    member,
                    chunk,
                    options["domain"],
                    options["variable"],
                    options["frequency"],
                    options["grid"],
                )
            )
        return job_list

    def request_data(self):
        """Request data required by the diagnostic"""
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
        self.variable_file = self.request_chunk(
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
            self.domain,
            self.variable,
            self.startdate,
            self.member,
            self.chunk,
            frequency=self.frequency,
            grid=self.grid,
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
        )
        Compute the time mean

        Parameters
        ----------
        raise NotImplementedError()

    def compute(self):
        """Run the diagnostic"""
        temp = TempFile.get()
        Log.info('Load data')
        cube = iris.load_cube(self.variable_file.local_file)
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
        time_centered = [
            coord
            for coord in cube.coords()
            if coord.var_name == "time_centered"
        ]
        if time_centered:
            cube.remove_coord(time_centered[0])
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
        iris.coord_categorisation.add_day_of_month(cube, "time")
        iris.coord_categorisation.add_month_number(cube, "time")
        iris.coord_categorisation.add_year(cube, "time")
        Log.info('Compute mean')
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
        cube.remove_coord("day_of_month")
        cube.remove_coord("month_number")
        cube.remove_coord("year")
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
            region_coord = cube.coord("region")
            cube.remove_coord(region_coord)
        except iris.exceptions.CoordinateNotFoundError:
            region_coord = None
        cube.data
        iris.save(cube, temp)
        if region_coord:
            handler = Utils.open_cdf(temp)
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
            region = handler.createVariable("region", str, ("dim0",))
            region.standard_name = region_coord.standard_name
            region[...] = region_coord.points.astype(np.dtype(str))

Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
            handler.variables[self.variable].coordinates += " region"
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
            Utils.rename_variable(temp, "dim0", "region", False)


class DailyMean(TimeMean):
    """
    Calculates daily mean for a given variable
    :param data_manager: data management object
    :type data_manager: DataManager
    :param startdate: startdate
    :type startdate: str
    :param member: member number
    :type member: int
    :param chunk: chunk's number
    :type chunk: int
    :param variable: variable's name
    :type variable: str
    :param domain: variable's domain
    :type domain: ModelingRealm
    :param frequency: original frequency
    :type frequency: str
    :param grid: original data grid
    :type grid: str
    """

Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
    alias = "daymean"
    "Diagnostic alias for the configuration file"
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed

Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
    def __init__(
        self,
        data_manager,
        startdate,
        member,
        chunk,
        domain,
        variable,
        frequency,
        grid,
    ):
        TimeMean.__init__(
            self,
            data_manager,
            startdate,
            member,
            chunk,
            domain,
            variable,
            frequency,
            grid,
        )
        self._target_frequency = "daily"
        Compute the time mean
        Parameters
        ----------
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
        return cube.aggregated_by(
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
            ["day_of_month", "month_number", "year"], iris.analysis.MEAN
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
        )

    def declare_data_generated(self):
        """Declare data to be generated by the diagnostic"""
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
        self.mean_file = self.declare_chunk(
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
            self.domain,
            self.variable,
            self.startdate,
            self.member,
            self.chunk,
            frequency=Frequencies.daily,
            grid=self.grid,
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
        )


class MonthlyMean(TimeMean):
    """
    Calculates monthly mean for a given variable
    :param data_manager: data management object
    :type data_manager: DataManager
    :param startdate: startdate
    :type startdate: str
    :param member: member number
    :type member: int
    :param chunk: chunk's number
    :type chunk: int
    :param variable: variable's name
    :type variable: str
    :param domain: variable's domain
    :type domain: ModelingRealm
    :param frequency: original frequency
    :type frequency: str
    :param grid: original data grid
    :type grid: str
    """

Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
    alias = "monmean"
    "Diagnostic alias for the configuration file"
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed

Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
    def __init__(
        self,
        data_manager,
        startdate,
        member,
        chunk,
        domain,
        variable,
        frequency,
        grid,
    ):
        TimeMean.__init__(
            self,
            data_manager,
            startdate,
            member,
            chunk,
            domain,
            variable,
            frequency,
            grid,
        )
        self._target_frequency = "monthly"
        Compute the time mean
        Parameters
        ----------
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
        return cube.aggregated_by(["month_number", "year"], iris.analysis.MEAN)

    def declare_data_generated(self):
        """Declare data to be generated by the diagnostic"""
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
        self.mean_file = self.declare_chunk(
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
            self.domain,
            self.variable,
            self.startdate,
            self.member,
            self.chunk,
            frequency=Frequencies.monthly,
            grid=self.grid,
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
        )


class YearlyMean(TimeMean):
    """
    Calculates monthly mean for a given variable
    :param data_manager: data management object
    :type data_manager: DataManager
    :param startdate: startdate
    :type startdate: str
    :param member: member number
    :type member: int
    :param chunk: chunk's number
    :type chunk: int
    :param variable: variable's name
    :type variable: str
    :param domain: variable's domain
    :type domain: ModelingRealm
    :param frequency: original frequency
    :type frequency: str
    :param grid: original data grid
    :type grid: str
    """
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
    alias = "yearmean"
    "Diagnostic alias for the configuration file"
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed

Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
    def __init__(
        self,
        data_manager,
        startdate,
        member,
        chunk,
        domain,
        variable,
        frequency,
        grid,
    ):
        TimeMean.__init__(
            self,
            data_manager,
            startdate,
            member,
            chunk,
            domain,
            variable,
            frequency,
            grid,
        )
        self._target_frequency = "yearly"
        Compute the time mean
        Parameters
        ----------
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
        return cube.aggregated_by(["year"], iris.analysis.MEAN)

    def declare_data_generated(self):
        """Declare data to be generated by the diagnostic"""
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
        self.mean_file = self.declare_chunk(
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
            self.domain,
            self.variable,
            self.startdate,
            self.member,
            self.chunk,
            frequency=Frequencies.yearly,
            grid=self.grid,
Javier Vegas-Regidor's avatar
Javier Vegas-Regidor committed
        )