From 6a66045d10d034f3e6babb5a91e088582945f257 Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Mon, 16 Oct 2017 16:26:10 +0200 Subject: [PATCH 01/47] Fixed basin bug --- earthdiagnostics/ocean/heatcontent.py | 11 ++++++----- earthdiagnostics/ocean/siasiesiv.py | 13 ++++++------- 2 files changed, 12 insertions(+), 12 deletions(-) diff --git a/earthdiagnostics/ocean/heatcontent.py b/earthdiagnostics/ocean/heatcontent.py index 31ac9268..9b8731ff 100644 --- a/earthdiagnostics/ocean/heatcontent.py +++ b/earthdiagnostics/ocean/heatcontent.py @@ -1,13 +1,14 @@ # coding=utf-8 import shutil +import numpy as np + from earthdiagnostics import cdftools +from earthdiagnostics.box import Box from earthdiagnostics.constants import Basins -from earthdiagnostics.utils import Utils, TempFile from earthdiagnostics.diagnostic import Diagnostic, DiagnosticBasinOption, DiagnosticIntOption -from earthdiagnostics.box import Box from earthdiagnostics.modelingrealm import ModelingRealms -import numpy as np +from earthdiagnostics.utils import Utils, TempFile class HeatContent(Diagnostic): @@ -159,9 +160,9 @@ class HeatContent(Diagnostic): box_save = self.box self.heatcsum = self.declare_chunk(ModelingRealms.ocean, 'heatcsum', self.startdate, self.member, self.chunk, - box=box_save, region=self.basin.fullname) + box=box_save, region=self.basin.name) self.heatcmean = self.declare_chunk(ModelingRealms.ocean, 'heatcvmean', self.startdate, self.member, self.chunk, - box=box_save, region=self.basin.fullname) + box=box_save, region=self.basin.name) def compute(self): """ diff --git a/earthdiagnostics/ocean/siasiesiv.py b/earthdiagnostics/ocean/siasiesiv.py index d16295a4..ec2bc5d4 100644 --- a/earthdiagnostics/ocean/siasiesiv.py +++ b/earthdiagnostics/ocean/siasiesiv.py @@ -1,17 +1,16 @@ # coding=utf-8 -import netCDF4 import os -from bscearth.utils.log import Log - -from earthdiagnostics.diagnostic import Diagnostic, DiagnosticBasinOption -from earthdiagnostics.utils import Utils, TempFile # noinspection PyUnresolvedReferences import earthdiagnostics.cdftoolspython as cdftoolspython +import netCDF4 import numpy as np +from bscearth.utils.log import Log -from earthdiagnostics.modelingrealm import ModelingRealms from earthdiagnostics.constants import Basins +from earthdiagnostics.diagnostic import Diagnostic, DiagnosticBasinOption +from earthdiagnostics.modelingrealm import ModelingRealms +from earthdiagnostics.utils import Utils, TempFile class Siasiesiv(Diagnostic): @@ -106,7 +105,7 @@ class Siasiesiv(Diagnostic): def _declare_var(self, var_name): self.generated[var_name] = self.declare_chunk(ModelingRealms.seaIce, var_name, self.startdate, self.member, - self.chunk, region=self.basin.fullname) + self.chunk, region=self.basin.name) def compute(self): """ -- GitLab From 0f746c314b8a41068f2c269f94bebe57dfa8d94e Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Tue, 17 Oct 2017 13:33:43 +0200 Subject: [PATCH 02/47] Fixed regionmean diagnostic error --- doc/source/conf.py | 2 +- earthdiagnostics/__init__.py | 9 ++--- earthdiagnostics/cmorizer.py | 1 - earthdiagnostics/datafile.py | 53 +++++++++++++++++++-------- earthdiagnostics/diagnostic.py | 2 + earthdiagnostics/ocean/interpolate.py | 6 +-- earthdiagnostics/ocean/regionmean.py | 9 ++++- earthdiagnostics/utils.py | 2 +- setup.py | 1 + 9 files changed, 56 insertions(+), 29 deletions(-) diff --git a/doc/source/conf.py b/doc/source/conf.py index 13a4d471..81114e45 100644 --- a/doc/source/conf.py +++ b/doc/source/conf.py @@ -12,8 +12,8 @@ # All configuration values have a default; values that are commented out # serve to show the default. -import sys import os +import sys # If extensions (or modules to document with autodoc) are in another directory, # add these directories to sys.path here. If the directory is relative to the diff --git a/earthdiagnostics/__init__.py b/earthdiagnostics/__init__.py index 75244852..e442aee3 100644 --- a/earthdiagnostics/__init__.py +++ b/earthdiagnostics/__init__.py @@ -2,13 +2,10 @@ """ Module containing the Earth Diagnostics. """ -from cdo import Cdo -from nco import Nco -from earthdiagnostics.cdftools import CDFTools import os -cdo = Cdo() -nco = Nco() -cdftools = CDFTools('/home/Earth/jvegas/CDFTOOLS_3.0/bin') +from earthdiagnostics.cdftools import CDFTools + +cdftools = CDFTools() DEVNULL = open(os.devnull, 'wb') diff --git a/earthdiagnostics/cmorizer.py b/earthdiagnostics/cmorizer.py index 7cf8c5c3..c4233ea2 100644 --- a/earthdiagnostics/cmorizer.py +++ b/earthdiagnostics/cmorizer.py @@ -430,7 +430,6 @@ class Cmorizer(object): netcdf_file.data_convention = self.config.data_convention netcdf_file.region = region - netcdf_file.frequency = frequency netcdf_file.domain = var_cmor.domain netcdf_file.var = var_cmor.short_name diff --git a/earthdiagnostics/datafile.py b/earthdiagnostics/datafile.py index ddaf1b10..809c489e 100644 --- a/earthdiagnostics/datafile.py +++ b/earthdiagnostics/datafile.py @@ -4,6 +4,7 @@ import os import shutil from datetime import datetime +import iris import numpy as np from bscearth.utils.log import Log @@ -150,8 +151,9 @@ class DataFile(Publisher): self._rename_coordinate_variables() self._correct_metadata() self._prepare_region() - self.add_diagnostic_history() + if self.region is not None: + self.upload() def upload(self): self.storage_status = StorageStatus.UPLOADING @@ -204,18 +206,21 @@ class DataFile(Publisher): def _fix_variable_name(self, var_handler): var_handler.standard_name = self.cmor_var.standard_name var_handler.long_name = self.cmor_var.long_name - # var_handler.short_name = self.cmor_var.short_name - def _fix_values_metadata(self, var_type): - if self.cmor_var.valid_min != '': - valid_min = '-a valid_min,{0},o,{1},"{2}" '.format(self.final_name, var_type.char, self.cmor_var.valid_min) - else: - valid_min = '' - if self.cmor_var.valid_max != '': - valid_max = '-a valid_max,{0},o,{1},"{2}" '.format(self.final_name, var_type.char, self.cmor_var.valid_max) - else: - valid_max = '' - Utils.nco.ncatted(input=self.local_file, output=self.local_file, + def _fix_values_metadata(self, var_type, file_path=None): + if file_path is None: + file_path = self.local_file + valid_min = '' + valid_max = '' + + if self.cmor_var is not None: + if self.cmor_var.valid_min != '': + valid_min = '-a valid_min,{0},o,{1},"{2}" '.format(self.final_name, var_type.char, self.cmor_var.valid_min) + + if self.cmor_var.valid_max != '': + valid_max = '-a valid_max,{0},o,{1},"{2}" '.format(self.final_name, var_type.char, self.cmor_var.valid_max) + + Utils.nco.ncatted(input=file_path, output=file_path, options=('-O -a _FillValue,{0},o,{1},"1.e20" ' '-a missingValue,{0},o,{1},"1.e20" {2}{3}'.format(self.final_name, var_type.char, valid_min, valid_max),)) @@ -273,10 +278,27 @@ class DataFile(Publisher): def _update_var_with_region_data(self): temp = TempFile.get() shutil.copyfile(self.remote_file, temp) + handler = Utils.openCdf(temp) + var_handler = handler.variables[self.final_name] + var_type = var_handler.dtype + handler.close() + self._fix_values_metadata(var_type, temp) + Utils.nco.ncks(input=temp, output=temp, options=['--mk_rec_dmn region']) handler = Utils.openCdf(temp) - handler_send = Utils.openCdf(self.local_file) - value = handler_send.variables[self.final_name][:] + var_handler = handler.variables[self.final_name] + if hasattr(var_handler, 'valid_min'): + del var_handler.valid_min + if hasattr(var_handler, 'valid_max'): + del var_handler.valid_max + handler.sync() + cubes = iris.load(self.local_file) + for cube in cubes: + if self.final_name == cube.var_name: + value = cube.data + break + if isinstance(value, np.ma.MaskedArray): + value = np.ma.getdata(value) var_region = handler.variables['region'] basin_index = np.where(var_region[:] == self.region) if len(basin_index[0]) == 0: @@ -285,9 +307,8 @@ class DataFile(Publisher): else: basin_index = basin_index[0][0] - handler.variables[self.final_name][..., basin_index] = value + handler.variables[self.final_name][..., basin_index] = np.multiply(np.ones(value.shape), value) handler.close() - handler_send.close() Utils.move_file(temp, self.local_file) def _add_region_dimension_to_var(self): diff --git a/earthdiagnostics/diagnostic.py b/earthdiagnostics/diagnostic.py index 4e90373d..e6bf4bb0 100644 --- a/earthdiagnostics/diagnostic.py +++ b/earthdiagnostics/diagnostic.py @@ -136,6 +136,8 @@ class Diagnostic(Publisher): region = region.name generated_chunk = self.data_manager.declare_chunk(domain, var, startdate, member, chunk, grid, region, box, diagnostic=self, vartype=vartype, frequency=frequency) + if region is not None: + generated_chunk.add_modifier(self) self._generated_files.append(generated_chunk) return generated_chunk diff --git a/earthdiagnostics/ocean/interpolate.py b/earthdiagnostics/ocean/interpolate.py index 262f8767..dab72b36 100644 --- a/earthdiagnostics/ocean/interpolate.py +++ b/earthdiagnostics/ocean/interpolate.py @@ -1,14 +1,14 @@ # coding=utf-8 +import os import shutil import threading -import os from bscearth.utils.log import Log + from earthdiagnostics.diagnostic import Diagnostic, DiagnosticOption, DiagnosticDomainOption, DiagnosticBoolOption, \ DiagnosticVariableListOption - -from earthdiagnostics.utils import Utils, TempFile from earthdiagnostics.modelingrealm import ModelingRealms +from earthdiagnostics.utils import Utils, TempFile class Interpolate(Diagnostic): diff --git a/earthdiagnostics/ocean/regionmean.py b/earthdiagnostics/ocean/regionmean.py index 1d6cebb8..bb4b93c8 100644 --- a/earthdiagnostics/ocean/regionmean.py +++ b/earthdiagnostics/ocean/regionmean.py @@ -159,7 +159,14 @@ class RegionMean(Diagnostic): temp2 = TempFile.get() Utils.nco.ncks(input=mean_file, output=temp2, options=('-v {0},lat,lon{1}'.format(original_name, levels),)) - self.declared[final_name].set_local_file(temp2, rename_var=original_name) + handler = Utils.openCdf(temp2) + var_handler = handler.variables[original_name] + if hasattr(var_handler, 'valid_min'): + del var_handler.valid_min + if hasattr(var_handler, 'valid_max'): + del var_handler.valid_max + handler.close() + self.declared[final_name].set_local_file(temp2, diagnostic=self, rename_var=original_name) def declare_var(self, var, threed, box_save): if threed: diff --git a/earthdiagnostics/utils.py b/earthdiagnostics/utils.py index 42304aa0..49331840 100644 --- a/earthdiagnostics/utils.py +++ b/earthdiagnostics/utils.py @@ -259,7 +259,7 @@ class Utils(object): Log.debug('Hashing copy ... {0}', datetime.datetime.now()) hash_destiny = Utils.get_file_hash(destiny, save=save_hash) retrials -= 1 - Log.info('Finished {0}', datetime.datetime.now()) + Log.debug('Finished {0}', datetime.datetime.now()) @staticmethod def move_file(source, destiny, save_hash=False): diff --git a/setup.py b/setup.py index 41183306..0e68a089 100644 --- a/setup.py +++ b/setup.py @@ -5,6 +5,7 @@ Installation script for EarthDiagnostics package """ from os import path + from setuptools import find_packages from setuptools import setup -- GitLab From 2e24db6b5013319ec642717a056ccd4e34a7a39b Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Tue, 17 Oct 2017 15:13:14 +0200 Subject: [PATCH 03/47] Optimization for data_size check on files --- earthdiagnostics/datafile.py | 16 +++++++++++----- 1 file changed, 11 insertions(+), 5 deletions(-) diff --git a/earthdiagnostics/datafile.py b/earthdiagnostics/datafile.py index 809c489e..6b9309b2 100644 --- a/earthdiagnostics/datafile.py +++ b/earthdiagnostics/datafile.py @@ -52,6 +52,7 @@ class DataFile(Publisher): self._storage_status = StorageStatus.READY self.job_added = False self._modifiers = [] + self._size = None def __str__(self): return 'Data file for {0}'.format(self.remote_file) @@ -62,6 +63,11 @@ class DataFile(Publisher): @property def size(self): + if self._size is None: + self._get_size() + return self._size + + def _get_size(self): if self.local_status == LocalStatus.READY: os.path.getsize(self.local_file) return None @@ -110,6 +116,7 @@ class DataFile(Publisher): if self._local_status == value: return self._local_status = value + self._size = None self.dispatch(self) @property @@ -121,6 +128,7 @@ class DataFile(Publisher): if self._storage_status == value: return self._storage_status = value + self._size = None self.dispatch(self) @classmethod @@ -485,12 +493,10 @@ class NetCDFFile(DataFile): except Exception as ex: Log.error('Can not create link to {1}: {0}'.format(ex, self.remote_file)) - @property - def size(self): + def _get_size(self): if self.local_status == LocalStatus.READY: - return os.path.getsize(self.local_file) + self._size = os.path.getsize(self.local_file) if self.storage_status == StorageStatus.READY: - return os.path.getsize(self.remote_file) - return None + self._size = os.path.getsize(self.remote_file) -- GitLab From 964147add8bd6486eca46621756a7fc9a230d365 Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Tue, 17 Oct 2017 15:16:34 +0200 Subject: [PATCH 04/47] Bumped version --- VERSION | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/VERSION b/VERSION index c4dd8a8a..d1a88439 100644 --- a/VERSION +++ b/VERSION @@ -1,2 +1,2 @@ -3.0.0rc1 +3.0.0rc2 -- GitLab From 98f98283d2ac7b90f2787f3e40cf47738a7e47af Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Tue, 17 Oct 2017 15:55:58 +0200 Subject: [PATCH 05/47] Fixed bug with PRIMAVERA path --- earthdiagnostics/cmormanager.py | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/earthdiagnostics/cmormanager.py b/earthdiagnostics/cmormanager.py index 58ce7e23..5aadcc8f 100644 --- a/earthdiagnostics/cmormanager.py +++ b/earthdiagnostics/cmormanager.py @@ -303,8 +303,12 @@ class CMORManager(DataManager): grid = self.config.cmor.default_ocean_grid else: grid = self.config.cmor.default_atmos_grid + if cmor_var is None: + table_name = domain.get_table(frequency, self.config.data_convention).name + else: + table_name = cmor_var.get_table(frequency, self.config.data_convention).name folder_path = os.path.join(self._get_startdate_path(startdate), self._get_member_str(member), - cmor_var.get_table(frequency, self.config.data_convention).name, var, + table_name, var, grid, self.config.cmor.version) return folder_path -- GitLab From 89e47854b6fb06e6dbbb96df7609422856ff124d Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Wed, 18 Oct 2017 10:13:53 +0200 Subject: [PATCH 06/47] Fixed bug with file size check --- earthdiagnostics/datafile.py | 19 ++++++++++++------- 1 file changed, 12 insertions(+), 7 deletions(-) diff --git a/earthdiagnostics/datafile.py b/earthdiagnostics/datafile.py index 6b9309b2..0ad8a799 100644 --- a/earthdiagnostics/datafile.py +++ b/earthdiagnostics/datafile.py @@ -68,9 +68,11 @@ class DataFile(Publisher): return self._size def _get_size(self): - if self.local_status == LocalStatus.READY: - os.path.getsize(self.local_file) - return None + try: + if self.local_status == LocalStatus.READY: + self._size = os.path.getsize(self.local_file) + except Exception: + self._size = None def _clean_local(self): if self.local_status != LocalStatus.READY or len(self.suscribers) > 0 or self.upload_required(): @@ -494,9 +496,12 @@ class NetCDFFile(DataFile): Log.error('Can not create link to {1}: {0}'.format(ex, self.remote_file)) def _get_size(self): - if self.local_status == LocalStatus.READY: - self._size = os.path.getsize(self.local_file) - if self.storage_status == StorageStatus.READY: - self._size = os.path.getsize(self.remote_file) + try: + if self.local_status == LocalStatus.READY: + self._size = os.path.getsize(self.local_file) + if self.storage_status == StorageStatus.READY: + self._size = os.path.getsize(self.remote_file) + except Exception: + self._size = None -- GitLab From 7e6a97f2204a1853d7f1d1d93fe6fb9d64a1553c Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Wed, 18 Oct 2017 12:49:47 +0200 Subject: [PATCH 07/47] Added check for strange rename error that was removing the time dimension --- earthdiagnostics/cmorizer.py | 8 +++----- earthdiagnostics/utils.py | 29 +++++++++++++++++++++++------ earthdiagnostics/work_manager.py | 7 +++++++ 3 files changed, 33 insertions(+), 11 deletions(-) diff --git a/earthdiagnostics/cmorizer.py b/earthdiagnostics/cmorizer.py index c4233ea2..1f426270 100644 --- a/earthdiagnostics/cmorizer.py +++ b/earthdiagnostics/cmorizer.py @@ -1,11 +1,11 @@ # coding=utf-8 import glob import os -import pygrib import shutil import uuid from datetime import datetime +import pygrib from bscearth.utils.date import parse_date, chunk_end_date, previous_day, date2str, add_months from bscearth.utils.log import Log @@ -600,11 +600,9 @@ class Cmorizer(object): if "time_bnds" in handler.variables: time_var.bounds = "time_bnds" handler.variables['time_bnds'].units = time_var.units + Utils.convert_units(handler.variables['time_bnds'], 'days since 1850-01-01 00:00:00', 'standard') + Utils.convert_units(time_var, 'days since 1850-1-1 00:00:00', 'standard') handler.close() - temp = TempFile.get() - Utils.cdo.setreftime('1850-01-01,00:00:00,days', input=filename, output=temp) - Utils.move_file(temp, filename) - self._set_leadtime_var(filename) def _set_leadtime_var(self, filename): diff --git a/earthdiagnostics/utils.py b/earthdiagnostics/utils.py index 49331840..b557faf4 100644 --- a/earthdiagnostics/utils.py +++ b/earthdiagnostics/utils.py @@ -152,10 +152,9 @@ class Utils(object): Utils._rename_vars_directly(dic_names, filepath, handler, must_exist, rename_dimension) except RuntimeError: error = True - handler.close() - if not Utils.check_netcdf_file(temp): + if not error and not Utils.check_netcdf_file(temp): error = True if error: @@ -169,10 +168,22 @@ class Utils(object): def check_netcdf_file(filepath): with suppress_stdout(): try: + handler = Utils.openCdf(filepath) + if 'time' in handler.variables: + if handler.variables['time'].dimensions != ('time', ): + handler.close() + return False + handler.close() + iris.FUTURE.netcdf_promote = True - iris.load(filepath) + cubes = iris.load(filepath) + if len(cubes) == 0: + return False except iris.exceptions.IrisError: return False + except RuntimeError: + # HDF error, usually + return False return True @staticmethod @@ -642,11 +653,17 @@ class Utils(object): os.chmod(path, st.st_mode | stat.S_IWGRP) @staticmethod - def convert_units(var_handler, new_units): + def convert_units(var_handler, new_units, calendar=None): if new_units == var_handler.units: return - new_unit = Units(new_units) - old_unit = Units(var_handler.units) + + if hasattr(var_handler, 'calendar'): + old_calendar = var_handler.calendar + else: + old_calendar = None + + new_unit = Units(new_units, calendar=calendar) + old_unit = Units(var_handler.units, calendar=old_calendar) var_handler[:] = Units.conform(var_handler[:], old_unit, new_unit, inplace=True) if 'valid_min' in var_handler.ncattrs(): var_handler.valid_min = Units.conform(float(var_handler.valid_min), old_unit, new_unit, diff --git a/earthdiagnostics/work_manager.py b/earthdiagnostics/work_manager.py index ef3a62ea..0d0f5c02 100644 --- a/earthdiagnostics/work_manager.py +++ b/earthdiagnostics/work_manager.py @@ -260,6 +260,13 @@ class Downloader(object): if suscribers: return -suscribers + if datafile1.size is None: + if datafile2.size is None: + return 0 + else: + return -1 + elif datafile2.size is None: + return 1 size = datafile1.size - datafile2.size if size: return -size -- GitLab From 169a43fca1654a02070c05d3fd9e825cddc2d2d4 Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Wed, 18 Oct 2017 18:16:02 +0200 Subject: [PATCH 08/47] Fixed everything except AreaMoc and InterpCDO --- earthdiagnostics/cmorizer.py | 8 ++++++-- earthdiagnostics/datafile.py | 6 +++--- earthdiagnostics/ocean/areamoc.py | 23 ++++++++++++----------- earthdiagnostics/ocean/heatcontent.py | 2 ++ earthdiagnostics/ocean/siasiesiv.py | 20 +++++++++++++------- earthdiagnostics/utils.py | 3 +++ earthdiagnostics/work_manager.py | 7 +++++-- 7 files changed, 44 insertions(+), 25 deletions(-) diff --git a/earthdiagnostics/cmorizer.py b/earthdiagnostics/cmorizer.py index 1f426270..a790eea0 100644 --- a/earthdiagnostics/cmorizer.py +++ b/earthdiagnostics/cmorizer.py @@ -597,11 +597,15 @@ class Cmorizer(object): def _update_time_variables(self, filename): handler = Utils.openCdf(filename) time_var = handler.variables['time'] + if hasattr(time_var, 'calendar'): + calendar = time_var.calendar + else: + calendar = 'standard' if "time_bnds" in handler.variables: time_var.bounds = "time_bnds" handler.variables['time_bnds'].units = time_var.units - Utils.convert_units(handler.variables['time_bnds'], 'days since 1850-01-01 00:00:00', 'standard') - Utils.convert_units(time_var, 'days since 1850-1-1 00:00:00', 'standard') + Utils.convert_units(handler.variables['time_bnds'], 'days since 1850-01-01 00:00:00', calendar) + Utils.convert_units(time_var, 'days since 1850-1-1 00:00:00', calendar) handler.close() self._set_leadtime_var(filename) diff --git a/earthdiagnostics/datafile.py b/earthdiagnostics/datafile.py index 0ad8a799..d82fe20e 100644 --- a/earthdiagnostics/datafile.py +++ b/earthdiagnostics/datafile.py @@ -224,10 +224,10 @@ class DataFile(Publisher): valid_max = '' if self.cmor_var is not None: - if self.cmor_var.valid_min != '': + if self.cmor_var.valid_min: valid_min = '-a valid_min,{0},o,{1},"{2}" '.format(self.final_name, var_type.char, self.cmor_var.valid_min) - if self.cmor_var.valid_max != '': + if self.cmor_var.valid_max: valid_max = '-a valid_max,{0},o,{1},"{2}" '.format(self.final_name, var_type.char, self.cmor_var.valid_max) Utils.nco.ncatted(input=file_path, output=file_path, @@ -333,7 +333,7 @@ class DataFile(Publisher): value = original_var[:] new_var[..., 0] = value handler.close() - Utils.nco.ncks(input=self.local_file, output=self.local_file, options='-O -x -v {0}'.format(self.final_name)) + Utils.nco.ncks(input=self.local_file, output=self.local_file, options=('-x -v {0}'.format(self.final_name),)) Utils.rename_variable(self.local_file, 'new_var', self.final_name) def _rename_coordinate_variables(self): diff --git a/earthdiagnostics/ocean/areamoc.py b/earthdiagnostics/ocean/areamoc.py index 80c18474..0179bcd3 100644 --- a/earthdiagnostics/ocean/areamoc.py +++ b/earthdiagnostics/ocean/areamoc.py @@ -1,12 +1,13 @@ # coding=utf-8 +import os + import numpy as np + +from earthdiagnostics.box import Box from earthdiagnostics.constants import Basins from earthdiagnostics.diagnostic import Diagnostic, DiagnosticIntOption, DiagnosticBasinOption -from earthdiagnostics.box import Box -from earthdiagnostics.utils import Utils, TempFile -import os - from earthdiagnostics.modelingrealm import ModelingRealms +from earthdiagnostics.utils import Utils, TempFile class AreaMoc(Diagnostic): @@ -149,14 +150,14 @@ class AreaMoc(Diagnostic): destiny.close() nco.ncks(input=temp2, output=temp, - options='-O -d lev,{0:.1f},{1:.1f} -d lat,{2:.1f},{3:.1f}'.format(self.box.min_depth, - self.box.max_depth, - self.box.min_lat, - self.box.max_lat)) + options=('-d lev,{0:.1f},{1:.1f} -d lat,{2:.1f},{3:.1f}'.format(self.box.min_depth, + self.box.max_depth, + self.box.min_lat, + self.box.max_lat),)) cdo.vertmean(input=temp, output=temp2) os.remove(temp) - nco.ncap2(input=temp2, output=temp2, options='-O -s "coslat[lat]=cos(lat[lat]*3.141592657/180.0)"') - nco.ncwa(input=temp2, output=temp2, options='-w coslat -a lat') - nco.ncks(input=temp2, output=temp2, options='-O -v vsftmyz,time') + nco.ncap2(input=temp2, output=temp2, options=('-s "coslat[lat]=cos(lat[lat]*3.141592657/180.0)"',)) + nco.ncwa(input=temp2, output=temp2, options='(-w coslat -a lat',) + nco.ncks(input=temp2, output=temp2, options=('-v vsftmyz,time',)) self.results.set_local_file(temp2) diff --git a/earthdiagnostics/ocean/heatcontent.py b/earthdiagnostics/ocean/heatcontent.py index 9b8731ff..d44e6492 100644 --- a/earthdiagnostics/ocean/heatcontent.py +++ b/earthdiagnostics/ocean/heatcontent.py @@ -51,6 +51,8 @@ class HeatContent(Diagnostic): self.max_level = max_level def __eq__(self, other): + if not isinstance(other, HeatContent): + return False return self.startdate == other.startdate and self.member == other.member and self.chunk == other.chunk and \ self.box == other.box and self.basin == other.basin and self.mxloption == other.mxloption diff --git a/earthdiagnostics/ocean/siasiesiv.py b/earthdiagnostics/ocean/siasiesiv.py index ec2bc5d4..21adfc0f 100644 --- a/earthdiagnostics/ocean/siasiesiv.py +++ b/earthdiagnostics/ocean/siasiesiv.py @@ -34,7 +34,7 @@ class Siasiesiv(Diagnostic): e2t = None gphit = None - def __init__(self, data_manager, startdate, member, chunk, basin, mask): + def __init__(self, data_manager, startdate, member, chunk, basin, mask, var_manager): """ :param data_manager: data management object :type data_manager: DataManager @@ -54,6 +54,9 @@ class Siasiesiv(Diagnostic): self.chunk = chunk self.mask = mask self.generated = {} + self.var_manager = var_manager + self.sic_varname = self.var_manager.get_variable('sic').short_name + self.sit_varname = self.var_manager.get_variable('sit').short_name def __str__(self): return 'Siasiesiv Startdate: {0} Member: {1} Chunk: {2} Basin: {3}'.format(self.startdate, self.member, @@ -81,7 +84,8 @@ class Siasiesiv(Diagnostic): job_list = list() for startdate, member, chunk in diags.config.experiment.get_chunk_list(): - job_list.append(Siasiesiv(diags.data_manager, startdate, member, chunk, options['basin'], mask)) + job_list.append(Siasiesiv(diags.data_manager, startdate, member, chunk, options['basin'], mask, + diags.config.var_manager)) mesh_handler = Utils.openCdf('mesh_hgr.nc') Siasiesiv.e1t = np.asfortranarray(mesh_handler.variables['e1t'][0, :]) Siasiesiv.e2t = np.asfortranarray(mesh_handler.variables['e2t'][0, :]) @@ -91,8 +95,10 @@ class Siasiesiv(Diagnostic): return job_list def request_data(self): - self.sit = self.request_chunk(ModelingRealms.seaIce, 'sit', self.startdate, self.member, self.chunk) - self.sic = self.request_chunk(ModelingRealms.seaIce, 'sic', self.startdate, self.member, self.chunk) + self.sit = self.request_chunk(ModelingRealms.seaIce, self.sit_varname, + self.startdate, self.member, self.chunk) + self.sic = self.request_chunk(ModelingRealms.seaIce, self.sic_varname, + self.startdate, self.member, self.chunk) def declare_data_generated(self): self._declare_var('sivols') @@ -112,13 +118,13 @@ class Siasiesiv(Diagnostic): Runs the diagnostic """ sit_handler = Utils.openCdf(self.sit.local_file) - sit = np.asfortranarray(sit_handler.variables['sit'][:]) + sit = np.asfortranarray(sit_handler.variables[self.sit_varname][:]) timesteps = sit_handler.dimensions['time'].size sit_handler.close() sic_handler = Utils.openCdf(self.sic.local_file) - Utils.convert_units(sic_handler.variables['sic'], '1.0') - sic = np.asfortranarray(sic_handler.variables['sic'][:]) + Utils.convert_units(sic_handler.variables[self.sic_varname], '1.0') + sic = np.asfortranarray(sic_handler.variables[self.sic_varname][:]) sic_handler.close() result = np.empty((8, timesteps)) diff --git a/earthdiagnostics/utils.py b/earthdiagnostics/utils.py index b557faf4..1bfe8755 100644 --- a/earthdiagnostics/utils.py +++ b/earthdiagnostics/utils.py @@ -184,6 +184,9 @@ class Utils(object): except RuntimeError: # HDF error, usually return False + except Exception: + # HDF error, usually + return False return True @staticmethod diff --git a/earthdiagnostics/work_manager.py b/earthdiagnostics/work_manager.py index 0d0f5c02..e1ff2a3a 100644 --- a/earthdiagnostics/work_manager.py +++ b/earthdiagnostics/work_manager.py @@ -1,8 +1,10 @@ # coding=utf-8 import datetime import operator +import sys import threading import time +import traceback from bscearth.utils.log import Log # noinspection PyCompatibility @@ -161,8 +163,9 @@ class WorkManager(object): job.compute() except Exception as ex: job.consumed_time = datetime.datetime.now() - time - job.message = str(ex) - Log.error('Job {0} failed: {1}', job, ex) + exc_type, exc_value, exc_traceback = sys.exc_info() + job.message = '{0}\n{1}'.format(ex, ''.join(traceback.format_tb(exc_traceback))) + Log.error('Job {0} failed: {1}', job, job.message ) job.status = DiagnosticStatus.FAILED return False -- GitLab From 450dada5a6cb491bf1cbdcd1c1200a4506476b60 Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Thu, 19 Oct 2017 15:21:45 +0200 Subject: [PATCH 09/47] Fixed areamoc --- earthdiagnostics/ocean/areamoc.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/earthdiagnostics/ocean/areamoc.py b/earthdiagnostics/ocean/areamoc.py index 0179bcd3..ff23513d 100644 --- a/earthdiagnostics/ocean/areamoc.py +++ b/earthdiagnostics/ocean/areamoc.py @@ -158,6 +158,6 @@ class AreaMoc(Diagnostic): cdo.vertmean(input=temp, output=temp2) os.remove(temp) nco.ncap2(input=temp2, output=temp2, options=('-s "coslat[lat]=cos(lat[lat]*3.141592657/180.0)"',)) - nco.ncwa(input=temp2, output=temp2, options='(-w coslat -a lat',) + nco.ncwa(input=temp2, output=temp2, options=('-w coslat -a lat',)) nco.ncks(input=temp2, output=temp2, options=('-v vsftmyz,time',)) self.results.set_local_file(temp2) -- GitLab From 844292a63230b380a934159b80dab4739cdf34a0 Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Fri, 20 Oct 2017 10:13:12 +0200 Subject: [PATCH 10/47] Fixed cmorization when only some chunks are requested --- earthdiagnostics/cmorizer.py | 2 ++ earthdiagnostics/cmormanager.py | 40 ++++++++++++++------------------- 2 files changed, 19 insertions(+), 23 deletions(-) diff --git a/earthdiagnostics/cmorizer.py b/earthdiagnostics/cmorizer.py index a790eea0..ef95d88b 100644 --- a/earthdiagnostics/cmorizer.py +++ b/earthdiagnostics/cmorizer.py @@ -94,6 +94,8 @@ class Cmorizer(object): except Exception as ex: Log.error('Could not CMORize oceanic file {0}: {1}', count, ex) count += 1 + if count >= self.experiment.chunks: + return def _filter_files(self, file_list): if not self.cmor.filter_files: diff --git a/earthdiagnostics/cmormanager.py b/earthdiagnostics/cmormanager.py index 5aadcc8f..76af2d1d 100644 --- a/earthdiagnostics/cmormanager.py +++ b/earthdiagnostics/cmormanager.py @@ -444,44 +444,38 @@ class CMORManager(DataManager): def _unpack_cmor_files(self, startdate, member): if self.config.cmor.force: return False - chunk = 1 cmorized = False - - if not self.config.cmor.force_untar: - while self.is_cmorized(startdate, member, chunk, ModelingRealms.atmos) or \ - self.is_cmorized(startdate, member, chunk, ModelingRealms.ocean): - chunk += 1 - - while self._unpack_chunk(startdate, member, chunk): - chunk += 1 - cmorized = True - - if self.experiment.num_chunks <= chunk: - cmorized = True + for chunk in range(1, self.experiment.num_chunks + 1): + if not self.config.cmor.force_untar: + if self.is_cmorized(startdate, member, chunk, ModelingRealms.atmos) or \ + self.is_cmorized(startdate, member, chunk, ModelingRealms.ocean): + cmorized = True + continue + + if self._unpack_chunk(startdate, member, chunk): + cmorized = True if cmorized: Log.info('Startdate {0} member {1} ready', startdate, member) return cmorized def _unpack_chunk(self, startdate, member, chunk): + if not self.config.cmor.chunk_cmorization_requested(chunk): + return True filepaths = self._get_transferred_cmor_data_filepaths(startdate, member, chunk, 'tar.gz') if len(filepaths) > 0: - if self.config.cmor.chunk_cmorization_requested(chunk): - Log.info('Unzipping cmorized data for {0} {1} {2}...', startdate, member, chunk) - Utils.unzip(filepaths, True) - else: - return True + Log.info('Unzipping cmorized data for {0} {1} {2}...', startdate, member, chunk) + Utils.unzip(filepaths, True) if not os.path.exists(self.cmor_path): os.mkdir(self.cmor_path) filepaths = self._get_transferred_cmor_data_filepaths(startdate, member, chunk, 'tar') if len(filepaths) > 0: - if self.config.cmor.chunk_cmorization_requested(chunk): - Log.info('Unpacking cmorized data for {0} {1} {2}...', startdate, member, chunk) - Utils.untar(filepaths, self.cmor_path) - self._correct_paths(startdate) - self.create_links(startdate, member) + Log.info('Unpacking cmorized data for {0} {1} {2}...', startdate, member, chunk) + Utils.untar(filepaths, self.cmor_path) + self._correct_paths(startdate) + self.create_links(startdate, member) return True return False -- GitLab From c90ef578ab26acae560990128f74cbf7556a5d0f Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Fri, 20 Oct 2017 15:55:30 +0200 Subject: [PATCH 11/47] Fixed PRIMAVERA/CMIP6 filename --- earthdiagnostics/cmormanager.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/earthdiagnostics/cmormanager.py b/earthdiagnostics/cmormanager.py index 76af2d1d..231eab59 100644 --- a/earthdiagnostics/cmormanager.py +++ b/earthdiagnostics/cmormanager.py @@ -282,8 +282,9 @@ class CMORManager(DataManager): grid = self.config.cmor.default_ocean_grid else: grid = self.config.cmor.default_atmos_grid - file_name = '{0}_{1}_{2}_{3}_{4}_{5}{6}'.format(var, cmor_table.name, self.experiment.experiment_name, - self.experiment.model, self._get_member_str(member), + file_name = '{0}_{1}_{2}_{3}_{4}_{5}{6}'.format(var, cmor_table.name, self.experiment.model, + self.experiment.experiment_name, + self._get_member_str(member), grid, time_bound) else: raise Exception('Data convention {0} not supported'.format(self.config.data_convention)) -- GitLab From 430cba38435d61049d356f00bf2bb4b43c01b552 Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Tue, 24 Oct 2017 16:49:28 +0200 Subject: [PATCH 12/47] Added selcode before split --- earthdiagnostics/cmorizer.py | 61 +++++++++++++++++++++++------------- earthdiagnostics/config.py | 3 ++ 2 files changed, 43 insertions(+), 21 deletions(-) diff --git a/earthdiagnostics/cmorizer.py b/earthdiagnostics/cmorizer.py index ef95d88b..191f9c02 100644 --- a/earthdiagnostics/cmorizer.py +++ b/earthdiagnostics/cmorizer.py @@ -8,6 +8,7 @@ from datetime import datetime import pygrib from bscearth.utils.date import parse_date, chunk_end_date, previous_day, date2str, add_months from bscearth.utils.log import Log +from cdo import CDOException from earthdiagnostics.datafile import NetCDFFile from earthdiagnostics.frequency import Frequency, Frequencies @@ -73,7 +74,6 @@ class Cmorizer(object): tar_files.sort() if len(tar_files) > 0: break - if not len(tar_files): Log.error('No {1} files found in {0}'.format(self.original_files_path, args)) @@ -250,18 +250,17 @@ class Cmorizer(object): self._obtain_atmos_timestep(gribfile) full_file = self._get_monthly_grib(current_date, gribfile, grid) - self._unpack_grib(full_file, gribfile, grid) + if not self._unpack_grib(full_file, gribfile, grid): + os.remove(gribfile) + return next_gribfile = self.get_original_grib_path(add_months(current_date, 1, self.experiment.calendar), grid) - if not os.path.exists(next_gribfile): os.remove(gribfile) - cdo_reftime = parse_date(self.startdate).strftime('%Y-%m-%d,00:00') - - self._ungrib_vars(cdo_reftime, gribfile, current_date.month, Frequency('{0}hr'.format(self.atmos_timestep))) - self._ungrib_vars(cdo_reftime, gribfile, current_date.month, Frequencies.daily) - self._ungrib_vars(cdo_reftime, gribfile, current_date.month, Frequencies.monthly) + self._ungrib_vars(gribfile, current_date.month, Frequency('{0}hr'.format(self.atmos_timestep))) + self._ungrib_vars(gribfile, current_date.month, Frequencies.daily) + self._ungrib_vars(gribfile, current_date.month, Frequencies.monthly) for splited_file in glob.glob('{0}_*.128.nc'.format(gribfile)): os.remove(splited_file) @@ -273,19 +272,37 @@ class Cmorizer(object): self._merge_and_cmorize_atmos(chunk_start, chunk_end, grid, '{0}hr'.format(self.atmos_timestep)) - @staticmethod - def _unpack_grib(full_file, gribfile, grid): + def _unpack_grib(self, full_file, gribfile, grid): Log.info('Unpacking... ') # remap on regular Gauss grid - if grid == 'SH': - Utils.cdo.splitparam(input='-sp2gpl {0}'.format(full_file), output=gribfile + '_', options='-f nc4') - else: - Utils.cdo.splitparam(input=full_file, output=gribfile + '_', options='-R -f nc4') - # total precipitation (remove negative values) - Utils.cdo.setcode(228, - input='-setmisstoc,0 -setvrange,0,Inf -add {0}_{{142,143}}.128.nc'.format(gribfile), - output='{0}_228.128.nc'.format(gribfile)) - Utils.remove_file('ICM') + + codes = self.cmor.get_requested_codes() + if 228 in codes: + codes.update(142, 143) + codes_str = ','.join([str(code) for code in codes]) + try: + if grid == 'SH': + Utils.cdo.splitparam(input='-sp2gpl -selcode,{0} {1} '.format(codes_str, full_file), + output=gribfile + '_', + options='-f nc4') + + else: + Utils.cdo.splitparam(input='-selcode,{0} {1}'.format(codes_str, full_file), + output=gribfile + '_', + options='-R -f nc4') + # total precipitation (remove negative values) + if 228 in codes: + Utils.cdo.setcode(228, + input='-setmisstoc,0 -setvrange,0,Inf ' + '-add {0}_{{142,143}}.128.nc'.format(gribfile), + output='{0}_228.128.nc'.format(gribfile), + options='-f nc4') + return True + except CDOException: + Log.info('No requested codes found in {0} file'.format(grid)) + return False + finally: + Utils.remove_file('ICM') def _get_monthly_grib(self, current_date, gribfile, grid): prev_gribfile = self.get_scratch_grib_path(add_months(current_date, -1, self.experiment.calendar), grid) @@ -509,12 +526,14 @@ class Cmorizer(object): os.remove('rules_files') Utils.remove_file(prev_gribfile) - def _ungrib_vars(self, cdo_reftime, gribfile, month, frequency): + def _ungrib_vars(self, gribfile, month, frequency): + cdo_reftime = parse_date(self.startdate).strftime('%Y-%m-%d,00:00') + Log.info('Preparing {0} variables'.format(frequency)) var_codes = self.config.cmor.get_variables(frequency) for var_code in var_codes: if not os.path.exists('{0}_{1}.128.nc'.format(gribfile, var_code)): - continue + continue new_units = None cdo_operator = '-selmon,{0}'.format(month) diff --git a/earthdiagnostics/config.py b/earthdiagnostics/config.py index 133bd6da..e9be69f6 100644 --- a/earthdiagnostics/config.py +++ b/earthdiagnostics/config.py @@ -233,6 +233,9 @@ class CMORConfig(object): return self._var_monthly raise ValueError('Frequency not recognized: {0}'.format(frequency)) + def get_requested_codes(self): + return set(list(self._var_hourly.keys()) + list(self._var_daily.keys()) + list(self._var_monthly.keys())) + def get_levels(self, frequency, variable): return self.get_variables(frequency)[variable] -- GitLab From 75e7be765e6cb065ad8b92eedf8be687e934354b Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Tue, 24 Oct 2017 17:26:40 +0200 Subject: [PATCH 13/47] Fixed problem with time bounds calendar in cmorizer --- earthdiagnostics/cmorizer.py | 4 ++-- earthdiagnostics/utils.py | 4 +--- 2 files changed, 3 insertions(+), 5 deletions(-) diff --git a/earthdiagnostics/cmorizer.py b/earthdiagnostics/cmorizer.py index 191f9c02..7248e06b 100644 --- a/earthdiagnostics/cmorizer.py +++ b/earthdiagnostics/cmorizer.py @@ -94,7 +94,7 @@ class Cmorizer(object): except Exception as ex: Log.error('Could not CMORize oceanic file {0}: {1}', count, ex) count += 1 - if count >= self.experiment.chunks: + if count >= self.experiment.num_chunks: return def _filter_files(self, file_list): @@ -625,7 +625,7 @@ class Cmorizer(object): if "time_bnds" in handler.variables: time_var.bounds = "time_bnds" handler.variables['time_bnds'].units = time_var.units - Utils.convert_units(handler.variables['time_bnds'], 'days since 1850-01-01 00:00:00', calendar) + Utils.convert_units(handler.variables['time_bnds'], 'days since 1850-01-01 00:00:00', calendar, calendar) Utils.convert_units(time_var, 'days since 1850-1-1 00:00:00', calendar) handler.close() self._set_leadtime_var(filename) diff --git a/earthdiagnostics/utils.py b/earthdiagnostics/utils.py index 1bfe8755..b0629f78 100644 --- a/earthdiagnostics/utils.py +++ b/earthdiagnostics/utils.py @@ -656,14 +656,12 @@ class Utils(object): os.chmod(path, st.st_mode | stat.S_IWGRP) @staticmethod - def convert_units(var_handler, new_units, calendar=None): + def convert_units(var_handler, new_units, calendar=None, old_calendar=None): if new_units == var_handler.units: return if hasattr(var_handler, 'calendar'): old_calendar = var_handler.calendar - else: - old_calendar = None new_unit = Units(new_units, calendar=calendar) old_unit = Units(var_handler.units, calendar=old_calendar) -- GitLab From e5f4bf48142b2473a7bf3ed2cb82beffe1c83ccb Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Tue, 24 Oct 2017 17:52:43 +0200 Subject: [PATCH 14/47] Fixed bug preventing to cmorize last chunk --- earthdiagnostics/cmorizer.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/earthdiagnostics/cmorizer.py b/earthdiagnostics/cmorizer.py index 7248e06b..c4e4a93e 100644 --- a/earthdiagnostics/cmorizer.py +++ b/earthdiagnostics/cmorizer.py @@ -94,7 +94,7 @@ class Cmorizer(object): except Exception as ex: Log.error('Could not CMORize oceanic file {0}: {1}', count, ex) count += 1 - if count >= self.experiment.num_chunks: + if count > self.experiment.num_chunks: return def _filter_files(self, file_list): -- GitLab From 39b7b8cab96da02e6acaa853f4b0ffc9ce2ab31d Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Tue, 7 Nov 2017 16:42:11 +0100 Subject: [PATCH 15/47] Automatic deletion of uneeded files now working --- diags.conf | 19 +++++++------ earthdiagnostics/datafile.py | 28 +++++++++++++++++++ earthdiagnostics/datamanager.py | 12 ++++++-- earthdiagnostics/diagnostic.py | 7 +++-- .../general/verticalmeanmetersiris.py | 19 +++++++------ earthdiagnostics/obsreconmanager.py | 10 ++----- earthdiagnostics/work_manager.py | 20 +++++++++++-- 7 files changed, 80 insertions(+), 35 deletions(-) diff --git a/diags.conf b/diags.conf index 7c063c69..fa591f64 100644 --- a/diags.conf +++ b/diags.conf @@ -17,11 +17,11 @@ CON_FILES = /esnas/autosubmit/con_files/ # an alias defined in the ALIAS section (see more below). If you are using the diagnostics just to CMORize, leave it # empty #DIAGS = discretize,atmos,sfcWind,,0,40 -DIAGS = climpercent,atmos,sfcWind,2010,2012,11 daysover,atmos,sfcWind,2010,2012,11 -#DIAGS = OHC +DIAGS = vmean,ocean,uo,0,30 monmean,ocean,uovmean0.0-30.0m,day vmean,ocean,vo,0,30 monmean,ocean,vovmean0.0-30.0m,day +# DIAGS = monmean,ocean,uovmean0.0-30.0m,day monmean,ocean,vovmean0.0-30.0m,day # Frequency of the data you want to use by default. Some diagnostics do not use this value: i.e. monmean always stores # its results at monthly frequency (obvious) and has a parameter to specify input's frequency. -FREQUENCY = 6hr +FREQUENCY = day # Path to CDFTOOLS binaries CDFTOOLS_PATH = ~jvegas/CDFTOOLS/bin # If true, copies the mesh files regardless of presence in scratch dir @@ -70,14 +70,14 @@ SERVER_URL = https://earth.bsc.es/thredds [EXPERIMENT] # Experiments parameters as defined in CMOR standard -INSTITUTE = ecmwf -MODEL = erainterim +INSTITUTE = mercator +MODEL = glorys2_v4 # Model version: Available versions -MODEL_VERSION = Ec3.2_O1L75 +MODEL_VERSION = # Atmospheric output timestep in hours -ATMOS_TIMESTEP = 6 +ATMOS_TIMESTEP = 0 # Ocean output timestep in hours -OCEAN_TIMESTEP = 6 +OCEAN_TIMESTEP = 0 # For those who use Autosubmit, this will be easy # EXPID is the unique identifier of the experiment. @@ -88,8 +88,9 @@ OCEAN_TIMESTEP = 6 # CHUNK_SIZE is the size of each data file, given in months # CHUNKS is the number of chunks. You can specify less chunks than present on the experiment EXPID = testing_erainterim -STARTDATES = 20101101 20111101 20121101 +STARTDATES = 199[3-9]0[1-9]01 199[3-9]1[0-2]01 200[0-9]0[1-9]01 200[0-9]1[0-2]01 201[0-5]0[1-9]01 201[0-5]1[0-2]01 # STARTDATES = 19840101 19850101 +# STARTDATES = 19930101 MEMBERS = 0 MEMBER_DIGITS = 1 CHUNK_SIZE = 1 diff --git a/earthdiagnostics/datafile.py b/earthdiagnostics/datafile.py index d82fe20e..866c9310 100644 --- a/earthdiagnostics/datafile.py +++ b/earthdiagnostics/datafile.py @@ -83,6 +83,11 @@ class DataFile(Publisher): self.local_file = None self.local_status = LocalStatus.PENDING + def only_suscriber(self, who): + if len(self._subscribers) != 1: + return + return who in self._subscribers + def upload_required(self): return self.local_status == LocalStatus.READY and self.storage_status == StorageStatus.PENDING @@ -284,6 +289,29 @@ class DataFile(Publisher): self._update_var_with_region_data() self._correct_metadata() Utils.nco.ncks(input=self.local_file, output=self.local_file, options=['--fix_rec_dmn region']) + # handler = Utils.openCdf(self.local_file) + # regions = handler.variables('region')[...].tolist() + # ordered_regions = regions.sorted() + # new_indexes = [ordered_regions.index(region) for region in regions] + # + # for var in handler.variables.values(): + # if 'region' not in var.dimensions(): + # continue + # var_ordered = np.moveaxis(var[...], range(len(regions)), new_indexes) + # handler.close() + # + # pass + # + # for x, region in enumerate(regions): + # Utils.nco.ncks(input=self.local_file, output=self.local_file, options=['--fix_rec_dmn region']) + # handler = Utils.openCdf(self.local_file) + # current = handler.variables['region'][...].tolist().index(region) + # handler.close() + # if current != x: + # Utils.nco.ncap2(input=self.local_file, output=self.local_file, + # options=('-s "region({0})=region({1})'.format(x, current),)) + # pass + def _update_var_with_region_data(self): temp = TempFile.get() diff --git a/earthdiagnostics/datamanager.py b/earthdiagnostics/datamanager.py index e3799d31..b4ab0124 100644 --- a/earthdiagnostics/datamanager.py +++ b/earthdiagnostics/datamanager.py @@ -58,14 +58,20 @@ class DataManager(object): var += box.get_lon_str() + box.get_lat_str() + box.get_depth_str() return var - def get_varfolder(self, domain, var, grid=None): + def get_varfolder(self, domain, var, grid=None, frequency=None): if grid: var = '{0}-{1}'.format(var, grid) if domain in [ModelingRealms.ocean, ModelingRealms.seaIce, ModelingRealms.ocnBgchem]: - return '{0}_f{1}h'.format(var, self.experiment.ocean_timestep) + return self._apply_fxh(var, self.experiment.ocean_timestep, frequency) else: - return '{0}_f{1}h'.format(var, self.experiment.atmos_timestep) + return self._apply_fxh(var, self.experiment.atmos_timestep, frequency) + + def _apply_fxh(self, folder_name, timestep, frequency=None): + is_base_frequency = frequency is not None and frequency.frequency.endswith('hr') + if not is_base_frequency and timestep > 0: + return '{0}_f{1}h'.format(folder_name, timestep) + return folder_name def create_link(self, domain, filepath, frequency, var, grid, move_old, vartype): freq_str = frequency.folder_name(vartype) diff --git a/earthdiagnostics/diagnostic.py b/earthdiagnostics/diagnostic.py index e6bf4bb0..f17d33a3 100644 --- a/earthdiagnostics/diagnostic.py +++ b/earthdiagnostics/diagnostic.py @@ -1,12 +1,12 @@ # coding=utf-8 import datetime -from datafile import StorageStatus, LocalStatus from earthdiagnostics.constants import Basins, Basin +from earthdiagnostics.datafile import StorageStatus, LocalStatus from earthdiagnostics.frequency import Frequency from earthdiagnostics.modelingrealm import ModelingRealms +from earthdiagnostics.publisher import Publisher from earthdiagnostics.variable_type import VariableType -from publisher import Publisher class DiagnosticStatus(object): @@ -242,7 +242,8 @@ class Diagnostic(Publisher): return self.pending_requests() == 0 def pending_requests(self): - return len([request.storage_status != StorageStatus.READY for request in self._requests]) + return len([request.storage_status != StorageStatus.READY or request.local_status != LocalStatus.READY + for request in self._requests]) class DiagnosticOption(object): diff --git a/earthdiagnostics/general/verticalmeanmetersiris.py b/earthdiagnostics/general/verticalmeanmetersiris.py index 92de0bef..23dce4d8 100644 --- a/earthdiagnostics/general/verticalmeanmetersiris.py +++ b/earthdiagnostics/general/verticalmeanmetersiris.py @@ -4,10 +4,10 @@ import iris.analysis import iris.exceptions from earthdiagnostics.box import Box -from earthdiagnostics.diagnostic import Diagnostic, DiagnosticFloatOption, DiagnosticDomainOption, \ - DiagnosticVariableOption -from earthdiagnostics.utils import TempFile +from earthdiagnostics.diagnostic import Diagnostic, DiagnosticFloatOption, \ + DiagnosticDomainOption, DiagnosticVariableListOption from earthdiagnostics.modelingrealm import ModelingRealms +from earthdiagnostics.utils import TempFile class VerticalMeanMetersIris(Diagnostic): @@ -66,10 +66,10 @@ class VerticalMeanMetersIris(Diagnostic): :type options: list[str] :return: """ - options_available = (DiagnosticVariableOption(diags.data_manager.config.var_manager), + options_available = (DiagnosticDomainOption(), + DiagnosticVariableListOption(diags.data_manager.config.var_manager, 'variable'), DiagnosticFloatOption('min_depth', -1), - DiagnosticFloatOption('max_depth', -1), - DiagnosticDomainOption(default_value=ModelingRealms.ocean)) + DiagnosticFloatOption('max_depth', -1)) options = cls.process_options(options, options_available) box = Box(True) @@ -79,9 +79,10 @@ class VerticalMeanMetersIris(Diagnostic): box.max_depth = options['max_depth'] job_list = list() - for startdate, member, chunk in diags.config.experiment.get_chunk_list(): - job_list.append(VerticalMeanMetersIris(diags.data_manager, startdate, member, chunk, - options['domain'], options['variable'], box)) + for var in options['variable']: + for startdate, member, chunk in diags.config.experiment.get_chunk_list(): + job_list.append(VerticalMeanMetersIris(diags.data_manager, startdate, member, chunk, + options['domain'], var, box)) return job_list def request_data(self): diff --git a/earthdiagnostics/obsreconmanager.py b/earthdiagnostics/obsreconmanager.py index 661986c9..b75e7c0f 100644 --- a/earthdiagnostics/obsreconmanager.py +++ b/earthdiagnostics/obsreconmanager.py @@ -88,7 +88,6 @@ class ObsReconManager(DataManager): """ if not frequency: frequency = self.config.frequency - var = self._get_final_var_name(box, var) folder_path = self._get_folder_path(frequency, domain, var, grid, vartype) file_name = self._get_file_name(var, startdate) @@ -97,12 +96,7 @@ class ObsReconManager(DataManager): return filepath def _get_folder_path(self, frequency, domain, variable, grid, vartype): - - if not frequency.frequency.endswith('hr'): - var_folder = self.get_varfolder(domain, variable, grid) - else: - var_folder = variable - + var_folder = self.get_varfolder(domain, variable, grid, frequency) folder_path = os.path.join(self.config.data_dir, self.config.data_type, self.experiment.institute.lower(), self.experiment.model.lower(), @@ -261,7 +255,7 @@ class ObsReconManager(DataManager): cmor_var = self.variable_list.get_variable(var) if cmor_var: var = cmor_var.short_name - final_name = var + final_name = self._get_final_var_name(box, var) filepath = self.get_file_path(startdate, domain, final_name, frequency, vartype, box, grid) netcdf_file = self._declare_generated_file(filepath, domain, final_name, cmor_var, self.config.data_convention, diff --git a/earthdiagnostics/work_manager.py b/earthdiagnostics/work_manager.py index e1ff2a3a..cca45235 100644 --- a/earthdiagnostics/work_manager.py +++ b/earthdiagnostics/work_manager.py @@ -95,6 +95,9 @@ class WorkManager(object): def _job_status_changed(self, job): if job.status == DiagnosticStatus.READY: self.executor.submit(self._run_job, job) + for request in job._requests: + if request.only_suscriber(self): + request.unsubscribe(self) self.check_completion() def _file_object_status_changed(self, file_object): @@ -104,9 +107,20 @@ class WorkManager(object): if file_object.upload_required(): self.uploader.submit(file_object.upload) return + if file_object.only_suscriber(self): + file_object.unsubscribe(self) self.check_completion() def check_completion(self): + counter = 0 + for job in self.jobs: + if job.status == DiagnosticStatus.READY: + counter += 1 + if counter > 20: + break + + self.downloader.on_hold = counter > 20 + for job in self.jobs: if job.status in (DiagnosticStatus.READY, DiagnosticStatus.RUNNING): return False @@ -231,8 +245,8 @@ class Downloader(object): def __init__(self): self._downloads = [] self._lock = threading.Lock() - self._wait = threading.Semaphore() self.stop = False + self.on_hold = False def start(self): self._thread = threading.Thread(target=self.downloader) @@ -277,7 +291,7 @@ class Downloader(object): while True: with self._lock: - if len(self._downloads) == 0: + if len(self._downloads) == 0 or self.on_hold: if self.stop: return time.sleep(0.01) @@ -287,7 +301,7 @@ class Downloader(object): self._downloads.remove(datafile) datafile.download() except Exception as ex: - Log.critical('Unhandled error at downloader: {0}', ex) + Log.critical('Unhandled error at downloader: {0}\n{1}', ex, traceback.print_exc()) def shutdown(self): self.stop = True -- GitLab From 92943a90a59abde2cbaf21ec1b2656653bfbc9c7 Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Wed, 8 Nov 2017 16:31:49 +0100 Subject: [PATCH 16/47] First implemntation of skip diags (not working) --- earthdiagnostics/config.py | 1 + earthdiagnostics/diagnostic.py | 11 +++++++++++ earthdiagnostics/work_manager.py | 6 ++++++ 3 files changed, 18 insertions(+) diff --git a/earthdiagnostics/config.py b/earthdiagnostics/config.py index e9be69f6..96c83702 100644 --- a/earthdiagnostics/config.py +++ b/earthdiagnostics/config.py @@ -66,6 +66,7 @@ class Config(object): self.var_manager = VariableManager() self.var_manager.load_variables(self.data_convention) self._diags = parser.get_option('DIAGNOSTICS', 'DIAGS') + self.skip_diags_done = parser.get_bool_option('DIAGNOSTICS', 'SKIP_DIAGS_DONE', True) self.frequency = Frequency(parser.get_option('DIAGNOSTICS', 'FREQUENCY')) "Default data frequency to be used by the diagnostics" diff --git a/earthdiagnostics/diagnostic.py b/earthdiagnostics/diagnostic.py index f17d33a3..6295ef28 100644 --- a/earthdiagnostics/diagnostic.py +++ b/earthdiagnostics/diagnostic.py @@ -1,6 +1,8 @@ # coding=utf-8 import datetime +from bscearth.utils.log import Log + from earthdiagnostics.constants import Basins, Basin from earthdiagnostics.datafile import StorageStatus, LocalStatus from earthdiagnostics.frequency import Frequency @@ -41,6 +43,15 @@ class Diagnostic(Publisher): self.consumed_time = datetime.timedelta() self.subjobs = [] + def can_skip_run(self): + for file_generated in self._generated_files: + if file_generated.storage_status != StorageStatus.READY: + return False + if file_generated.has_modifiers(): + Log.warning('Can not skip diagnostics run when data is going to be modified: {0}'.format(self)) + return False + + def __repr__(self): return str(self) diff --git a/earthdiagnostics/work_manager.py b/earthdiagnostics/work_manager.py index cca45235..647feec7 100644 --- a/earthdiagnostics/work_manager.py +++ b/earthdiagnostics/work_manager.py @@ -68,6 +68,12 @@ class WorkManager(object): subjob.subscribe(self, self._job_status_changed) job.check_is_ready() + if self.config.skip_diags_done: + for job in self.jobs: + if job.can_skip_run(): + Log.info('Diagnostic {0} already done. Skipping !', job) + job.status = DiagnosticStatus.COMPLETED + for file_object in self.data_manager.requested_files.values(): file_object.subscribe(self, self._file_object_status_changed) if file_object.download_required(): -- GitLab From b6e51f17b91aa52e5eb84263510b0d48f46a19c5 Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Fri, 10 Nov 2017 10:10:26 +0100 Subject: [PATCH 17/47] Fix for marenostrum 4 release --- earthdiagnostics/cmormanager.py | 49 ++++++++++++++++++----- earthdiagnostics/constants.py | 6 ++- earthdiagnostics/diagnostic.py | 6 ++- earthdiagnostics/statistics/discretize.py | 8 ++-- earthdiagnostics/variable.py | 9 +++-- 5 files changed, 59 insertions(+), 19 deletions(-) diff --git a/earthdiagnostics/cmormanager.py b/earthdiagnostics/cmormanager.py index 231eab59..b454c4f3 100644 --- a/earthdiagnostics/cmormanager.py +++ b/earthdiagnostics/cmormanager.py @@ -484,14 +484,16 @@ class CMORManager(DataManager): tar_path = os.path.join(self.config.data_dir, self.experiment.expid, 'original_files', 'cmorfiles') tar_original_files = os.path.join(self.config.data_dir, 'original_files', self.experiment.expid, 'cmorfiles') - file_name = 'CMOR?_{0}_{1}_{2}_{3}-*.{4}'.format(self.experiment.expid, startdate, - self.experiment.get_member_str(member), - self.experiment.get_chunk_start_str(startdate, chunk), - extension) - filepaths = glob.glob(os.path.join(tar_path, file_name)) - filepaths += glob.glob(os.path.join(tar_path, 'outputs', file_name)) - filepaths += glob.glob(os.path.join(tar_original_files, file_name)) - filepaths += glob.glob(os.path.join(tar_original_files, 'outputs', file_name)) + filepaths = [] + for cmor_prefix in ('CMOR?', 'CMOR'): + file_name = '{5}_{0}_{1}_{2}_{3}-*.{4}'.format(self.experiment.expid, startdate, + self.experiment.get_member_str(member), + self.experiment.get_chunk_start_str(startdate, chunk), + extension, cmor_prefix) + filepaths += glob.glob(os.path.join(tar_path, file_name)) + filepaths += glob.glob(os.path.join(tar_path, 'outputs', file_name)) + filepaths += glob.glob(os.path.join(tar_original_files, file_name)) + filepaths += glob.glob(os.path.join(tar_original_files, 'outputs', file_name)) return filepaths def _correct_paths(self, startdate): @@ -537,6 +539,16 @@ class CMORManager(DataManager): member_str = None Log.info('Creating links for CMOR files ({0})', startdate) path = self._get_startdate_path(startdate) + if self.config.data_convention.upper() in ('SPECS', 'APPLICATE'): + self._create_links_CMIP5(member_str, path) + elif self.config.data_convention.upper() in ('CMIP6', 'PRIMAVERA'): + self._create_links_CMIP6(member_str, path) + else: + raise ValueError('Dataset convention {0} not supported for massive ' + 'link creation'.format(self.config.data_convention)) + Log.debug('Links ready') + + def _create_links_CMIP5(self, member_str, path): for freq in os.listdir(path): frequency = Frequency.parse(freq) for domain in os.listdir(os.path.join(path, freq)): @@ -553,7 +565,26 @@ class CMORManager(DataManager): for filename in os.listdir(filepath): self.create_link(domain, os.path.join(filepath, filename), frequency, var, "", False, vartype=VariableType.MEAN) - Log.debug('Links ready') + + def _create_links_CMIP6(self, member_str, path): + for member in os.listdir(path): + for table in os.listdir(os.path.join(path, member)): + frequency = self.variable_list.tables[table].frequency + domain = None + for var in os.listdir(os.path.join(path, member, table)): + for grid in os.listdir(os.path.join(path, member, table, var)): + if member_str != member: + continue + for name in os.listdir(os.path.join(path, member, table, var, grid)): + filepath = os.path.join(path, member, table, var, grid, name) + if os.path.isfile(filepath): + + self.create_link(domain, filepath, frequency, var, "", False, + vartype=VariableType.MEAN) + else: + for filename in os.listdir(filepath): + self.create_link(domain, os.path.join(filepath, filename), frequency, var, "", + False, vartype=VariableType.MEAN) def _get_startdate_path(self, startdate): """ diff --git a/earthdiagnostics/constants.py b/earthdiagnostics/constants.py index c1e51013..6c66d625 100644 --- a/earthdiagnostics/constants.py +++ b/earthdiagnostics/constants.py @@ -3,6 +3,7 @@ Contains the enumeration-like classes used by the diagnostics """ import netCDF4 + from singleton import SingletonType @@ -47,6 +48,7 @@ class Basins(object): def __init__(self): self.aliases = { + 'Global': ('Global', 'glob'), 'Atlantic_Ocean': ('atl', 'atlantic'), 'North_Atlantic_Ocean': ('natl', 'north_atlantic'), 'Tropical_Atlantic_Ocean': ('tatl', 'tropical_atlantic'), @@ -125,7 +127,9 @@ class Basins(object): self.Indian = Basin('Indian_Ocean') self._known_aliases = {} self._add_alias('glob', self.Global) - self._add_alias(self.Global.name, self.Global) + for basin in (self.Global, self.Atlantic, self.Pacific, self.IndoPacific, self.Indian): + for alias in self.aliases[basin.name]: + self._add_alias(alias, basin) def get_available_basins(self, handler): """ diff --git a/earthdiagnostics/diagnostic.py b/earthdiagnostics/diagnostic.py index e6bf4bb0..bdf25a94 100644 --- a/earthdiagnostics/diagnostic.py +++ b/earthdiagnostics/diagnostic.py @@ -381,7 +381,11 @@ class DiagnosticFrequencyOption(DiagnosticOption): class DiagnosticBasinOption(DiagnosticOption): def parse(self, option_value): - return Basins().parse(self.check_default(option_value)) + value = self.check_default(option_value) + basin = Basins().parse(value) + if basin is None: + raise DiagnosticOptionError('Basin {0} not recognized'.format(value)) + return basin class DiagnosticComplexStrOption(DiagnosticOption): diff --git a/earthdiagnostics/statistics/discretize.py b/earthdiagnostics/statistics/discretize.py index 81ed8232..b7138234 100644 --- a/earthdiagnostics/statistics/discretize.py +++ b/earthdiagnostics/statistics/discretize.py @@ -1,11 +1,11 @@ # coding=utf-8 import math +import cf_units import iris import iris.coord_categorisation import iris.coords import iris.exceptions -import iris.unit import numpy as np import psutil import six @@ -199,9 +199,9 @@ class Discretize(Diagnostic): var_name='leadtime', units='months')) lead_date = add_months(date, leadtime - 1, self.data_manager.config.experiment.calendar) - leadtime_cube.add_aux_coord(iris.coords.AuxCoord(iris.unit.date2num(lead_date, - unit='days since 1950-01-01', - calendar="standard"), + leadtime_cube.add_aux_coord(iris.coords.AuxCoord(cf_units.date2num(lead_date, + unit='days since 1950-01-01', + calendar="standard"), var_name='time', units='days since 1950-01-01')) diff --git a/earthdiagnostics/variable.py b/earthdiagnostics/variable.py index 9a623469..588d18e2 100644 --- a/earthdiagnostics/variable.py +++ b/earthdiagnostics/variable.py @@ -10,7 +10,6 @@ from bscearth.utils.log import Log from earthdiagnostics.constants import Basins from earthdiagnostics.frequency import Frequency from earthdiagnostics.modelingrealm import ModelingRealms -from singleton import SingletonType class VariableJsonException(Exception): @@ -22,6 +21,7 @@ class VariableManager(object): self._cmor_tables_folder = os.path.join(os.path.dirname(os.path.realpath(__file__)), 'cmor_tables') self._aliases_folder = os.path.join(os.path.dirname(os.path.realpath(__file__)), 'variable_alias') self._dict_variables = {} + self.tables = {} def get_variable(self, original_name, silent=False): """ @@ -132,9 +132,9 @@ class VariableManager(object): continue if 'variable_entry' in data: Log.debug('Parsing file {0}'.format(file_name)) - table = CMORTable(data['Header']['table_id'][6:], - Frequency(data['Header']['frequency']), - data['Header']['table_date']) + table_id = data['Header']['table_id'][6:] + table = CMORTable(table_id, Frequency(data['Header']['frequency']), data['Header']['table_date']) + self.tables[table_id] = table self._load_json_variables(data['variable_entry'], table) def _load_json_variables(self, json_data, table): @@ -247,6 +247,7 @@ class VariableManager(object): continue table_frequency, table_date = table_data[sheet.title] table = CMORTable(sheet.title, table_frequency, table_date) + self.tables[sheet.title] = table for row in sheet.rows: if row[0].value == 'Priority' or not row[5].value: continue -- GitLab From f46495ab8cc4816ae1b56f888ec35c80d663fee1 Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Tue, 14 Nov 2017 13:32:52 +0100 Subject: [PATCH 18/47] Fixed for weekly data --- diags.conf | 18 +++--- earthdiagnostics/datafile.py | 7 +-- earthdiagnostics/diagnostic.py | 18 +++++- earthdiagnostics/frequency.py | 7 +++ earthdiagnostics/obsreconmanager.py | 11 ++-- earthdiagnostics/ocean/interpolatecdo.py | 71 ++++++++++++++++++------ earthdiagnostics/work_manager.py | 29 +++++++--- 7 files changed, 115 insertions(+), 46 deletions(-) diff --git a/diags.conf b/diags.conf index fa591f64..d6504e3d 100644 --- a/diags.conf +++ b/diags.conf @@ -17,11 +17,11 @@ CON_FILES = /esnas/autosubmit/con_files/ # an alias defined in the ALIAS section (see more below). If you are using the diagnostics just to CMORize, leave it # empty #DIAGS = discretize,atmos,sfcWind,,0,40 -DIAGS = vmean,ocean,uo,0,30 monmean,ocean,uovmean0.0-30.0m,day vmean,ocean,vo,0,30 monmean,ocean,vovmean0.0-30.0m,day +DIAGS = interpcdo,ocean,tas,r240x121,bilinear,False,ecmwf,False # DIAGS = monmean,ocean,uovmean0.0-30.0m,day monmean,ocean,vovmean0.0-30.0m,day # Frequency of the data you want to use by default. Some diagnostics do not use this value: i.e. monmean always stores # its results at monthly frequency (obvious) and has a parameter to specify input's frequency. -FREQUENCY = day +FREQUENCY = weekly # Path to CDFTOOLS binaries CDFTOOLS_PATH = ~jvegas/CDFTOOLS/bin # If true, copies the mesh files regardless of presence in scratch dir @@ -70,14 +70,14 @@ SERVER_URL = https://earth.bsc.es/thredds [EXPERIMENT] # Experiments parameters as defined in CMOR standard -INSTITUTE = mercator -MODEL = glorys2_v4 +INSTITUTE = ecmwf +MODEL = erainterim # Model version: Available versions MODEL_VERSION = # Atmospheric output timestep in hours -ATMOS_TIMESTEP = 0 +ATMOS_TIMESTEP = 6 # Ocean output timestep in hours -OCEAN_TIMESTEP = 0 +OCEAN_TIMESTEP = 6 # For those who use Autosubmit, this will be easy # EXPID is the unique identifier of the experiment. @@ -88,9 +88,9 @@ OCEAN_TIMESTEP = 0 # CHUNK_SIZE is the size of each data file, given in months # CHUNKS is the number of chunks. You can specify less chunks than present on the experiment EXPID = testing_erainterim -STARTDATES = 199[3-9]0[1-9]01 199[3-9]1[0-2]01 200[0-9]0[1-9]01 200[0-9]1[0-2]01 201[0-5]0[1-9]01 201[0-5]1[0-2]01 -# STARTDATES = 19840101 19850101 -# STARTDATES = 19930101 +#STARTDATES = 199[3-9]0[1-9]01 199[3-9]1[0-2]01 200[0-9]0[1-9]01 200[0-9]1[0-2]01 201[0-5]0[1-9]01 201[0-5]1[0-2]01 +#STARTDATES = 19840101 19850101 +STARTDATES = 19960104 MEMBERS = 0 MEMBER_DIGITS = 1 CHUNK_SIZE = 1 diff --git a/earthdiagnostics/datafile.py b/earthdiagnostics/datafile.py index 866c9310..fc3032d5 100644 --- a/earthdiagnostics/datafile.py +++ b/earthdiagnostics/datafile.py @@ -59,7 +59,6 @@ class DataFile(Publisher): def unsubscribe(self, who): super(DataFile, self).unsubscribe(who) - self._clean_local() @property def size(self): @@ -74,8 +73,9 @@ class DataFile(Publisher): except Exception: self._size = None - def _clean_local(self): - if self.local_status != LocalStatus.READY or len(self.suscribers) > 0 or self.upload_required(): + def clean_local(self): + if self.local_status != LocalStatus.READY or len(self.suscribers) > 0 or self.upload_required() or \ + self.storage_status == StorageStatus.UPLOADING: return Log.debug('File {0} no longer needed. Deleting from scratch...'.format(self.remote_file)) os.remove(self.local_file) @@ -185,7 +185,6 @@ class DataFile(Publisher): except Exception as ex: Log.warning('Link for file {0} can not be created: {1}', self.remote_file, ex) self.storage_status = StorageStatus.READY - self._clean_local() def set_local_file(self, local_file, diagnostic=None, rename_var=''): if diagnostic in self._modifiers: diff --git a/earthdiagnostics/diagnostic.py b/earthdiagnostics/diagnostic.py index 6295ef28..02d0619e 100644 --- a/earthdiagnostics/diagnostic.py +++ b/earthdiagnostics/diagnostic.py @@ -212,6 +212,19 @@ class Diagnostic(Publisher): """ return 'Developer must override base class __str__ method' + def add_subjob(self, subjob): + """ + Adds a subjob + :param subjob: + :type subjob: Diagnostic + :return: + """ + self.subjobs.append(subjob) + subjob.subscribe(self, self._subjob_status_changed) + + def _subjob_status_changed(self, job): + self.check_is_ready() + def request_chunk(self, domain, var, startdate, member, chunk, grid=None, box=None, frequency=None, to_modify=False, vartype=VariableType.MEAN): request = self.data_manager.request_chunk(domain, var, startdate, member, chunk, grid, box, frequency, vartype) @@ -242,7 +255,8 @@ class Diagnostic(Publisher): self.check_is_ready() def check_is_ready(self): - if all([request.ready_to_run(self) for request in self._requests]): + if all([request.ready_to_run(self) for request in self._requests]) and\ + all([subjob.status == DiagnosticStatus.COMPLETED for subjob in self.subjobs]): self.status = DiagnosticStatus.READY def _unsuscribe_requests(self): @@ -366,7 +380,7 @@ class DiagnosticVariableListOption(DiagnosticOption): def parse(self, option_value): option_value = self.check_default(option_value) var_names = [] - for value in option_value.split('-'): + for value in option_value.split(':'): real_name = self.var_manager.get_variable(value, False) if real_name is None: var_names.append(value) diff --git a/earthdiagnostics/frequency.py b/earthdiagnostics/frequency.py index 09ebe3de..9a95f26e 100644 --- a/earthdiagnostics/frequency.py +++ b/earthdiagnostics/frequency.py @@ -9,6 +9,7 @@ class Frequency(object): 'dec': 'dec', 'decadal': 'dec', 'y': 'year', 'yr': 'year', 'year': 'year', 'yearly': 'year', 'm': 'mon', '1m': 'mon', 'mon': 'mon', 'monthly': 'mon', 'mm': 'mon', + 'w': 'week', '1w': 'week', 'week': 'week', 'weekly': 'week', 'd': 'day', '1d': 'day', 'daily': 'day', 'day': 'day', '15': '15hr', '15h': '15hr', '15hr': '15hr', '15_hourly': '15hr', '15hourly': '15hr', '15 hourly': '15hr', @@ -28,12 +29,17 @@ class Frequency(object): def __eq__(self, other): return self.frequency == other.frequency + def __ne__(self, other): + return not self == other + def __str__(self): return self.frequency def folder_name(self, vartype): if self == Frequencies.daily: freq_str = 'daily_{0}'.format(VariableType.to_str(vartype)) + elif self == Frequencies.weekly: + freq_str = 'weekly_{0}'.format(VariableType.to_str(vartype)) elif self == Frequencies.climatology: freq_str = 'clim' elif self in (Frequencies.three_hourly, Frequencies.six_hourly, Frequencies.hourly): @@ -56,6 +62,7 @@ class Frequencies(object): climatology = Frequency('clim') yearly = Frequency('year') monthly = Frequency('mon') + weekly = Frequency('week') daily = Frequency('day') six_hourly = Frequency('6hr') three_hourly = Frequency('3hr') diff --git a/earthdiagnostics/obsreconmanager.py b/earthdiagnostics/obsreconmanager.py index b75e7c0f..356eac77 100644 --- a/earthdiagnostics/obsreconmanager.py +++ b/earthdiagnostics/obsreconmanager.py @@ -4,6 +4,7 @@ import os from bscearth.utils.log import Log from earthdiagnostics.datamanager import DataManager +from earthdiagnostics.frequency import Frequencies from earthdiagnostics.variable_type import VariableType @@ -90,7 +91,7 @@ class ObsReconManager(DataManager): frequency = self.config.frequency folder_path = self._get_folder_path(frequency, domain, var, grid, vartype) - file_name = self._get_file_name(var, startdate) + file_name = self._get_file_name(var, startdate, frequency) filepath = os.path.join(folder_path, file_name) return filepath @@ -147,12 +148,12 @@ class ObsReconManager(DataManager): var = self._get_final_var_name(box, var) full_path = os.path.join(self.config.data_dir, self.config.data_type, self.experiment.institute, self.experiment.model, frequency.folder_name(vartype)) - full_path = os.path.join(full_path, var, self._get_file_name(var, startdate)) + full_path = os.path.join(full_path, var, self._get_file_name(var, startdate, frequency)) return full_path - def _get_file_name(self, var, startdate): + def _get_file_name(self, var, startdate, frequency): if startdate: - if self.config.data_type != 'exp': + if self.config.data_type != 'exp' and frequency != Frequencies.weekly: startdate = startdate[0:6] return '{0}_{1}.nc'.format(var, startdate) else: @@ -216,7 +217,7 @@ class ObsReconManager(DataManager): :rtype: str """ var = self._get_final_var_name(box, var) - filepath = self.get_file_path(startdate, domain, var, frequency, vartype, grid, box) + filepath = self.get_file_path(startdate, domain, var, frequency, vartype, box, grid) Log.debug('{0} requested', filepath) return self._get_file_from_storage(filepath) diff --git a/earthdiagnostics/ocean/interpolatecdo.py b/earthdiagnostics/ocean/interpolatecdo.py index 0bc7709b..1dc0719f 100644 --- a/earthdiagnostics/ocean/interpolatecdo.py +++ b/earthdiagnostics/ocean/interpolatecdo.py @@ -97,32 +97,37 @@ class InterpolateCDO(Diagnostic): job_list = list() weights = TempFile.get() method = options['method'].lower() - cls._compute_weights(diags, method, options, target_grid, weights) + if options['weights_from_mask']: + temp = cls.get_sample_grid_file() + cls.compute_weights(method, target_grid, temp, weights) + os.remove(temp) + weights_job = None + else: + startdate, member, chunk = diags.config.experiment.get_chunk_list()[0] + weights_job = ComputeWeights(diags.data_manager, startdate, member, chunk, options['domain'], + options['variables'][0],target_grid, options['original_grid'], weights, + options['method']) + for var in options['variables']: for startdate, member, chunk in diags.config.experiment.get_chunk_list(): - job_list.append(InterpolateCDO(diags.data_manager, startdate, member, chunk, - options['domain'], var, target_grid, - diags.config.experiment.model_version, options['mask_oceans'], - options['original_grid'], weights)) + job = InterpolateCDO(diags.data_manager, startdate, member, chunk, options['domain'], var, target_grid, + diags.config.experiment.model_version, options['mask_oceans'], + options['original_grid'], weights) + if weights_job is not None: + job.add_subjob(weights_job) + job_list.append(job) return job_list @classmethod - def _compute_weights(cls, diags, method, options, target_grid, weights): - if options['weights_from_mask']: - temp = cls.get_sample_grid_file() - else: - startdate, member, chunk = diags.config.experiment.get_chunk_list()[0] - temp = diags.data_manager.get_file(options['domain'], options['variable'], startdate, member, chunk, - grid=options['original_grid']) + def compute_weights(cls, method, target_grid, sample_file, weights): if method == InterpolateCDO.BILINEAR: - Utils.cdo.genbil(target_grid, input=temp, output=weights) + Utils.cdo.genbil(target_grid, input=sample_file, output=weights) elif method == InterpolateCDO.BICUBIC: - Utils.cdo.genbic(target_grid, input=temp, output=weights) + Utils.cdo.genbic(target_grid, input=sample_file, output=weights) elif method == InterpolateCDO.CONSERVATIVE: - Utils.cdo.genycon(target_grid, input=temp, output=weights) + Utils.cdo.genycon(target_grid, input=sample_file, output=weights) elif method == InterpolateCDO.CONSERVATIVE2: - Utils.cdo.gencon2(target_grid, input=temp, output=weights) - os.remove(temp) + Utils.cdo.gencon2(target_grid, input=sample_file, output=weights) @classmethod def get_sample_grid_file(cls): @@ -235,6 +240,38 @@ class InterpolateCDO(Diagnostic): self.regridded.set_local_file(temp) +class ComputeWeights(Diagnostic): + alias = 'computeinterpcdoweights' + "Diagnostic alias for the configuration file" + @classmethod + def generate_jobs(cls, diags, options): + pass + + def __init__(self, data_manager, startdate, member, chunk, domain, variable, target_grid, + original_grid, weights_file, method): + Diagnostic.__init__(self, data_manager) + self.startdate = startdate + self.member = member + self.chunk = chunk + self.variable = variable + self.domain = domain + self.grid = target_grid + self.original_grid = original_grid + self.weights_file = weights_file + self.method = method + + def __str__(self): + return 'Computing weights for CDO interpolation: Method {0.method} Target grid: {0.grid}'.format(self) + + def compute(self): + InterpolateCDO.compute_weights(self.method, self.grid, self.sample_data.local_file, self.weights_file) + + def request_data(self): + self.sample_data = self.request_chunk(self.domain, self.variable, self.startdate, self.member, self.chunk, + grid=self.original_grid) + + def declare_data_generated(self): + pass diff --git a/earthdiagnostics/work_manager.py b/earthdiagnostics/work_manager.py index 647feec7..5c9b3e93 100644 --- a/earthdiagnostics/work_manager.py +++ b/earthdiagnostics/work_manager.py @@ -39,6 +39,8 @@ class WorkManager(object): try: for job in diag_class.generate_jobs(self, diag_options): list_jobs.append(job) + for subjob in job.subjobs: + list_jobs.append(subjob) continue except DiagnosticOptionError as ex: Log.error('Can not configure diagnostic {0}: {1}', diag_options[0], ex) @@ -64,8 +66,6 @@ class WorkManager(object): job.request_data() job.declare_data_generated() job.subscribe(self, self._job_status_changed) - for subjob in job.subjobs: - subjob.subscribe(self, self._job_status_changed) job.check_is_ready() if self.config.skip_diags_done: @@ -83,7 +83,7 @@ class WorkManager(object): self.lock = threading.Lock() self.lock.acquire() - self.check_completion() + # self.check_completion() self.lock.acquire() self.downloader.shutdown() @@ -103,18 +103,26 @@ class WorkManager(object): self.executor.submit(self._run_job, job) for request in job._requests: if request.only_suscriber(self): + del self.data_manager.requested_files[request.remote_file] request.unsubscribe(self) + request.clean_local() self.check_completion() def _file_object_status_changed(self, file_object): + Log.debug('Checking file {0}. Local status {0.local_status} Storage status{0.storage_status}', file_object) if file_object.download_required(): self.downloader.submit(file_object) return if file_object.upload_required(): + file_object.storage_status = StorageStatus.UPLOADING self.uploader.submit(file_object.upload) return - if file_object.only_suscriber(self): + if file_object.local_status != LocalStatus.COMPUTING and \ + file_object.storage_status != StorageStatus.UPLOADING and \ + file_object.only_suscriber(self): + del self.data_manager.requested_files[file_object.remote_file] file_object.unsubscribe(self) + file_object.clean_local() self.check_completion() def check_completion(self): @@ -137,14 +145,17 @@ class WorkManager(object): for request in self.data_manager.requested_files.values(): if request.storage_status == StorageStatus.UPLOADING: - return + return False if request.local_status == LocalStatus.DOWNLOADING: - return + return False if request.upload_required(): - return + return False if request.download_required(): - return - self.lock.release() + return False + try: + self.lock.release() + except Exception: + pass return True def print_stats(self): -- GitLab From db8dbe745e981854133302b29422af71dde66188 Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Tue, 14 Nov 2017 13:39:15 +0100 Subject: [PATCH 19/47] remove deprecation warning --- earthdiagnostics/statistics/discretize.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/earthdiagnostics/statistics/discretize.py b/earthdiagnostics/statistics/discretize.py index 81ed8232..c997e5ec 100644 --- a/earthdiagnostics/statistics/discretize.py +++ b/earthdiagnostics/statistics/discretize.py @@ -1,11 +1,11 @@ # coding=utf-8 import math +import cf_units import iris import iris.coord_categorisation import iris.coords import iris.exceptions -import iris.unit import numpy as np import psutil import six @@ -199,7 +199,7 @@ class Discretize(Diagnostic): var_name='leadtime', units='months')) lead_date = add_months(date, leadtime - 1, self.data_manager.config.experiment.calendar) - leadtime_cube.add_aux_coord(iris.coords.AuxCoord(iris.unit.date2num(lead_date, + leadtime_cube.add_aux_coord(iris.coords.AuxCoord(cf_units.date2num(lead_date, unit='days since 1950-01-01', calendar="standard"), var_name='time', -- GitLab From 05f3d00bb4f1df7dd91ac59a680d47df02f9da14 Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Tue, 14 Nov 2017 15:40:22 +0100 Subject: [PATCH 20/47] Fixed bug when no diagnostics where added --- earthdiagnostics/work_manager.py | 10 +++++++--- 1 file changed, 7 insertions(+), 3 deletions(-) diff --git a/earthdiagnostics/work_manager.py b/earthdiagnostics/work_manager.py index 5c9b3e93..110b9f28 100644 --- a/earthdiagnostics/work_manager.py +++ b/earthdiagnostics/work_manager.py @@ -51,8 +51,12 @@ class WorkManager(object): self.jobs = list_jobs def run(self): - time = datetime.datetime.now() - Log.info("Starting to compute at {0}", time) + if len(self.jobs) == 0: + Log.result('No diagnostics to run') + return + + start_time = datetime.datetime.now() + Log.info("Starting to compute at {0}", start_time) self.threads = Utils.available_cpu_count() if 0 < self.config.max_cores < self.threads: self.threads = self.config.max_cores @@ -93,7 +97,7 @@ class WorkManager(object): TempFile.clean() finish_time = datetime.datetime.now() Log.result("Diagnostics finished at {0}", finish_time) - Log.result("Elapsed time: {0}\n", finish_time - time) + Log.result("Elapsed time: {0}\n", finish_time - start_time) self.print_errors() self.print_stats() return not self.had_errors -- GitLab From 85a4d9bd585385677aa9e4b6eb497c8d5b36d54c Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Tue, 14 Nov 2017 15:47:58 +0100 Subject: [PATCH 21/47] Fixed bug when no diagnostics where added --- earthdiagnostics/work_manager.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/earthdiagnostics/work_manager.py b/earthdiagnostics/work_manager.py index 110b9f28..33576f7c 100644 --- a/earthdiagnostics/work_manager.py +++ b/earthdiagnostics/work_manager.py @@ -53,7 +53,7 @@ class WorkManager(object): def run(self): if len(self.jobs) == 0: Log.result('No diagnostics to run') - return + return True start_time = datetime.datetime.now() Log.info("Starting to compute at {0}", start_time) -- GitLab From 7be6a500af326287eac8a7cf011fce0db8e6b447 Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Wed, 15 Nov 2017 12:05:57 +0100 Subject: [PATCH 22/47] Fixed region order --- earthdiagnostics/datafile.py | 43 ++++++++++++---------------- earthdiagnostics/ocean/regionmean.py | 4 +-- 2 files changed, 21 insertions(+), 26 deletions(-) diff --git a/earthdiagnostics/datafile.py b/earthdiagnostics/datafile.py index fc3032d5..c7518506 100644 --- a/earthdiagnostics/datafile.py +++ b/earthdiagnostics/datafile.py @@ -186,9 +186,10 @@ class DataFile(Publisher): Log.warning('Link for file {0} can not be created: {1}', self.remote_file, ex) self.storage_status = StorageStatus.READY - def set_local_file(self, local_file, diagnostic=None, rename_var=''): + def set_local_file(self, local_file, diagnostic=None, rename_var='', region=None): if diagnostic in self._modifiers: self._modifiers.remove(diagnostic) + self.region = region.name self.local_file = local_file self.prepare_to_upload(rename_var) self.local_status = LocalStatus.READY @@ -288,29 +289,23 @@ class DataFile(Publisher): self._update_var_with_region_data() self._correct_metadata() Utils.nco.ncks(input=self.local_file, output=self.local_file, options=['--fix_rec_dmn region']) - # handler = Utils.openCdf(self.local_file) - # regions = handler.variables('region')[...].tolist() - # ordered_regions = regions.sorted() - # new_indexes = [ordered_regions.index(region) for region in regions] - # - # for var in handler.variables.values(): - # if 'region' not in var.dimensions(): - # continue - # var_ordered = np.moveaxis(var[...], range(len(regions)), new_indexes) - # handler.close() - # - # pass - # - # for x, region in enumerate(regions): - # Utils.nco.ncks(input=self.local_file, output=self.local_file, options=['--fix_rec_dmn region']) - # handler = Utils.openCdf(self.local_file) - # current = handler.variables['region'][...].tolist().index(region) - # handler.close() - # if current != x: - # Utils.nco.ncap2(input=self.local_file, output=self.local_file, - # options=('-s "region({0})=region({1})'.format(x, current),)) - # pass - + handler = Utils.openCdf(self.local_file) + regions = handler.variables['region'][...].tolist() + if len(regions) > 1: + ordered_regions = sorted(regions) + print(regions) + print(ordered_regions) + new_indexes = [regions.index(region) for region in ordered_regions] + print(new_indexes) + + for var in handler.variables.values(): + if 'region' not in var.dimensions: + continue + index_region = var.dimensions.index('region') + var_values = var[...] + var_ordered = np.take(var_values, new_indexes, index_region) + var[...] = var_ordered + handler.close() def _update_var_with_region_data(self): temp = TempFile.get() diff --git a/earthdiagnostics/ocean/regionmean.py b/earthdiagnostics/ocean/regionmean.py index bb4b93c8..edc5e212 100644 --- a/earthdiagnostics/ocean/regionmean.py +++ b/earthdiagnostics/ocean/regionmean.py @@ -60,7 +60,7 @@ class RegionMean(Diagnostic): def __str__(self): return 'Region mean Startdate: {0.startdate} Member: {0.member} Chunk: {0.chunk} Variable: {0.variable} ' \ 'Grid point: {0.grid_point} Box: {0.box} Save 3D: {0.save3d} Save variance: {0.variance} ' \ - 'Original grid: {0.grid}'.format(self) + 'Original grid: {0.grid} Basin: {0.basin}'.format(self) @classmethod def generate_jobs(cls, diags, options): @@ -166,7 +166,7 @@ class RegionMean(Diagnostic): if hasattr(var_handler, 'valid_max'): del var_handler.valid_max handler.close() - self.declared[final_name].set_local_file(temp2, diagnostic=self, rename_var=original_name) + self.declared[final_name].set_local_file(temp2, diagnostic=self, rename_var=original_name, region=self.basin) def declare_var(self, var, threed, box_save): if threed: -- GitLab From c4db94ff375df87f06c73d0e5f362cf5856bb637 Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Wed, 15 Nov 2017 15:27:48 +0100 Subject: [PATCH 23/47] First version of namelist based cdftools --- earthdiagnostics/CDFTOOLS_CMIP6.namlist | 211 ++++++++++++++++++++ earthdiagnostics/CDFTOOLS_PRIMAVERA.namlist | 211 ++++++++++++++++++++ earthdiagnostics/cdftools.py | 12 +- earthdiagnostics/config.py | 5 + earthdiagnostics/earthdiags.py | 8 +- earthdiagnostics/ocean/interpolatecdo.py | 32 ++- earthdiagnostics/ocean/regionsum.py | 172 ++++++++++++++++ 7 files changed, 639 insertions(+), 12 deletions(-) create mode 100644 earthdiagnostics/CDFTOOLS_CMIP6.namlist create mode 100644 earthdiagnostics/CDFTOOLS_PRIMAVERA.namlist create mode 100644 earthdiagnostics/ocean/regionsum.py diff --git a/earthdiagnostics/CDFTOOLS_CMIP6.namlist b/earthdiagnostics/CDFTOOLS_CMIP6.namlist new file mode 100644 index 00000000..7f607659 --- /dev/null +++ b/earthdiagnostics/CDFTOOLS_CMIP6.namlist @@ -0,0 +1,211 @@ + ! Thu Jun 30 16:19:27 2016 + ! Namelist automatically generated by PrintCdfNames + ! Do not edit without changing its name ... + ! ------------------------------------------ + &NAMDIM + CN_X = i + , + CN_Y = j + , + CN_Z = lev + , + CN_T = time + + / + &NAMDIMVAR + CN_VLON2D = longitude + , + CN_VLAT2D = latitude + , + CN_VDEPTHT = lev + , + CN_VDEPTHU = lev + , + CN_VDEPTHV = lev + , + CN_VDEPTHW = lev + , + CN_VTIMEC = time + , + CN_MISSING_VALUE = _FillValue + + / + &NAMMETRICS + CN_VE1T = e1t + , + CN_VE1U = e1u + , + CN_VE1V = e1v + , + CN_VE1F = e1f + , + CN_VE2T = e2t + , + CN_VE2U = e2u + , + CN_VE2V = e2v + , + CN_VE2F = e2f + , + CN_VE3T = e3t + , + CN_VE3W = e3w + , + CN_VFF = ff + , + CN_GLAMT = glamt + , + CN_GLAMU = glamu + , + CN_GLAMV = glamv + , + CN_GLAMF = glamf + , + CN_GPHIT = gphit + , + CN_GPHIU = gphiu + , + CN_GPHIV = gphiv + , + CN_GPHIF = gphif + , + CN_GDEPT = gdept + , + CN_GDEPW = gdepw + , + CN_HDEPT = hdept + , + CN_HDEPW = hdepw + + / + &NAMVARS + CN_VOTEMPER = votemper + , + CN_VOSALINE = vosaline + , + CN_VOZOCRTX = vozocrtx + , + CN_VOMECRTY = vomecrty + , + CN_VOMEEIVV = vomeeivv + , + CN_VOVECRTZ = vovecrtz + , + CN_SOSSHEIG = sossheig + , + CN_SOMXL010 = somxl010 + , + CN_SOMXLT02 = somxlt02 + , + CN_SOHEFLDO = sohefldo + , + CN_SOLHFLUP = solhflup + , + CN_SOSBHFUP = sosbhfup + , + CN_SOLWFLDO = solwfldo + , + CN_SOSHFLDO = soshfldo + , + CN_SOWAFLUP = sowaflup + , + CN_SOWAFLCD = sowaflcd + , + CN_SOWAFLDP = sowafldp + , + CN_IOWAFLUP = iowaflup + , + CN_ZOMSFATL = zomsfatl + , + CN_ZOMSFGLO = zomsfglo + , + CN_ZOMSFPAC = zomsfpac + , + CN_ZOMSFINP = zomsfinp + , + CN_ZOMSFIND = zomsfind + , + CN_ZOISOATL = zoisoatl + , + CN_ZOISOGLO = zoisoglo + , + CN_ZOISOPAC = zoisopac + , + CN_ZOISOINP = zoisoinp + , + CN_ZOISOIND = zoisoind + , + CN_VOZOUT = vozout + , + CN_VOMEVT = vomevt + , + CN_VOZOUS = vozous + , + CN_VOMEVS = vomevs + , + CN_SOZOUT = sozout + , + CN_SOMEVT = somevt + , + CN_SOZOUS = sozous + , + CN_SOMEVS = somevs + , + CN_SOZOUTRP = sozoutrp + , + CN_SOMEVTRP = somevtrp + , + CN_SOICECOV = soicecov + , + CN_VOSIGMA0 = vosigma0 + , + CN_VOSIGMAI = vosigmai + , + CN_VOSIGNTR = vosigntr + , + CN_VODEPISO = vodepiso + , + CN_ISOTHICK = isothick + , + CN_IICETHIC = iicethic + , + CN_ILEADFRA = ileadfra + , + CN_INVCFC = INVCFC + , + CN_CFC11 = CFC11 + , + CN_PENDEP = pendep + + / + &NAMBATHY + CN_FBATHYMET = bathy_meter.nc + , + CN_FBATHYLEV = bathy_level.nc + , + CN_BATHYMET = Bathymetry + , + CN_BATHYLEV = bathy_level + , + CN_MBATHY = mbathy + + / + ! Namelist entry namsqdvar needs manual formating before + ! it can be used as input : put variables names in between ' + ! and separate variables by , + &NAMSQDVAR + NN_SQDVAR = 4, + CN_SQDVAR = vozocrtx vomecrty vovecrtz sossheig + / + &NAMMESHMASK + CN_FZGR = mesh_zgr.nc + , + CN_FHGR = mesh_hgr.nc + , + CN_FMSK = mask.nc + , + CN_FCOO = coordinates.nc + , + CN_FBASINS = new_maskglo.nc + + / diff --git a/earthdiagnostics/CDFTOOLS_PRIMAVERA.namlist b/earthdiagnostics/CDFTOOLS_PRIMAVERA.namlist new file mode 100644 index 00000000..7f607659 --- /dev/null +++ b/earthdiagnostics/CDFTOOLS_PRIMAVERA.namlist @@ -0,0 +1,211 @@ + ! Thu Jun 30 16:19:27 2016 + ! Namelist automatically generated by PrintCdfNames + ! Do not edit without changing its name ... + ! ------------------------------------------ + &NAMDIM + CN_X = i + , + CN_Y = j + , + CN_Z = lev + , + CN_T = time + + / + &NAMDIMVAR + CN_VLON2D = longitude + , + CN_VLAT2D = latitude + , + CN_VDEPTHT = lev + , + CN_VDEPTHU = lev + , + CN_VDEPTHV = lev + , + CN_VDEPTHW = lev + , + CN_VTIMEC = time + , + CN_MISSING_VALUE = _FillValue + + / + &NAMMETRICS + CN_VE1T = e1t + , + CN_VE1U = e1u + , + CN_VE1V = e1v + , + CN_VE1F = e1f + , + CN_VE2T = e2t + , + CN_VE2U = e2u + , + CN_VE2V = e2v + , + CN_VE2F = e2f + , + CN_VE3T = e3t + , + CN_VE3W = e3w + , + CN_VFF = ff + , + CN_GLAMT = glamt + , + CN_GLAMU = glamu + , + CN_GLAMV = glamv + , + CN_GLAMF = glamf + , + CN_GPHIT = gphit + , + CN_GPHIU = gphiu + , + CN_GPHIV = gphiv + , + CN_GPHIF = gphif + , + CN_GDEPT = gdept + , + CN_GDEPW = gdepw + , + CN_HDEPT = hdept + , + CN_HDEPW = hdepw + + / + &NAMVARS + CN_VOTEMPER = votemper + , + CN_VOSALINE = vosaline + , + CN_VOZOCRTX = vozocrtx + , + CN_VOMECRTY = vomecrty + , + CN_VOMEEIVV = vomeeivv + , + CN_VOVECRTZ = vovecrtz + , + CN_SOSSHEIG = sossheig + , + CN_SOMXL010 = somxl010 + , + CN_SOMXLT02 = somxlt02 + , + CN_SOHEFLDO = sohefldo + , + CN_SOLHFLUP = solhflup + , + CN_SOSBHFUP = sosbhfup + , + CN_SOLWFLDO = solwfldo + , + CN_SOSHFLDO = soshfldo + , + CN_SOWAFLUP = sowaflup + , + CN_SOWAFLCD = sowaflcd + , + CN_SOWAFLDP = sowafldp + , + CN_IOWAFLUP = iowaflup + , + CN_ZOMSFATL = zomsfatl + , + CN_ZOMSFGLO = zomsfglo + , + CN_ZOMSFPAC = zomsfpac + , + CN_ZOMSFINP = zomsfinp + , + CN_ZOMSFIND = zomsfind + , + CN_ZOISOATL = zoisoatl + , + CN_ZOISOGLO = zoisoglo + , + CN_ZOISOPAC = zoisopac + , + CN_ZOISOINP = zoisoinp + , + CN_ZOISOIND = zoisoind + , + CN_VOZOUT = vozout + , + CN_VOMEVT = vomevt + , + CN_VOZOUS = vozous + , + CN_VOMEVS = vomevs + , + CN_SOZOUT = sozout + , + CN_SOMEVT = somevt + , + CN_SOZOUS = sozous + , + CN_SOMEVS = somevs + , + CN_SOZOUTRP = sozoutrp + , + CN_SOMEVTRP = somevtrp + , + CN_SOICECOV = soicecov + , + CN_VOSIGMA0 = vosigma0 + , + CN_VOSIGMAI = vosigmai + , + CN_VOSIGNTR = vosigntr + , + CN_VODEPISO = vodepiso + , + CN_ISOTHICK = isothick + , + CN_IICETHIC = iicethic + , + CN_ILEADFRA = ileadfra + , + CN_INVCFC = INVCFC + , + CN_CFC11 = CFC11 + , + CN_PENDEP = pendep + + / + &NAMBATHY + CN_FBATHYMET = bathy_meter.nc + , + CN_FBATHYLEV = bathy_level.nc + , + CN_BATHYMET = Bathymetry + , + CN_BATHYLEV = bathy_level + , + CN_MBATHY = mbathy + + / + ! Namelist entry namsqdvar needs manual formating before + ! it can be used as input : put variables names in between ' + ! and separate variables by , + &NAMSQDVAR + NN_SQDVAR = 4, + CN_SQDVAR = vozocrtx vomecrty vovecrtz sossheig + / + &NAMMESHMASK + CN_FZGR = mesh_zgr.nc + , + CN_FHGR = mesh_hgr.nc + , + CN_FMSK = mask.nc + , + CN_FCOO = coordinates.nc + , + CN_FBASINS = new_maskglo.nc + + / diff --git a/earthdiagnostics/cdftools.py b/earthdiagnostics/cdftools.py index 36fffdaa..b0d03ae4 100644 --- a/earthdiagnostics/cdftools.py +++ b/earthdiagnostics/cdftools.py @@ -1,8 +1,10 @@ # coding=utf-8 -from earthdiagnostics.utils import Utils import os -from bscearth.utils.log import Log + import six +from bscearth.utils.log import Log + +from earthdiagnostics.utils import Utils class CDFTools(object): @@ -15,6 +17,7 @@ class CDFTools(object): def __init__(self, path=''): self.path = path + self.data_convention = '' # noinspection PyShadowingBuiltins def run(self, command, input, output=None, options=None, log_level=Log.INFO, input_option=None): @@ -52,6 +55,11 @@ class CDFTools(object): line.append('-o') line.append(output) Log.debug('Executing {0}', ' '.join(line)) + namelist_file = os.path.join(os.path.dirname(__file__), 'CDFTOOLS_{0}.namlist'.format(self.data_convention)) + if os.path.isfile(namelist_file): + os.environ['NAM_CDF_NAMES'] = namelist_file + else: + os.environ['NAM_CDF_NAMES'] = None shell_output = Utils.execute_shell_command(line, log_level) self._check_output_was_created(line, output) diff --git a/earthdiagnostics/config.py b/earthdiagnostics/config.py index 96c83702..ece458eb 100644 --- a/earthdiagnostics/config.py +++ b/earthdiagnostics/config.py @@ -6,6 +6,7 @@ from bscearth.utils.config_parser import ConfigParser from bscearth.utils.date import parse_date, chunk_start_date, chunk_end_date, date2str from bscearth.utils.log import Log +from earthdiagnostics import cdftools from earthdiagnostics.frequency import Frequency, Frequencies from earthdiagnostics.variable import VariableManager from modelingrealm import ModelingRealm @@ -63,6 +64,10 @@ class Config(object): self.data_convention = parser.get_choice_option('DIAGNOSTICS', 'DATA_CONVENTION', ('specs', 'primavera', 'cmip6', 'preface'), 'specs', ignore_case=True) + + if self.data_convention in ('primavera', 'cmip6'): + self.scratch_masks = os.path.join(self.scratch_masks, self.data_convention) + cdftools.data_convention = self.data_convention self.var_manager = VariableManager() self.var_manager.load_variables(self.data_convention) self._diags = parser.get_option('DIAGNOSTICS', 'DIAGS') diff --git a/earthdiagnostics/earthdiags.py b/earthdiagnostics/earthdiags.py index b9ef5aa2..1c1494b4 100755 --- a/earthdiagnostics/earthdiags.py +++ b/earthdiagnostics/earthdiags.py @@ -129,8 +129,12 @@ class EarthDiags(object): self.dic_variables['x'] = 'i' self.dic_variables['y'] = 'j' self.dic_variables['z'] = 'lev' - self.dic_variables['nav_lon'] = 'lon' - self.dic_variables['nav_lat'] = 'lat' + if self.config.data_convention.lower() in ['primavera', 'cmip6']: + self.dic_variables['nav_lon'] = 'longitude' + self.dic_variables['nav_lat'] = 'latitude' + else: + self.dic_variables['nav_lon'] = 'lon' + self.dic_variables['nav_lat'] = 'lat' self.dic_variables['nav_lev'] = 'lev' self.dic_variables['time_counter'] = 'time' self.dic_variables['t'] = 'time' diff --git a/earthdiagnostics/ocean/interpolatecdo.py b/earthdiagnostics/ocean/interpolatecdo.py index 1dc0719f..0e203f43 100644 --- a/earthdiagnostics/ocean/interpolatecdo.py +++ b/earthdiagnostics/ocean/interpolatecdo.py @@ -132,34 +132,50 @@ class InterpolateCDO(Diagnostic): @classmethod def get_sample_grid_file(cls): temp = TempFile.get() + + lat_name = 'lat' + handler = Utils.openCdf('mask.nc') + for lat_alias in ['lat', 'latitude']: + if lat_alias in handler.variables: + lat_name = lat_alias + break + + lon_name = None + for lon_alias in ['lon', 'longitude']: + if lon_alias in handler.variables: + lon_name = lon_alias + break + lon_bnds_name = '{0}_bnds'.format(lon_name) + lat_bnds_name = '{0}_bnds'.format(lat_name) + Utils.nco.ncks(input='mask.nc', output=temp, options=('-O -v tmask,lat,lon,gphif,glamf',)) handler = Utils.openCdf(temp) - lon = handler.variables['lon'] + lon = handler.variables[lon_name] lon.units = "degrees_east" lon.long_name = "Longitude" lon.nav_model = "Default grid" lon.standard_name = "longitude" - lon.short_name = "lon" - lon.bounds = 'lon_bnds' + lon.short_name = lon_name + lon.bounds = lon_bnds_name - lat = handler.variables['lat'] + lat = handler.variables[lat_name] lat.units = "degrees_north" lat.long_name = "Latitude" lat.nav_model = "Default grid" lat.standard_name = "latitude" - lat.short_name = "lat" - lat.bounds = 'lat_bnds' + lat.short_name = lat_name + lat.bounds = lat_bnds_name handler.createDimension('bounds', 4) - lon_bnds = handler.createVariable('lon_bnds', lon.datatype, ('j', 'i', 'bounds')) + lon_bnds = handler.createVariable(lon_bnds_name, lon.datatype, ('j', 'i', 'bounds')) corner_lat = handler.variables['glamf'][0, ...] lon_bnds[:, :, 0] = corner_lat lon_bnds[:, :, 1] = np.roll(corner_lat, 1, 0) lon_bnds[:, :, 2] = np.roll(corner_lat, -1, 1) lon_bnds[:, :, 3] = np.roll(lon_bnds[:, :, 1], -1, 1) - lat_bnds = handler.createVariable('lat_bnds', lat.datatype, ('j', 'i', 'bounds')) + lat_bnds = handler.createVariable(lat_bnds_name, lat.datatype, ('j', 'i', 'bounds')) corner_lat = handler.variables['gphif'][0, ...] lat_bnds[:, :, 0] = corner_lat lat_bnds[:, :, 1] = np.roll(corner_lat, 1, 0) diff --git a/earthdiagnostics/ocean/regionsum.py b/earthdiagnostics/ocean/regionsum.py new file mode 100644 index 00000000..52b49f91 --- /dev/null +++ b/earthdiagnostics/ocean/regionsum.py @@ -0,0 +1,172 @@ +# coding=utf-8 +import os + +from earthdiagnostics import cdftools +from earthdiagnostics.box import Box +from earthdiagnostics.constants import Basins +from earthdiagnostics.diagnostic import Diagnostic, DiagnosticOption, DiagnosticIntOption, DiagnosticDomainOption, \ + DiagnosticBoolOption, DiagnosticBasinOption, DiagnosticVariableOption +from earthdiagnostics.modelingrealm import ModelingRealms +from earthdiagnostics.utils import Utils, TempFile + + +class RegionSum(Diagnostic): + """ + Computes the mean value of the field (3D, weighted). For 3D fields, + a horizontal mean for each level is also given. If a spatial window + is specified, the mean value is computed only in this window. + + :original author: Javier Vegas-Regidor + + :created: March 2017 + + :param data_manager: data management object + :type data_manager: DataManager + :param startdate: startdate + :type startdate: str + :param member: member number + :type member: int + :param chunk: chunk's number + :type chunk: int + :param variable: variable to average + :type variable: str + :param box: box used to restrict the vertical mean + :type box: Box + """ + + alias = 'regsum' + "Diagnostic alias for the configuration file" + + def __init__(self, data_manager, startdate, member, chunk, domain, variable, grid_point, box, save3d, basin, + variance, grid): + Diagnostic.__init__(self, data_manager) + self.startdate = startdate + self.member = member + self.chunk = chunk + self.domain = domain + self.variable = variable + self.grid_point = grid_point.upper() + self.box = box + self.save3d = save3d + self.basin = basin + self.variance = variance + self.grid = grid + self.declared = {} + + def __eq__(self, other): + return self.startdate == other.startdate and self.member == other.member and self.chunk == other.chunk and \ + self.box == other.box and self.variable == other.variable + + def __str__(self): + return 'Region sum Startdate: {0.startdate} Member: {0.member} Chunk: {0.chunk} Variable: {0.variable} ' \ + 'Grid point: {0.grid_point} Box: {0.box} Save 3D: {0.save3d}' \ + 'Original grid: {0.grid} Basin: {0.basin}'.format(self) + + @classmethod + def generate_jobs(cls, diags, options): + """ + Creates a job for each chunk to compute the diagnostic + + :param diags: Diagnostics manager class + :type diags: Diags + :param options: variable, minimum depth (level), maximum depth (level) + :type options: list[str] + :return: + """ + options_available = (DiagnosticDomainOption(), + DiagnosticVariableOption(diags.data_manager.config.var_manager), + DiagnosticOption('grid_point', 'T'), + DiagnosticBasinOption('basin', Basins().Global), + DiagnosticIntOption('min_depth', 0), + DiagnosticIntOption('max_depth', 0), + DiagnosticBoolOption('save3D', True), + DiagnosticOption('grid', '')) + options = cls.process_options(options, options_available) + + box = Box() + box.min_depth = options['min_depth'] + box.max_depth = options['max_depth'] + + job_list = list() + for startdate, member, chunk in diags.config.experiment.get_chunk_list(): + job_list.append(RegionSum(diags.data_manager, startdate, member, chunk, + options['domain'], options['variable'], options['grid_point'], box, + options['save3D'], options['basin'], options['variance'], options['grid'])) + return job_list + + def request_data(self): + self.variable_file = self.request_chunk(self.domain, self.variable, self.startdate, self.member, self.chunk, + grid=self.grid) + + def declare_data_generated(self): + if self.box.min_depth == 0: + # To cdftools, this means all levels + box_save = None + else: + box_save = self.box + + self.declare_var('sum', False, box_save) + self.declare_var('sum', True, box_save) + + def compute(self): + """ + Runs the diagnostic + """ + mean_file = TempFile.get() + + variable_file = self.variable_file.local_file + + handler = Utils.openCdf(variable_file) + self.save3d &= 'lev' in handler.dimensions + handler.close() + + cdfmean_options = [self.variable, self.grid_point, 0, 0, 0, 0, self.box.min_depth, self.box.max_depth] + if self.variance: + cdfmean_options += ['-var'] + if self.basin != Basins().Global: + cdfmean_options.append('-M') + cdfmean_options.append('mask_regions.3d.nc') + cdfmean_options.append(self.basin.name) + + cdftools.run('cdfsum', input=variable_file, output=mean_file, options=cdfmean_options) + Utils.rename_variables(mean_file, {'gdept': 'lev', 'gdepw': 'lev'}, must_exist=False, rename_dimension=True) + + self.send_var('mean', False, mean_file) + self.send_var('mean', True, mean_file) + + os.remove(mean_file) + + def send_var(self, var, threed, mean_file): + if threed: + if not self.save3d: + return False + original_name = '{0}_{1}'.format(var, self.variable) + final_name = '{1}3d{0}'.format(var, self.variable) + levels = ',lev' + else: + original_name = '{0}_3D{1}'.format(var, self.variable) + final_name = '{1}{0}'.format(var, self.variable) + levels = '' + + temp2 = TempFile.get() + Utils.nco.ncks(input=mean_file, output=temp2, options=('-v {0},lat,lon{1}'.format(original_name, levels),)) + handler = Utils.openCdf(temp2) + var_handler = handler.variables[original_name] + if hasattr(var_handler, 'valid_min'): + del var_handler.valid_min + if hasattr(var_handler, 'valid_max'): + del var_handler.valid_max + handler.close() + self.declared[final_name].set_local_file(temp2, diagnostic=self, rename_var=original_name, region=self.basin) + + def declare_var(self, var, threed, box_save): + if threed: + if not self.save3d: + return False + final_name = '{1}3d{0}'.format(var, self.variable) + else: + final_name = '{1}{0}'.format(var, self.variable) + + self.declared[final_name] = self.declare_chunk(ModelingRealms.ocean, final_name, self.startdate, self.member, + self.chunk, box=box_save, region=self.basin, grid=self.grid) + -- GitLab From 04278c664d57b362d331a922fb5ded3332c92d9b Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Wed, 15 Nov 2017 16:18:38 +0100 Subject: [PATCH 24/47] Fixed namelist activation --- .../{CDFTOOLS_CMIP6.namlist => CDFTOOLS_cmip6.namlist} | 0 ...DFTOOLS_PRIMAVERA.namlist => CDFTOOLS_primavera.namlist} | 6 +++--- earthdiagnostics/cdftools.py | 6 +----- earthdiagnostics/config.py | 6 ++++++ earthdiagnostics/ocean/interpolatecdo.py | 5 +++-- earthdiagnostics/utils.py | 3 +-- 6 files changed, 14 insertions(+), 12 deletions(-) rename earthdiagnostics/{CDFTOOLS_CMIP6.namlist => CDFTOOLS_cmip6.namlist} (100%) rename earthdiagnostics/{CDFTOOLS_PRIMAVERA.namlist => CDFTOOLS_primavera.namlist} (99%) diff --git a/earthdiagnostics/CDFTOOLS_CMIP6.namlist b/earthdiagnostics/CDFTOOLS_cmip6.namlist similarity index 100% rename from earthdiagnostics/CDFTOOLS_CMIP6.namlist rename to earthdiagnostics/CDFTOOLS_cmip6.namlist diff --git a/earthdiagnostics/CDFTOOLS_PRIMAVERA.namlist b/earthdiagnostics/CDFTOOLS_primavera.namlist similarity index 99% rename from earthdiagnostics/CDFTOOLS_PRIMAVERA.namlist rename to earthdiagnostics/CDFTOOLS_primavera.namlist index 7f607659..d9abb15e 100644 --- a/earthdiagnostics/CDFTOOLS_PRIMAVERA.namlist +++ b/earthdiagnostics/CDFTOOLS_primavera.namlist @@ -3,11 +3,11 @@ ! Do not edit without changing its name ... ! ------------------------------------------ &NAMDIM - CN_X = i + CN_X = "i" , - CN_Y = j + CN_Y = "j" , - CN_Z = lev + CN_Z = "lev" , CN_T = time diff --git a/earthdiagnostics/cdftools.py b/earthdiagnostics/cdftools.py index b0d03ae4..ad0355c3 100644 --- a/earthdiagnostics/cdftools.py +++ b/earthdiagnostics/cdftools.py @@ -55,11 +55,7 @@ class CDFTools(object): line.append('-o') line.append(output) Log.debug('Executing {0}', ' '.join(line)) - namelist_file = os.path.join(os.path.dirname(__file__), 'CDFTOOLS_{0}.namlist'.format(self.data_convention)) - if os.path.isfile(namelist_file): - os.environ['NAM_CDF_NAMES'] = namelist_file - else: - os.environ['NAM_CDF_NAMES'] = None + shell_output = Utils.execute_shell_command(line, log_level) self._check_output_was_created(line, output) diff --git a/earthdiagnostics/config.py b/earthdiagnostics/config.py index ece458eb..f3c8d638 100644 --- a/earthdiagnostics/config.py +++ b/earthdiagnostics/config.py @@ -68,6 +68,12 @@ class Config(object): if self.data_convention in ('primavera', 'cmip6'): self.scratch_masks = os.path.join(self.scratch_masks, self.data_convention) cdftools.data_convention = self.data_convention + namelist_file = os.path.join(os.path.dirname(__file__), 'CDFTOOLS_{0}.namlist'.format(self.data_convention)) + Log.debug(namelist_file) + if os.path.isfile(namelist_file): + Log.debug('Setting namelist {0}', namelist_file) + os.environ['NAM_CDF_NAMES'] = namelist_file + self.var_manager = VariableManager() self.var_manager.load_variables(self.data_convention) self._diags = parser.get_option('DIAGNOSTICS', 'DIAGS') diff --git a/earthdiagnostics/ocean/interpolatecdo.py b/earthdiagnostics/ocean/interpolatecdo.py index 0e203f43..b8b81620 100644 --- a/earthdiagnostics/ocean/interpolatecdo.py +++ b/earthdiagnostics/ocean/interpolatecdo.py @@ -148,7 +148,8 @@ class InterpolateCDO(Diagnostic): lon_bnds_name = '{0}_bnds'.format(lon_name) lat_bnds_name = '{0}_bnds'.format(lat_name) - Utils.nco.ncks(input='mask.nc', output=temp, options=('-O -v tmask,lat,lon,gphif,glamf',)) + Utils.nco.ncks(input='mask.nc', output=temp, + options=('-O -v tmask,{0},{1},gphif,glamf'.format(lat_name, lon_name),)) handler = Utils.openCdf(temp) lon = handler.variables[lon_name] lon.units = "degrees_east" @@ -185,7 +186,7 @@ class InterpolateCDO(Diagnostic): lat_bnds[0, :, 3] = lat_bnds[1, 0, 3] - 1 tmask = handler.variables['tmask'] - tmask.coordinates = 'time lev lat lon' + tmask.coordinates = 'time lev {0} {1}'.format(lat_name, lon_name) handler.close() diff --git a/earthdiagnostics/utils.py b/earthdiagnostics/utils.py index b0629f78..54e927bd 100644 --- a/earthdiagnostics/utils.py +++ b/earthdiagnostics/utils.py @@ -386,8 +386,7 @@ class Utils(object): Log.log.log(log_level, line) output.append(line) if process.returncode != 0: - raise Utils.ExecutionError('Error executing {0}\n Return code: {1}'.format(' '.join(command), - process.returncode)) + raise Utils.ExecutionError('Error executing {0}\n Return code: {1}'.format(' '.join(command), process.returncode)) return output _cpu_count = None -- GitLab From d514269e8ab9bc06821270ceb5632c07951ac101 Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Wed, 15 Nov 2017 16:50:08 +0100 Subject: [PATCH 25/47] Fixed cdftools namelist --- earthdiagnostics/CDFTOOLS_cmip6.namlist | 204 ++++++++++---------- earthdiagnostics/CDFTOOLS_primavera.namlist | 184 +++++++++--------- 2 files changed, 194 insertions(+), 194 deletions(-) diff --git a/earthdiagnostics/CDFTOOLS_cmip6.namlist b/earthdiagnostics/CDFTOOLS_cmip6.namlist index 7f607659..95eda2b1 100644 --- a/earthdiagnostics/CDFTOOLS_cmip6.namlist +++ b/earthdiagnostics/CDFTOOLS_cmip6.namlist @@ -3,209 +3,209 @@ ! Do not edit without changing its name ... ! ------------------------------------------ &NAMDIM - CN_X = i + CN_X = "i" , - CN_Y = j + CN_Y = "j" , - CN_Z = lev + CN_Z = "lev" , - CN_T = time - + CN_T = "time" + / &NAMDIMVAR - CN_VLON2D = longitude + CN_VLON2D = "longitude" , - CN_VLAT2D = latitude + CN_VLAT2D = "latitude" , - CN_VDEPTHT = lev + CN_VDEPTHT = "lev" , - CN_VDEPTHU = lev + CN_VDEPTHU = "lev" , - CN_VDEPTHV = lev + CN_VDEPTHV = "lev" , - CN_VDEPTHW = lev + CN_VDEPTHW = "lev" , - CN_VTIMEC = time + CN_VTIMEC = "time" , - CN_MISSING_VALUE = _FillValue - + CN_MISSING_VALUE = "_FillValue" + / &NAMMETRICS - CN_VE1T = e1t + CN_VE1T = "e1t" , - CN_VE1U = e1u + CN_VE1U = "e1u" , - CN_VE1V = e1v + CN_VE1V = "e1v" , - CN_VE1F = e1f + CN_VE1F = "e1f" , - CN_VE2T = e2t + CN_VE2T = "e2t" , - CN_VE2U = e2u + CN_VE2U = "e2u" , - CN_VE2V = e2v + CN_VE2V = "e2v" , - CN_VE2F = e2f + CN_VE2F = "e2f" , - CN_VE3T = e3t + CN_VE3T = "e3t" , - CN_VE3W = e3w + CN_VE3W = "e3w" , - CN_VFF = ff + CN_VFF = "ff" , - CN_GLAMT = glamt + CN_GLAMT = "glamt" , - CN_GLAMU = glamu + CN_GLAMU = "glamu" , - CN_GLAMV = glamv + CN_GLAMV = "glamv" , - CN_GLAMF = glamf + CN_GLAMF = "glamf" , - CN_GPHIT = gphit + CN_GPHIT = "gphit" , - CN_GPHIU = gphiu + CN_GPHIU = "gphiu" , - CN_GPHIV = gphiv + CN_GPHIV = "gphiv" , - CN_GPHIF = gphif + CN_GPHIF = "gphif" , - CN_GDEPT = gdept + CN_GDEPT = "gdept" , - CN_GDEPW = gdepw + CN_GDEPW = "gdepw" , - CN_HDEPT = hdept + CN_HDEPT = "hdept" , - CN_HDEPW = hdepw - + CN_HDEPW = "hdepw" + / &NAMVARS - CN_VOTEMPER = votemper + CN_VOTEMPER = "votemper" , - CN_VOSALINE = vosaline + CN_VOSALINE = "vosaline" , - CN_VOZOCRTX = vozocrtx + CN_VOZOCRTX = "vozocrtx" , - CN_VOMECRTY = vomecrty + CN_VOMECRTY = "vomecrty" , - CN_VOMEEIVV = vomeeivv + CN_VOMEEIVV = "vomeeivv" , - CN_VOVECRTZ = vovecrtz + CN_VOVECRTZ = "vovecrtz" , - CN_SOSSHEIG = sossheig + CN_SOSSHEIG = "sossheig" , - CN_SOMXL010 = somxl010 + CN_SOMXL010 = "somxl010" , - CN_SOMXLT02 = somxlt02 + CN_SOMXLT02 = "somxlt02" , - CN_SOHEFLDO = sohefldo + CN_SOHEFLDO = "sohefldo" , - CN_SOLHFLUP = solhflup + CN_SOLHFLUP = "solhflup" , - CN_SOSBHFUP = sosbhfup + CN_SOSBHFUP = "sosbhfup" , - CN_SOLWFLDO = solwfldo + CN_SOLWFLDO = "solwfldo" , - CN_SOSHFLDO = soshfldo + CN_SOSHFLDO = "soshfldo" , - CN_SOWAFLUP = sowaflup + CN_SOWAFLUP = "sowaflup" , - CN_SOWAFLCD = sowaflcd + CN_SOWAFLCD = "sowaflcd" , - CN_SOWAFLDP = sowafldp + CN_SOWAFLDP = "sowafldp" , - CN_IOWAFLUP = iowaflup + CN_IOWAFLUP = "iowaflup" , - CN_ZOMSFATL = zomsfatl + CN_ZOMSFATL = "zomsfatl" , - CN_ZOMSFGLO = zomsfglo + CN_ZOMSFGLO = "zomsfglo" , - CN_ZOMSFPAC = zomsfpac + CN_ZOMSFPAC = "zomsfpac" , - CN_ZOMSFINP = zomsfinp + CN_ZOMSFINP = "zomsfinp" , - CN_ZOMSFIND = zomsfind + CN_ZOMSFIND = "zomsfind" , - CN_ZOISOATL = zoisoatl + CN_ZOISOATL = "zoisoatl" , - CN_ZOISOGLO = zoisoglo + CN_ZOISOGLO = "zoisoglo" , - CN_ZOISOPAC = zoisopac + CN_ZOISOPAC = "zoisopac" , - CN_ZOISOINP = zoisoinp + CN_ZOISOINP = "zoisoinp" , - CN_ZOISOIND = zoisoind + CN_ZOISOIND = "zoisoind" , - CN_VOZOUT = vozout + CN_VOZOUT = "vozout" , - CN_VOMEVT = vomevt + CN_VOMEVT = "vomevt" , - CN_VOZOUS = vozous + CN_VOZOUS = "vozous" , - CN_VOMEVS = vomevs + CN_VOMEVS = "vomevs" , - CN_SOZOUT = sozout + CN_SOZOUT = "sozout" , - CN_SOMEVT = somevt + CN_SOMEVT = "somevt" , - CN_SOZOUS = sozous + CN_SOZOUS = "sozous" , - CN_SOMEVS = somevs + CN_SOMEVS = "somevs" , - CN_SOZOUTRP = sozoutrp + CN_SOZOUTRP = "sozoutrp" , - CN_SOMEVTRP = somevtrp + CN_SOMEVTRP = "somevtrp" , - CN_SOICECOV = soicecov + CN_SOICECOV = "soicecov" , - CN_VOSIGMA0 = vosigma0 + CN_VOSIGMA0 = "vosigma0" , - CN_VOSIGMAI = vosigmai + CN_VOSIGMAI = "vosigmai" , - CN_VOSIGNTR = vosigntr + CN_VOSIGNTR = "vosigntr" , - CN_VODEPISO = vodepiso + CN_VODEPISO = "vodepiso" , - CN_ISOTHICK = isothick + CN_ISOTHICK = "isothick" , - CN_IICETHIC = iicethic + CN_IICETHIC = "iicethic" , - CN_ILEADFRA = ileadfra + CN_ILEADFRA = "ileadfra" , - CN_INVCFC = INVCFC + CN_INVCFC = "INVCFC" , - CN_CFC11 = CFC11 + CN_CFC11 = "CFC11" , - CN_PENDEP = pendep - + CN_PENDEP = "pendep" + / &NAMBATHY - CN_FBATHYMET = bathy_meter.nc + CN_FBATHYMET = "bathy_meter.nc" , - CN_FBATHYLEV = bathy_level.nc + CN_FBATHYLEV = "bathy_level.nc" , - CN_BATHYMET = Bathymetry + CN_BATHYMET = "Bathymetry" , - CN_BATHYLEV = bathy_level + CN_BATHYLEV = "bathy_level" , - CN_MBATHY = mbathy - + CN_MBATHY = "mbathy" + / ! Namelist entry namsqdvar needs manual formating before - ! it can be used as input : put variables names in between ' - ! and separate variables by , + ! it can be used as input : put variables names in between ' + ! and separate variables by , &NAMSQDVAR NN_SQDVAR = 4, - CN_SQDVAR = vozocrtx vomecrty vovecrtz sossheig + CN_SQDVAR = "vozocrtx vomecrty vovecrtz sossheig" , / &NAMMESHMASK - CN_FZGR = mesh_zgr.nc + CN_FZGR = "mesh_zgr.nc" , - CN_FHGR = mesh_hgr.nc + CN_FHGR = "mesh_hgr.nc" , - CN_FMSK = mask.nc + CN_FMSK = "mask.nc" , - CN_FCOO = coordinates.nc + CN_FCOO = "coordinates.nc" , - CN_FBASINS = new_maskglo.nc + CN_FBASINS = "new_maskglo.nc" / diff --git a/earthdiagnostics/CDFTOOLS_primavera.namlist b/earthdiagnostics/CDFTOOLS_primavera.namlist index d9abb15e..7a890404 100644 --- a/earthdiagnostics/CDFTOOLS_primavera.namlist +++ b/earthdiagnostics/CDFTOOLS_primavera.namlist @@ -9,185 +9,185 @@ , CN_Z = "lev" , - CN_T = time + CN_T = "time" / &NAMDIMVAR - CN_VLON2D = longitude + CN_VLON2D = "longitude" , - CN_VLAT2D = latitude + CN_VLAT2D = "latitude" , - CN_VDEPTHT = lev + CN_VDEPTHT = "lev" , - CN_VDEPTHU = lev + CN_VDEPTHU = "lev" , - CN_VDEPTHV = lev + CN_VDEPTHV = "lev" , - CN_VDEPTHW = lev + CN_VDEPTHW = "lev" , - CN_VTIMEC = time + CN_VTIMEC = "time" , - CN_MISSING_VALUE = _FillValue + CN_MISSING_VALUE = "_FillValue" / &NAMMETRICS - CN_VE1T = e1t + CN_VE1T = "e1t" , - CN_VE1U = e1u + CN_VE1U = "e1u" , - CN_VE1V = e1v + CN_VE1V = "e1v" , - CN_VE1F = e1f + CN_VE1F = "e1f" , - CN_VE2T = e2t + CN_VE2T = "e2t" , - CN_VE2U = e2u + CN_VE2U = "e2u" , - CN_VE2V = e2v + CN_VE2V = "e2v" , - CN_VE2F = e2f + CN_VE2F = "e2f" , - CN_VE3T = e3t + CN_VE3T = "e3t" , - CN_VE3W = e3w + CN_VE3W = "e3w" , - CN_VFF = ff + CN_VFF = "ff" , - CN_GLAMT = glamt + CN_GLAMT = "glamt" , - CN_GLAMU = glamu + CN_GLAMU = "glamu" , - CN_GLAMV = glamv + CN_GLAMV = "glamv" , - CN_GLAMF = glamf + CN_GLAMF = "glamf" , - CN_GPHIT = gphit + CN_GPHIT = "gphit" , - CN_GPHIU = gphiu + CN_GPHIU = "gphiu" , - CN_GPHIV = gphiv + CN_GPHIV = "gphiv" , - CN_GPHIF = gphif + CN_GPHIF = "gphif" , - CN_GDEPT = gdept + CN_GDEPT = "gdept" , - CN_GDEPW = gdepw + CN_GDEPW = "gdepw" , - CN_HDEPT = hdept + CN_HDEPT = "hdept" , - CN_HDEPW = hdepw + CN_HDEPW = "hdepw" / &NAMVARS - CN_VOTEMPER = votemper + CN_VOTEMPER = "votemper" , - CN_VOSALINE = vosaline + CN_VOSALINE = "vosaline" , - CN_VOZOCRTX = vozocrtx + CN_VOZOCRTX = "vozocrtx" , - CN_VOMECRTY = vomecrty + CN_VOMECRTY = "vomecrty" , - CN_VOMEEIVV = vomeeivv + CN_VOMEEIVV = "vomeeivv" , - CN_VOVECRTZ = vovecrtz + CN_VOVECRTZ = "vovecrtz" , - CN_SOSSHEIG = sossheig + CN_SOSSHEIG = "sossheig" , - CN_SOMXL010 = somxl010 + CN_SOMXL010 = "somxl010" , - CN_SOMXLT02 = somxlt02 + CN_SOMXLT02 = "somxlt02" , - CN_SOHEFLDO = sohefldo + CN_SOHEFLDO = "sohefldo" , - CN_SOLHFLUP = solhflup + CN_SOLHFLUP = "solhflup" , - CN_SOSBHFUP = sosbhfup + CN_SOSBHFUP = "sosbhfup" , - CN_SOLWFLDO = solwfldo + CN_SOLWFLDO = "solwfldo" , - CN_SOSHFLDO = soshfldo + CN_SOSHFLDO = "soshfldo" , - CN_SOWAFLUP = sowaflup + CN_SOWAFLUP = "sowaflup" , - CN_SOWAFLCD = sowaflcd + CN_SOWAFLCD = "sowaflcd" , - CN_SOWAFLDP = sowafldp + CN_SOWAFLDP = "sowafldp" , - CN_IOWAFLUP = iowaflup + CN_IOWAFLUP = "iowaflup" , - CN_ZOMSFATL = zomsfatl + CN_ZOMSFATL = "zomsfatl" , - CN_ZOMSFGLO = zomsfglo + CN_ZOMSFGLO = "zomsfglo" , - CN_ZOMSFPAC = zomsfpac + CN_ZOMSFPAC = "zomsfpac" , - CN_ZOMSFINP = zomsfinp + CN_ZOMSFINP = "zomsfinp" , - CN_ZOMSFIND = zomsfind + CN_ZOMSFIND = "zomsfind" , - CN_ZOISOATL = zoisoatl + CN_ZOISOATL = "zoisoatl" , - CN_ZOISOGLO = zoisoglo + CN_ZOISOGLO = "zoisoglo" , - CN_ZOISOPAC = zoisopac + CN_ZOISOPAC = "zoisopac" , - CN_ZOISOINP = zoisoinp + CN_ZOISOINP = "zoisoinp" , - CN_ZOISOIND = zoisoind + CN_ZOISOIND = "zoisoind" , - CN_VOZOUT = vozout + CN_VOZOUT = "vozout" , - CN_VOMEVT = vomevt + CN_VOMEVT = "vomevt" , - CN_VOZOUS = vozous + CN_VOZOUS = "vozous" , - CN_VOMEVS = vomevs + CN_VOMEVS = "vomevs" , - CN_SOZOUT = sozout + CN_SOZOUT = "sozout" , - CN_SOMEVT = somevt + CN_SOMEVT = "somevt" , - CN_SOZOUS = sozous + CN_SOZOUS = "sozous" , - CN_SOMEVS = somevs + CN_SOMEVS = "somevs" , - CN_SOZOUTRP = sozoutrp + CN_SOZOUTRP = "sozoutrp" , - CN_SOMEVTRP = somevtrp + CN_SOMEVTRP = "somevtrp" , - CN_SOICECOV = soicecov + CN_SOICECOV = "soicecov" , - CN_VOSIGMA0 = vosigma0 + CN_VOSIGMA0 = "vosigma0" , - CN_VOSIGMAI = vosigmai + CN_VOSIGMAI = "vosigmai" , - CN_VOSIGNTR = vosigntr + CN_VOSIGNTR = "vosigntr" , - CN_VODEPISO = vodepiso + CN_VODEPISO = "vodepiso" , - CN_ISOTHICK = isothick + CN_ISOTHICK = "isothick" , - CN_IICETHIC = iicethic + CN_IICETHIC = "iicethic" , - CN_ILEADFRA = ileadfra + CN_ILEADFRA = "ileadfra" , - CN_INVCFC = INVCFC + CN_INVCFC = "INVCFC" , - CN_CFC11 = CFC11 + CN_CFC11 = "CFC11" , - CN_PENDEP = pendep + CN_PENDEP = "pendep" / &NAMBATHY - CN_FBATHYMET = bathy_meter.nc + CN_FBATHYMET = "bathy_meter.nc" , - CN_FBATHYLEV = bathy_level.nc + CN_FBATHYLEV = "bathy_level.nc" , - CN_BATHYMET = Bathymetry + CN_BATHYMET = "Bathymetry" , - CN_BATHYLEV = bathy_level + CN_BATHYLEV = "bathy_level" , - CN_MBATHY = mbathy + CN_MBATHY = "mbathy" / ! Namelist entry namsqdvar needs manual formating before @@ -195,17 +195,17 @@ ! and separate variables by , &NAMSQDVAR NN_SQDVAR = 4, - CN_SQDVAR = vozocrtx vomecrty vovecrtz sossheig + CN_SQDVAR = "vozocrtx vomecrty vovecrtz sossheig" , / &NAMMESHMASK - CN_FZGR = mesh_zgr.nc + CN_FZGR = "mesh_zgr.nc" , - CN_FHGR = mesh_hgr.nc + CN_FHGR = "mesh_hgr.nc" , - CN_FMSK = mask.nc + CN_FMSK = "mask.nc" , - CN_FCOO = coordinates.nc + CN_FCOO = "coordinates.nc" , - CN_FBASINS = new_maskglo.nc + CN_FBASINS = "new_maskglo.nc" / -- GitLab From dff5ebc407e666c50bdb0cc488dbae28d61187fb Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Thu, 16 Nov 2017 12:52:41 +0100 Subject: [PATCH 26/47] Tweaked namelist --- earthdiagnostics/CDFTOOLS_cmip6.namlist | 14 +++++++------- earthdiagnostics/CDFTOOLS_primavera.namlist | 14 +++++++------- 2 files changed, 14 insertions(+), 14 deletions(-) diff --git a/earthdiagnostics/CDFTOOLS_cmip6.namlist b/earthdiagnostics/CDFTOOLS_cmip6.namlist index 95eda2b1..25fa1e18 100644 --- a/earthdiagnostics/CDFTOOLS_cmip6.namlist +++ b/earthdiagnostics/CDFTOOLS_cmip6.namlist @@ -79,13 +79,13 @@ / &NAMVARS - CN_VOTEMPER = "votemper" + CN_VOTEMPER = "thetao" , - CN_VOSALINE = "vosaline" + CN_VOSALINE = "so" , - CN_VOZOCRTX = "vozocrtx" + CN_VOZOCRTX = "uo" , - CN_VOMECRTY = "vomecrty" + CN_VOMECRTY = "vo" , CN_VOMEEIVV = "vomeeivv" , @@ -93,7 +93,7 @@ , CN_SOSSHEIG = "sossheig" , - CN_SOMXL010 = "somxl010" + CN_SOMXL010 = "mlotst" , CN_SOMXLT02 = "somxlt02" , @@ -206,6 +206,6 @@ , CN_FCOO = "coordinates.nc" , - CN_FBASINS = "new_maskglo.nc" - + CN_FBASINS = "new_maskglo.nc", + / diff --git a/earthdiagnostics/CDFTOOLS_primavera.namlist b/earthdiagnostics/CDFTOOLS_primavera.namlist index 7a890404..dc36a1c0 100644 --- a/earthdiagnostics/CDFTOOLS_primavera.namlist +++ b/earthdiagnostics/CDFTOOLS_primavera.namlist @@ -79,13 +79,13 @@ / &NAMVARS - CN_VOTEMPER = "votemper" + CN_VOTEMPER = "thetao" , - CN_VOSALINE = "vosaline" + CN_VOSALINE = "so" , - CN_VOZOCRTX = "vozocrtx" + CN_VOZOCRTX = "uo" , - CN_VOMECRTY = "vomecrty" + CN_VOMECRTY = "vo" , CN_VOMEEIVV = "vomeeivv" , @@ -93,7 +93,7 @@ , CN_SOSSHEIG = "sossheig" , - CN_SOMXL010 = "somxl010" + CN_SOMXL010 = "mlotst" , CN_SOMXLT02 = "somxlt02" , @@ -206,6 +206,6 @@ , CN_FCOO = "coordinates.nc" , - CN_FBASINS = "new_maskglo.nc" - + CN_FBASINS = "new_maskglo.nc", + / -- GitLab From fdf87e870ce1ae2d2b52d4507c47802f81651e14 Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Thu, 16 Nov 2017 19:17:18 +0100 Subject: [PATCH 27/47] i j fix --- earthdiagnostics/cmorizer.py | 26 ++++++++---- earthdiagnostics/cmormanager.py | 41 ++++++++++++++++++- earthdiagnostics/constants.py | 2 +- earthdiagnostics/datafile.py | 38 ++++++++++------- .../general/simplify_dimensions.py | 35 ++++++++++------ earthdiagnostics/ocean/areamoc.py | 29 ++++++++----- earthdiagnostics/ocean/maxmoc.py | 10 +++-- earthdiagnostics/ocean/mxl.py | 8 ++-- earthdiagnostics/utils.py | 12 ++++-- 9 files changed, 141 insertions(+), 60 deletions(-) diff --git a/earthdiagnostics/cmorizer.py b/earthdiagnostics/cmorizer.py index c4e4a93e..4bfde9de 100644 --- a/earthdiagnostics/cmorizer.py +++ b/earthdiagnostics/cmorizer.py @@ -1,11 +1,11 @@ # coding=utf-8 import glob import os +import pygrib import shutil import uuid from datetime import datetime -import pygrib from bscearth.utils.date import parse_date, chunk_end_date, previous_day, date2str, add_months from bscearth.utils.log import Log from cdo import CDOException @@ -29,7 +29,8 @@ class Cmorizer(object): """ - NON_DATA_VARIABLES = ('lon', 'lat', 'time', 'time_bnds', 'leadtime', 'lev', 'lev_2', 'icethi', + NON_DATA_VARIABLES = ('lon', 'lat', 'longitude', 'latitude', 'plev', 'time', 'time_bnds', 'leadtime', 'lev', + 'lev_2', 'icethi', 'deptht', 'depthu', 'depthw', 'depthv', 'time_centered', 'time_centered_bounds', 'deptht_bounds', 'depthu_bounds', 'depthv_bounds', 'depthw_bounds', 'deptht_bnds', 'depthu_bnds', 'depthv_bnds', 'depthw_bnds', @@ -39,9 +40,6 @@ class Cmorizer(object): 'depth_bnds', 'depth_2_bnds', 'depth_3_bnds', 'depth_4_bnds', 'mlev', 'hyai', 'hybi', 'hyam', 'hybm') - ALT_COORD_NAMES = {'time_counter': 'time', 'time_counter_bnds': 'time_bnds', 'time_counter_bounds': 'time_bnds', - 'tbnds': 'bnds', 'nav_lat': 'lat', 'nav_lon': 'lon', 'x': 'i', 'y': 'j'} - def __init__(self, data_manager, startdate, member): self.data_manager = data_manager self.startdate = startdate @@ -55,6 +53,17 @@ class Cmorizer(object): self.atmos_timestep = None self.cmor_scratch = str(os.path.join(self.config.scratch_dir, 'CMOR', self.startdate, self.member_str)) + if self.config.data_convention in ('primavera', 'cmip6'): + self.lon_name = 'longitude' + self.lat_name = 'latitude' + else: + self.lon_name = 'lon' + self.lat_name = 'lat' + + self.alt_coord_names = {'time_counter': 'time', 'time_counter_bnds': 'time_bnds', + 'time_counter_bounds': 'time_bnds', + 'tbnds': 'bnds', 'nav_lat': self.lat_name, 'nav_lon': self.lon_name, 'x': 'i', 'y': 'j'} + def cmorize_ocean(self): """ CMORizes ocean files from MMO files @@ -491,11 +500,10 @@ class Cmorizer(object): raise Exception('File {0} start date is not a valid chunk start date'.format(file_path)) return chunk - @staticmethod - def _add_coordinate_variables(handler, temp): + def _add_coordinate_variables(self, handler, temp): handler_cmor = Utils.openCdf(temp) - Utils.copy_variable(handler, handler_cmor, 'lon', False) - Utils.copy_variable(handler, handler_cmor, 'lat', False) + Utils.copy_variable(handler, handler_cmor, self.lon_name, False) + Utils.copy_variable(handler, handler_cmor, self.lat_name, False) if 'time' in handler_cmor.dimensions.keys(): Utils.copy_variable(handler, handler_cmor, 'leadtime', False) handler_cmor.close() diff --git a/earthdiagnostics/cmormanager.py b/earthdiagnostics/cmormanager.py index b454c4f3..8ddd9ef1 100644 --- a/earthdiagnostics/cmormanager.py +++ b/earthdiagnostics/cmormanager.py @@ -578,14 +578,51 @@ class CMORManager(DataManager): for name in os.listdir(os.path.join(path, member, table, var, grid)): filepath = os.path.join(path, member, table, var, grid, name) if os.path.isfile(filepath): - + original_handler = Utils.openCdf(filepath) + if original_handler.dimensions['i'].size < original_handler.dimensions['j'].size: + original_handler.close() + Utils.rename_variables(filepath, {'i': 'j', 'j': 'i'}, False, True) + else: + original_handler.close() self.create_link(domain, filepath, frequency, var, "", False, vartype=VariableType.MEAN) else: for filename in os.listdir(filepath): - self.create_link(domain, os.path.join(filepath, filename), frequency, var, "", + if not filename.endswith('.nc') or filename.startswith('.'): + return + cmorfile = os.path.join(filepath, filename) + original_handler = Utils.openCdf(cmorfile) + if original_handler.dimensions['i'].size < original_handler.dimensions['j'].size: + temp = TempFile.get() + new_handler = Utils.openCdf(temp, 'w') + for attribute in original_handler.ncattrs(): + original = getattr(original_handler, attribute) + setattr(new_handler, attribute, + Utils.convert_to_ASCII_if_possible(original)) + for dimension in original_handler.dimensions.keys(): + if dimension == 'i': + new_name = 'j' + elif dimension == 'j': + new_name = 'i' + else: + new_name = dimension + new_handler.createDimension(new_name, original_handler.dimensions[dimension].size) + for variable in original_handler.variables.keys(): + original_var = original_handler.variables[variable] + Log.debug(str(original_var.dimensions)) + translated_dimensions = Utils._translate(original_var.dimensions, {'i': 'j', 'j': 'i'}) + Log.debug(str(translated_dimensions)) + new_var = new_handler.createVariable(variable, original_var.datatype, + translated_dimensions) + Utils.copy_attributes(new_var, original_var) + new_var[:] = original_var[:] + original_handler.close() + new_handler.close() + Utils.move_file(temp, cmorfile) + self.create_link(domain, cmorfile, frequency, var, "", False, vartype=VariableType.MEAN) + def _get_startdate_path(self, startdate): """ Returns the path to the startdate's CMOR folder diff --git a/earthdiagnostics/constants.py b/earthdiagnostics/constants.py index 6c66d625..229a61b0 100644 --- a/earthdiagnostics/constants.py +++ b/earthdiagnostics/constants.py @@ -139,7 +139,7 @@ class Basins(object): """ basin_names = handler.variables.keys() - ignored_names = ('lat', 'lon', 'i', 'j', 'time', 'lev') + ignored_names = ('lat', 'latitude', 'lon', 'longitude', 'i', 'j', 'time', 'lev') for basin in basin_names: if basin in ignored_names: diff --git a/earthdiagnostics/datafile.py b/earthdiagnostics/datafile.py index c7518506..3b38e077 100644 --- a/earthdiagnostics/datafile.py +++ b/earthdiagnostics/datafile.py @@ -156,6 +156,13 @@ class DataFile(Publisher): raise NotImplementedError('Class must implement the download method') def prepare_to_upload(self, rename_var): + if self.data_convention in ('primavera', 'cmip6'): + self.lon_name = 'longitude' + self.lat_name = 'latitude' + else: + self.lon_name = 'longitude' + self.lat_name = 'latitude' + Utils.convert2netcdf4(self.local_file) if rename_var: original_name = rename_var @@ -189,7 +196,10 @@ class DataFile(Publisher): def set_local_file(self, local_file, diagnostic=None, rename_var='', region=None): if diagnostic in self._modifiers: self._modifiers.remove(diagnostic) - self.region = region.name + if region is not None: + self.region = region.name + else: + self.region = None self.local_file = local_file self.prepare_to_upload(rename_var) self.local_status = LocalStatus.READY @@ -200,7 +210,7 @@ class DataFile(Publisher): def _correct_metadata(self): handler = Utils.openCdf(self.local_file) var_handler = handler.variables[self.final_name] - coords = set.intersection({'time', 'lev', 'lat', 'lon'}, set(handler.variables.keys())) + coords = set.intersection({'time', 'lev', self.lat_name, self.lon_name}, set(handler.variables.keys())) var_handler.coordinates = ' '.join(coords) if not self.cmor_var: handler.close() @@ -245,12 +255,12 @@ class DataFile(Publisher): handler.variables['lev'].short_name = 'lev' if self.domain == ModelingRealms.ocean: handler.variables['lev'].standard_name = 'depth' - if 'lon' in handler.variables: - handler.variables['lon'].short_name = 'lon' - handler.variables['lon'].standard_name = 'longitude' - if 'lat' in handler.variables: - handler.variables['lat'].short_name = 'lat' - handler.variables['lat'].standard_name = 'latitude' + if self.lon_name in handler.variables: + handler.variables[self.lon_name].short_name = self.lon_name + handler.variables[self.lon_name].standard_name = 'longitude' + if self.lat_name in handler.variables: + handler.variables[self.lat_name].short_name = self.lat_name + handler.variables[self.lat_name].standard_name = 'latitude' def _fix_units(self, var_handler): if 'units' not in var_handler.ncattrs(): @@ -362,12 +372,12 @@ class DataFile(Publisher): variables = dict() variables['x'] = 'i' variables['y'] = 'j' - variables['nav_lat_grid_V'] = 'lat' - variables['nav_lon_grid_V'] = 'lon' - variables['nav_lat_grid_U'] = 'lat' - variables['nav_lon_grid_U'] = 'lon' - variables['nav_lat_grid_T'] = 'lat' - variables['nav_lon_grid_T'] = 'lon' + variables['nav_lat_grid_V'] = self.lat_name + variables['nav_lon_grid_V'] = self.lon_name + variables['nav_lat_grid_U'] = self.lat_name + variables['nav_lon_grid_U'] = self.lon_name + variables['nav_lat_grid_T'] = self.lat_name + variables['nav_lon_grid_T'] = self.lon_name Utils.rename_variables(self.local_file, variables, False, True) def add_diagnostic_history(self): diff --git a/earthdiagnostics/general/simplify_dimensions.py b/earthdiagnostics/general/simplify_dimensions.py index 579a5473..c903af0a 100644 --- a/earthdiagnostics/general/simplify_dimensions.py +++ b/earthdiagnostics/general/simplify_dimensions.py @@ -1,9 +1,10 @@ # coding=utf-8 +import numpy as np + from earthdiagnostics.diagnostic import Diagnostic, DiagnosticOption, DiagnosticDomainOption, \ DiagnosticVariableListOption from earthdiagnostics.modelingrealm import ModelingRealm from earthdiagnostics.utils import Utils, TempFile -import numpy as np class SimplifyDimensions(Diagnostic): @@ -32,7 +33,7 @@ class SimplifyDimensions(Diagnostic): alias = 'simdim' "Diagnostic alias for the configuration file" - def __init__(self, data_manager, startdate, member, chunk, domain, variable, grid): + def __init__(self, data_manager, startdate, member, chunk, domain, variable, grid, data_convention): Diagnostic.__init__(self, data_manager) self.startdate = startdate self.member = member @@ -40,6 +41,12 @@ class SimplifyDimensions(Diagnostic): self.variable = variable self.domain = domain self.grid = grid + if data_convention in ('cmip6', 'primavera'): + self.lon_name = 'longitude' + self.lat_name = 'latitude' + else: + self.lon_name = 'lon' + self.lat_name = 'lat' def __str__(self): return 'Simplify dimension Startdate: {0} Member: {1} Chunk: {2} ' \ @@ -71,7 +78,8 @@ class SimplifyDimensions(Diagnostic): for startdate, member, chunk in diags.config.experiment.get_chunk_list(): job_list.append(SimplifyDimensions(diags.data_manager, startdate, member, chunk, - options['domain'], var, options['grid'])) + options['domain'], var, options['grid'], + diags.config.data_convention)) return job_list def request_data(self): @@ -89,14 +97,14 @@ class SimplifyDimensions(Diagnostic): handler = Utils.openCdf(self.variable_file.local_file) if 'i' not in handler.dimensions: raise Exception('Variable {0.domain}:{0.variable} does not have i,j dimensions'.format(self)) - lat = handler.variables['lat'] + lat = handler.variables[self.lat_name] lat_values = lat[:, 0:1] # noinspection PyTypeChecker if np.any((lat[:] - lat_values) != 0): raise Exception('Latitude is not constant over i dimension for variable ' '{0.domain}:{0.variable}'.format(self)) - lon = handler.variables['lon'] + lon = handler.variables[self.lon_name] lon_values = lon[0:1, :] # noinspection PyTypeChecker if np.any((lon[:] - lon) != 0): @@ -106,21 +114,22 @@ class SimplifyDimensions(Diagnostic): temp = TempFile.get() new_file = Utils.openCdf(temp, 'w') for dim in handler.dimensions.keys(): - if dim in ('lat', 'lon', 'i', 'j', 'vertices'): + if dim in (self.lon_name, self.lat_name, 'i', 'j', 'vertices'): continue - Utils.copy_dimension(handler, new_file, dim, new_names={'i': 'lon', 'j': 'lat'}) + Utils.copy_dimension(handler, new_file, dim, new_names={'i': self.lon_name, 'j': self.lat_name}) - new_file.createDimension('lon', handler.dimensions['i'].size) - new_file.createDimension('lat', handler.dimensions['j'].size) + new_file.createDimension(self.lon_name, handler.dimensions['i'].size) + new_file.createDimension(self.lat_name, handler.dimensions['j'].size) new_file.createDimension('vertices', 2) for var in handler.variables.keys(): - if var in ('lat', 'lon', 'i', 'j', 'lat_vertices', 'lon_vertices'): + if var in (self.lon_name, self.lat_name, 'i', 'j', + '{0}_vertices'.format(self.lon_name), '{0}_vertices'.format(self.lat_name)): continue - Utils.copy_variable(handler, new_file, var, new_names={'i': 'lon', 'j': 'lat'}) + Utils.copy_variable(handler, new_file, var, new_names={'i': self.lon_name, 'j': self.lat_name}) - self._create_var('lon', lon_values, handler, new_file) - self._create_var('lat', lat_values, handler, new_file) + self._create_var(self.lon_name, lon_values, handler, new_file) + self._create_var(self.lat_name, lat_values, handler, new_file) handler.close() new_file.close() diff --git a/earthdiagnostics/ocean/areamoc.py b/earthdiagnostics/ocean/areamoc.py index ff23513d..c73895fd 100644 --- a/earthdiagnostics/ocean/areamoc.py +++ b/earthdiagnostics/ocean/areamoc.py @@ -117,10 +117,15 @@ class AreaMoc(Diagnostic): handler = Utils.openCdf(temp) basin_index = np.where(handler.variables['basin'][:] == self.basin.name) - lat_values = handler.variables['lat'][:] - lat_type = handler.variables['lat'].dtype - lat_units = handler.variables['lat'].units - lat_long_name = handler.variables['lat'].long_name + if 'lat' in handler.variables: + lat_name = 'lat' + else: + lat_name = 'latitude' + var_lat = handler.variables[lat_name] + lat_values = var_lat[:] + lat_type = var_lat.dtype + lat_units = var_lat.units + lat_long_name = var_lat.long_name handler.close() @@ -135,29 +140,31 @@ class AreaMoc(Diagnostic): Utils.copy_dimension(source, destiny, 'time') Utils.copy_dimension(source, destiny, 'lev') - Utils.copy_dimension(source, destiny, 'j', new_names={'j': 'lat'}) + Utils.copy_dimension(source, destiny, 'j', new_names={'j': lat_name}) - lat_variable = destiny.createVariable('lat', lat_type, 'lat') + lat_variable = destiny.createVariable(lat_name, lat_type, lat_name) lat_variable[:] = lat_values[:] lat_variable.units = lat_units lat_variable.long_name = lat_long_name Utils.copy_variable(source, destiny, 'lev') Utils.copy_variable(source, destiny, 'time') - Utils.copy_variable(source, destiny, 'vsftmyz', new_names={'j': 'lat'}) + Utils.copy_variable(source, destiny, 'vsftmyz', new_names={'j': lat_name}) source.close() destiny.close() nco.ncks(input=temp2, output=temp, - options=('-d lev,{0:.1f},{1:.1f} -d lat,{2:.1f},{3:.1f}'.format(self.box.min_depth, + options=('-d lev,{0:.1f},{1:.1f} -d {4},{2:.1f},{3:.1f}'.format(self.box.min_depth, self.box.max_depth, self.box.min_lat, - self.box.max_lat),)) + self.box.max_lat, + lat_name),)) cdo.vertmean(input=temp, output=temp2) os.remove(temp) - nco.ncap2(input=temp2, output=temp2, options=('-s "coslat[lat]=cos(lat[lat]*3.141592657/180.0)"',)) - nco.ncwa(input=temp2, output=temp2, options=('-w coslat -a lat',)) + nco.ncap2(input=temp2, output=temp2, + options=('-s "coslat[{0}]=cos({0}[{0}]*3.141592657/180.0)"'.format(lat_name),)) + nco.ncwa(input=temp2, output=temp2, options=('-w coslat -a {0}'.format(lat_name),)) nco.ncks(input=temp2, output=temp2, options=('-v vsftmyz,time',)) self.results.set_local_file(temp2) diff --git a/earthdiagnostics/ocean/maxmoc.py b/earthdiagnostics/ocean/maxmoc.py index 2be7110e..fb86ecb5 100644 --- a/earthdiagnostics/ocean/maxmoc.py +++ b/earthdiagnostics/ocean/maxmoc.py @@ -2,11 +2,12 @@ import netCDF4 import numpy as np from bscearth.utils.log import Log -from earthdiagnostics.constants import Basins + from earthdiagnostics.box import Box +from earthdiagnostics.constants import Basins from earthdiagnostics.diagnostic import Diagnostic, DiagnosticBasinOption, DiagnosticFloatOption -from earthdiagnostics.utils import Utils, TempFile from earthdiagnostics.modelingrealm import ModelingRealms +from earthdiagnostics.utils import Utils, TempFile from earthdiagnostics.variable_type import VariableType @@ -134,7 +135,10 @@ class MaxMoc(Diagnostic): basin_index = basin_index[0][0] lev = handler.variables['lev'][:] - lat = handler.variables['lat'][:] + if "lat" in handler.variables: + lat = handler.variables['lat'][:] + else: + lat = handler.variables['latitude'][:] if self.box.min_lat == self.box.max_lat: lat_inds = ((np.abs(lat - self.box.min_lat)).argmin(),) diff --git a/earthdiagnostics/ocean/mxl.py b/earthdiagnostics/ocean/mxl.py index fe531b76..b5e7c980 100644 --- a/earthdiagnostics/ocean/mxl.py +++ b/earthdiagnostics/ocean/mxl.py @@ -3,8 +3,8 @@ import os from earthdiagnostics import cdftools from earthdiagnostics.diagnostic import Diagnostic -from earthdiagnostics.utils import Utils, TempFile from earthdiagnostics.modelingrealm import ModelingRealms +from earthdiagnostics.utils import Utils, TempFile class Mxl(Diagnostic): @@ -71,8 +71,10 @@ class Mxl(Diagnostic): source = Utils.openCdf(temp) destiny = Utils.openCdf(temp2, 'w') Utils.copy_variable(source, destiny, 'somxl010', must_exist=True, add_dimensions=True) - Utils.copy_variable(source, destiny, 'lat') - Utils.copy_variable(source, destiny, 'lon') + Utils.copy_variable(source, destiny, 'lat', must_exist=False) + Utils.copy_variable(source, destiny, 'latitude', must_exist=False) + Utils.copy_variable(source, destiny, 'lon', must_exist=False) + Utils.copy_variable(source, destiny, 'longitude', must_exist=False) source.close() destiny.close() self.mlotst_file.set_local_file(temp2, rename_var='somxl010') diff --git a/earthdiagnostics/utils.py b/earthdiagnostics/utils.py index 54e927bd..83d3239f 100644 --- a/earthdiagnostics/utils.py +++ b/earthdiagnostics/utils.py @@ -150,7 +150,8 @@ class Utils(object): try: Utils._rename_vars_directly(dic_names, filepath, handler, must_exist, rename_dimension) - except RuntimeError: + except RuntimeError as ex: + Log.debug('Renaming error: {0}', ex) error = True handler.close() @@ -179,13 +180,16 @@ class Utils(object): cubes = iris.load(filepath) if len(cubes) == 0: return False - except iris.exceptions.IrisError: + except iris.exceptions.IrisError as ex: + Log.debug('netCDF checks failed: {0}', ex) return False - except RuntimeError: + except RuntimeError as ex: # HDF error, usually + Log.debug('netCDF checks failed: {0}', ex) return False - except Exception: + except Exception as ex: # HDF error, usually + Log.debug('netCDF checks failed: {0}', ex) return False return True -- GitLab From d776e2c8f0be38c8853170108981aaee92067f71 Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Fri, 17 Nov 2017 14:39:10 +0100 Subject: [PATCH 28/47] fixed cmorization unpack --- earthdiagnostics/cmormanager.py | 59 +++++++++++++++++---------------- earthdiagnostics/earthdiags.py | 5 ++- earthdiagnostics/utils.py | 4 +-- 3 files changed, 37 insertions(+), 31 deletions(-) diff --git a/earthdiagnostics/cmormanager.py b/earthdiagnostics/cmormanager.py index 8ddd9ef1..cfa67cae 100644 --- a/earthdiagnostics/cmormanager.py +++ b/earthdiagnostics/cmormanager.py @@ -591,37 +591,40 @@ class CMORManager(DataManager): if not filename.endswith('.nc') or filename.startswith('.'): return cmorfile = os.path.join(filepath, filename) - original_handler = Utils.openCdf(cmorfile) - if original_handler.dimensions['i'].size < original_handler.dimensions['j'].size: - temp = TempFile.get() - new_handler = Utils.openCdf(temp, 'w') - for attribute in original_handler.ncattrs(): - original = getattr(original_handler, attribute) - setattr(new_handler, attribute, - Utils.convert_to_ASCII_if_possible(original)) - for dimension in original_handler.dimensions.keys(): - if dimension == 'i': - new_name = 'j' - elif dimension == 'j': - new_name = 'i' - else: - new_name = dimension - new_handler.createDimension(new_name, original_handler.dimensions[dimension].size) - for variable in original_handler.variables.keys(): - original_var = original_handler.variables[variable] - Log.debug(str(original_var.dimensions)) - translated_dimensions = Utils._translate(original_var.dimensions, {'i': 'j', 'j': 'i'}) - Log.debug(str(translated_dimensions)) - new_var = new_handler.createVariable(variable, original_var.datatype, - translated_dimensions) - Utils.copy_attributes(new_var, original_var) - new_var[:] = original_var[:] - original_handler.close() - new_handler.close() - Utils.move_file(temp, cmorfile) + self._fix_ij_swap(cmorfile) self.create_link(domain, cmorfile, frequency, var, "", False, vartype=VariableType.MEAN) + def _fix_ij_swap(self, cmorfile): + return + original_handler = Utils.openCdf(cmorfile) + if original_handler.dimensions['i'].size < original_handler.dimensions['j'].size: + temp = TempFile.get() + new_handler = Utils.openCdf(temp, 'w') + for attribute in original_handler.ncattrs(): + original = getattr(original_handler, attribute) + setattr(new_handler, attribute, + Utils.convert_to_ASCII_if_possible(original)) + for dimension in original_handler.dimensions.keys(): + if dimension == 'i': + new_name = 'j' + elif dimension == 'j': + new_name = 'i' + else: + new_name = dimension + new_handler.createDimension(new_name, original_handler.dimensions[dimension].size) + for variable in original_handler.variables.keys(): + original_var = original_handler.variables[variable] + translated_dimensions = Utils._translate(original_var.dimensions, + {'i': 'j', 'j': 'i'}) + new_var = new_handler.createVariable(variable, original_var.datatype, + translated_dimensions) + Utils.copy_attributes(new_var, original_var) + new_var[:] = original_var[:] + original_handler.close() + new_handler.close() + Utils.move_file(temp, cmorfile, save_hash=True) + Log.debug('File {0} translated', cmorfile) def _get_startdate_path(self, startdate): """ diff --git a/earthdiagnostics/earthdiags.py b/earthdiagnostics/earthdiags.py index 1c1494b4..44c7fba5 100755 --- a/earthdiagnostics/earthdiags.py +++ b/earthdiagnostics/earthdiags.py @@ -374,7 +374,10 @@ class EarthDiags(object): if os.path.lexists(destiny): try: os.remove(destiny) - except OSError: + except OSError as ex: + if ex.errno == 13: #Permission denied + Log.info('Link already created') + return pass os.symlink(source, destiny) diff --git a/earthdiagnostics/utils.py b/earthdiagnostics/utils.py index 83d3239f..7c70b56e 100644 --- a/earthdiagnostics/utils.py +++ b/earthdiagnostics/utils.py @@ -244,7 +244,7 @@ class Utils(object): handler.sync() @staticmethod - def copy_file(source, destiny, save_hash=False): + def copy_file(source, destiny, save_hash=False, use_stored_hash=True): """ Copies a file from source to destiny, creating dirs if necessary @@ -266,7 +266,7 @@ class Utils(object): raise ex hash_destiny = None Log.debug('Hashing original file... {0}', datetime.datetime.now()) - hash_original = Utils.get_file_hash(source, use_stored=True) + hash_original = Utils.get_file_hash(source, use_stored=use_stored_hash) retrials = 3 while hash_original != hash_destiny: -- GitLab From 752ea59c73ee500561d7720c4ef969cebdeefd92 Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Fri, 17 Nov 2017 15:34:25 +0100 Subject: [PATCH 29/47] Fixed heatc results names --- earthdiagnostics/ocean/heatcontent.py | 2 +- test/unit/ocean/test_heatcontent.py | 7 ++++--- 2 files changed, 5 insertions(+), 4 deletions(-) diff --git a/earthdiagnostics/ocean/heatcontent.py b/earthdiagnostics/ocean/heatcontent.py index d44e6492..81ef23cc 100644 --- a/earthdiagnostics/ocean/heatcontent.py +++ b/earthdiagnostics/ocean/heatcontent.py @@ -77,7 +77,7 @@ class HeatContent(Diagnostic): DiagnosticIntOption('min_depth'), DiagnosticIntOption('max_depth')) options = cls.process_options(options, options_available) - box = Box(True) + box = Box() box.min_depth = options['min_depth'] box.max_depth = options['max_depth'] min_level = 0 diff --git a/test/unit/ocean/test_heatcontent.py b/test/unit/ocean/test_heatcontent.py index c58d1217..f842bc13 100644 --- a/test/unit/ocean/test_heatcontent.py +++ b/test/unit/ocean/test_heatcontent.py @@ -1,10 +1,11 @@ # coding=utf-8 from unittest import TestCase +from mock import Mock, patch + from earthdiagnostics.box import Box from earthdiagnostics.constants import Basins from earthdiagnostics.ocean.heatcontent import HeatContent -from mock import Mock, patch # noinspection PyUnusedLocal @@ -21,7 +22,7 @@ class TestHeatContent(TestCase): self.diags.model_version = 'model_version' self.diags.config.experiment.get_chunk_list.return_value = (('20010101', 0, 0), ('20010101', 0, 1)) - self.box = Box(True) + self.box = Box() self.box.min_depth = 0 self.box.max_depth = 100 @@ -43,5 +44,5 @@ class TestHeatContent(TestCase): def test_str(self): diag = HeatContent(self.data_manager, '20010101', 0, 0, Basins().Global, -1, self.box, 1, 20) - self.assertEquals(str(diag), 'Heat content Startdate: 20010101 Member: 0 Chunk: 0 Mixed layer: -1 Box: 0-100m ' + self.assertEquals(str(diag), 'Heat content Startdate: 20010101 Member: 0 Chunk: 0 Mixed layer: -1 Box: 0-100 ' 'Basin: Global') -- GitLab From 5903a9810b10ac87b7a601f7d1c4405f5beaf8ab Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Fri, 17 Nov 2017 16:24:23 +0100 Subject: [PATCH 30/47] Fixed box string representation --- earthdiagnostics/box.py | 6 +++--- test/unit/ocean/test_maxmoc.py | 5 +++-- test/unit/ocean/test_region_mean.py | 16 +++++++++------- 3 files changed, 15 insertions(+), 12 deletions(-) diff --git a/earthdiagnostics/box.py b/earthdiagnostics/box.py index f3dc7669..fe5334fd 100644 --- a/earthdiagnostics/box.py +++ b/earthdiagnostics/box.py @@ -153,10 +153,10 @@ class Box(object): else: suffix = '' - string = str(abs(self.max_depth)) + suffix - if self.min_depth != self.max_depth: - string = '{0}-{1}'.format(str(abs(self.min_depth)), string) + string = '{0:d}-{1:d}{2}'.format(int(abs(self.min_depth)), abs(self.max_depth), suffix) + else: + string = '{0:d}{1}'.format(int(abs(self.max_depth)), suffix) return string diff --git a/test/unit/ocean/test_maxmoc.py b/test/unit/ocean/test_maxmoc.py index f6f12b34..a1141d01 100644 --- a/test/unit/ocean/test_maxmoc.py +++ b/test/unit/ocean/test_maxmoc.py @@ -1,10 +1,11 @@ # coding=utf-8 from unittest import TestCase +from mock import Mock, patch + from earthdiagnostics.box import Box from earthdiagnostics.constants import Basins, Basin from earthdiagnostics.ocean.maxmoc import MaxMoc -from mock import Mock, patch class TestMaxMoc(TestCase): @@ -63,4 +64,4 @@ class TestMaxMoc(TestCase): def test_str(self): self.assertEquals(str(self.maxmoc), 'Max moc Startdate: 20000101 Member: 1 Year: 2000 ' - 'Box: 0.0N0.0m Basin: Global') + 'Box: 0.0N0m Basin: Global') diff --git a/test/unit/ocean/test_region_mean.py b/test/unit/ocean/test_region_mean.py index e527feda..efeeb7d7 100644 --- a/test/unit/ocean/test_region_mean.py +++ b/test/unit/ocean/test_region_mean.py @@ -1,11 +1,13 @@ # coding=utf-8 from unittest import TestCase -from earthdiagnostics.ocean.regionmean import RegionMean -from earthdiagnostics.modelingrealm import ModelingRealms -from earthdiagnostics.constants import Basins + +from mock import Mock, patch + from earthdiagnostics.box import Box +from earthdiagnostics.constants import Basins from earthdiagnostics.diagnostic import DiagnosticOptionError, DiagnosticVariableOption -from mock import Mock, patch +from earthdiagnostics.modelingrealm import ModelingRealms +from earthdiagnostics.ocean.regionmean import RegionMean class TestRegionMean(TestCase): @@ -49,8 +51,8 @@ class TestRegionMean(TestCase): box, True, Basins().Global, False, '')) box = Box() - box.min_depth = 1 - box.max_depth = 10 + box.min_depth = 1.0 + box.max_depth = 10.0 jobs = RegionMean.generate_jobs(self.diags, ['diagnostic', 'ocean', 'var', 'U', 'global', '1', '10']) self.assertEqual(len(jobs), 2) @@ -97,4 +99,4 @@ class TestRegionMean(TestCase): diag = RegionMean(self.data_manager, '20010101', 0, 0, ModelingRealms.ocean, 'var', 'U', box, False, Basins().Global, True, 'grid') self.assertEquals(str(diag), 'Region mean Startdate: 20010101 Member: 0 Chunk: 0 Variable: var Grid point: U ' - 'Box: 1-10 Save 3D: False Save variance: True Original grid: grid') + 'Box: 1-10 Save 3D: False Save variance: True Original grid: grid Basin: Global') -- GitLab From 0ece4e5650274b66c672024cc9f62b5e604f645e Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Fri, 17 Nov 2017 16:40:21 +0100 Subject: [PATCH 31/47] added missing int transformation --- earthdiagnostics/box.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/earthdiagnostics/box.py b/earthdiagnostics/box.py index fe5334fd..ea7ccc15 100644 --- a/earthdiagnostics/box.py +++ b/earthdiagnostics/box.py @@ -154,7 +154,7 @@ class Box(object): suffix = '' if self.min_depth != self.max_depth: - string = '{0:d}-{1:d}{2}'.format(int(abs(self.min_depth)), abs(self.max_depth), suffix) + string = '{0:d}-{1:d}{2}'.format(int(abs(self.min_depth)), int(abs(self.max_depth)), suffix) else: string = '{0:d}{1}'.format(int(abs(self.max_depth)), suffix) return string -- GitLab From fab7addcc939e35766b4ca79ae7b3b520b8f718e Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Mon, 20 Nov 2017 13:33:10 +0100 Subject: [PATCH 32/47] Codacy config --- .codacy.yml | 36 +++++ .editorconfig | 26 ++++ .prospector.yml | 28 ++++ .pylintrc | 407 ++++++++++++++++++++++++++++++++++++++++++++++++ README | 3 +- environment.yml | 30 ++++ 6 files changed, 529 insertions(+), 1 deletion(-) create mode 100644 .codacy.yml create mode 100644 .editorconfig create mode 100644 .prospector.yml create mode 100644 .pylintrc create mode 100644 environment.yml diff --git a/.codacy.yml b/.codacy.yml new file mode 100644 index 00000000..3dc3bb8c --- /dev/null +++ b/.codacy.yml @@ -0,0 +1,36 @@ +# codacy configuration file + +--- + +engines: + coverage: + enabled: true + exclude_paths: [ + 'tests', + ] + metrics: + enabled: true + duplication: + enabled: true + prospector: + enabled: true + pylint: + enabled: true + python_version: 3 + +exclude_paths: [ + 'doc/sphinx/**', + 'esmvaltool/doc/sphinx/**', + # cmor tables + 'esmvaltool/interface_scripts/cmip*-cmor-tables/**', + # old stuff + 'backend/**', + 'diag_scripts/**', + 'interface_data/**', + 'interface_scripts/**', + 'main.py', + 'nml/**', + 'plot_scripts/**', + 'reformat_scripts/**', + 'variable_defs/**', +] diff --git a/.editorconfig b/.editorconfig new file mode 100644 index 00000000..2a7a00f3 --- /dev/null +++ b/.editorconfig @@ -0,0 +1,26 @@ +# EditorConfig is awesome: http://EditorConfig.org + +# top-most EditorConfig file +root = true + +# Unix-style newlines with a newline ending every file +[*] +end_of_line = lf +insert_final_newline = true +trim_trailing_whitespace = true +# Set default charset +charset = utf-8 + +# Matches multiple files with brace expansion notation + +# 4 space indentation +[*.{py,java,r,R}] +indent_size = 4 + +# 2 space indentation +[*.{js,json,yml,html,xml,ncl}] +indent_size = 2 + +[*.{md,Rmd}] +trim_trailing_whitespace = false + diff --git a/.prospector.yml b/.prospector.yml new file mode 100644 index 00000000..58d4946d --- /dev/null +++ b/.prospector.yml @@ -0,0 +1,28 @@ +# prospector configuration file + +--- + +output-format: grouped + +strictness: veryhigh +doc-warnings: true +test-warnings: true +member-warnings: false + +pyroma: + run: true + +pep8: + full: true + +pep257: + # see http://pep257.readthedocs.io/en/latest/error_codes.html + disable: [ + # For short descriptions it makes sense not to end with a period: + D400, # First line should end with a period + # Disable because not part of PEP257 official convention: + D203, # 1 blank line required before class docstring + D212, # Multi-line docstring summary should start at the first line + D213, # Multi-line docstring summary should start at the second line + D404, # First word of the docstring should not be This + ] diff --git a/.pylintrc b/.pylintrc new file mode 100644 index 00000000..4094c1f4 --- /dev/null +++ b/.pylintrc @@ -0,0 +1,407 @@ +[MASTER] + +# Specify a configuration file. +#rcfile= + +# Python code to execute, usually for sys.path manipulation such as +# pygtk.require(). +#init-hook= + +# Add files or directories to the blacklist. They should be base names, not +# paths. +ignore=CVS + +# Add files or directories matching the regex patterns to the blacklist. The +# regex matches against base names, not paths. +ignore-patterns= + +# Pickle collected data for later comparisons. +persistent=yes + +# List of plugins (as comma separated values of python modules names) to load, +# usually to register additional checkers. +load-plugins= + +# Use multiple processes to speed up Pylint. +jobs=1 + +# Allow loading of arbitrary C extensions. Extensions are imported into the +# active Python interpreter and may run arbitrary code. +unsafe-load-any-extension=no + +# A comma-separated list of package or module names from where C extensions may +# be loaded. Extensions are loading into the active Python interpreter and may +# run arbitrary code +extension-pkg-whitelist= + +# Allow optimization of some AST trees. This will activate a peephole AST +# optimizer, which will apply various small optimizations. For instance, it can +# be used to obtain the result of joining multiple strings with the addition +# operator. Joining a lot of strings can lead to a maximum recursion error in +# Pylint and this flag can prevent that. It has one side effect, the resulting +# AST will be different than the one from reality. This option is deprecated +# and it will be removed in Pylint 2.0. +optimize-ast=no + + +[MESSAGES CONTROL] + +# Only show warnings with the listed confidence levels. Leave empty to show +# all. Valid levels: HIGH, INFERENCE, INFERENCE_FAILURE, UNDEFINED +confidence= + +# Enable the message, report, category or checker with the given id(s). You can +# either give multiple identifier separated by comma (,) or put this option +# multiple time (only on the command line, not in the configuration file where +# it should appear only once). See also the "--disable" option for examples. +#enable= + +# Disable the message, report, category or checker with the given id(s). You +# can either give multiple identifiers separated by comma (,) or put this +# option multiple times (only on the command line, not in the configuration +# file where it should appear only once).You can also use "--disable=all" to +# disable everything first and then reenable specific checks. For example, if +# you want to run only the similarities checker, you can use "--disable=all +# --enable=similarities". If you want to run only the classes checker, but have +# no Warning level messages displayed, use"--disable=all --enable=classes +# --disable=W" +disable=import-star-module-level,old-octal-literal,oct-method,print-statement,unpacking-in-except,parameter-unpacking,backtick,old-raise-syntax,old-ne-operator,long-suffix,dict-view-method,dict-iter-method,metaclass-assignment,next-method-called,raising-string,indexing-exception,raw_input-builtin,long-builtin,file-builtin,execfile-builtin,coerce-builtin,cmp-builtin,buffer-builtin,basestring-builtin,apply-builtin,filter-builtin-not-iterating,using-cmp-argument,useless-suppression,range-builtin-not-iterating,suppressed-message,no-absolute-import,old-division,cmp-method,reload-builtin,zip-builtin-not-iterating,intern-builtin,unichr-builtin,reduce-builtin,standarderror-builtin,unicode-builtin,xrange-builtin,coerce-method,delslice-method,getslice-method,setslice-method,input-builtin,round-builtin,hex-method,nonzero-method,map-builtin-not-iterating + + +[REPORTS] + +# Set the output format. Available formats are text, parseable, colorized, msvs +# (visual studio) and html. You can also give a reporter class, eg +# mypackage.mymodule.MyReporterClass. +output-format=text + +# Put messages in a separate file for each module / package specified on the +# command line instead of printing them on stdout. Reports (if any) will be +# written in a file name "pylint_global.[txt|html]". This option is deprecated +# and it will be removed in Pylint 2.0. +files-output=no + +# Tells whether to display a full report or only the messages +reports=yes + +# Python expression which should return a note less than 10 (10 is the highest +# note). You have access to the variables errors warning, statement which +# respectively contain the number of errors / warnings messages and the total +# number of statements analyzed. This is used by the global evaluation report +# (RP0004). +evaluation=10.0 - ((float(5 * error + warning + refactor + convention) / statement) * 10) + +# Template used to display messages. This is a python new-style format string +# used to format the message information. See doc for all details +#msg-template= + + +[FORMAT] + +# Maximum number of characters on a single line. +max-line-length=79 + +# Regexp for a line that is allowed to be longer than the limit. +ignore-long-lines=^\s*(# )??$ + +# Allow the body of an if to be on the same line as the test if there is no +# else. +single-line-if-stmt=no + +# List of optional constructs for which whitespace checking is disabled. `dict- +# separator` is used to allow tabulation in dicts, etc.: {1 : 1,\n222: 2}. +# `trailing-comma` allows a space between comma and closing bracket: (a, ). +# `empty-line` allows space-only lines. +no-space-check=trailing-comma,dict-separator + +# Maximum number of lines in a module +max-module-lines=1000 + +# String used as indentation unit. This is usually " " (4 spaces) or "\t" (1 +# tab). +indent-string=' ' + +# Number of spaces of indent required inside a hanging or continued line. +indent-after-paren=4 + +# Expected format of line ending, e.g. empty (any line ending), LF or CRLF. +expected-line-ending-format=LF + + +[MISCELLANEOUS] + +# List of note tags to take in consideration, separated by a comma. +notes=FIXME,FIX-ME,XXX,TODO + + +[LOGGING] + +# Logging modules to check that the string format arguments are in logging +# function parameter format +logging-modules=logging + + +[VARIABLES] + +# Tells whether we should check for unused import in __init__ files. +init-import=no + +# A regular expression matching the name of dummy variables (i.e. expectedly +# not used). +dummy-variables-rgx=(_+[a-zA-Z0-9]*?$)|dummy + +# List of additional names supposed to be defined in builtins. Remember that +# you should avoid to define new builtins when possible. +additional-builtins= + +# List of strings which can identify a callback function by name. A callback +# name must start or end with one of those strings. +callbacks=cb_,_cb + +# List of qualified module names which can have objects that can redefine +# builtins. +redefining-builtins-modules=six.moves,future.builtins + + +[TYPECHECK] + +# Tells whether missing members accessed in mixin class should be ignored. A +# mixin class is detected if its name ends with "mixin" (case insensitive). +ignore-mixin-members=yes + +# List of module names for which member attributes should not be checked +# (useful for modules/projects where namespaces are manipulated during runtime +# and thus existing member attributes cannot be deduced by static analysis. It +# supports qualified module names, as well as Unix pattern matching. +ignored-modules= + +# List of class names for which member attributes should not be checked (useful +# for classes with dynamically set attributes). This supports the use of +# qualified names. +ignored-classes=optparse.Values,thread._local,_thread._local + +# List of members which are set dynamically and missed by pylint inference +# system, and so shouldn't trigger E1101 when accessed. Python regular +# expressions are accepted. +generated-members= + +# List of decorators that produce context managers, such as +# contextlib.contextmanager. Add to this list to register other decorators that +# produce valid context managers. +contextmanager-decorators=contextlib.contextmanager + + +[BASIC] + +# Good variable names which should always be accepted, separated by a comma +good-names=i,j,k,ex,Run,_,logger + +# Bad variable names which should always be refused, separated by a comma +bad-names=foo,bar,baz,toto,tutu,tata + +# Colon-delimited sets of names that determine each other's naming style when +# the name regexes allow several styles. +name-group= + +# Include a hint for the correct naming format with invalid-name +include-naming-hint=yes + +# List of decorators that produce properties, such as abc.abstractproperty. Add +# to this list to register other decorators that produce valid properties. +property-classes=abc.abstractproperty + +# Regular expression matching correct function names +function-rgx=[a-z_][a-z0-9_]{2,30}$ + +# Naming hint for function names +function-name-hint=[a-z_][a-z0-9_]{2,30}$ + +# Regular expression matching correct variable names +variable-rgx=[a-z_][a-z0-9_]{2,30}$ + +# Naming hint for variable names +variable-name-hint=[a-z_][a-z0-9_]{2,30}$ + +# Regular expression matching correct constant names +const-rgx=(([A-Z_][A-Z0-9_]*)|(__.*__))$ + +# Naming hint for constant names +const-name-hint=(([A-Z_][A-Z0-9_]*)|(__.*__))$ + +# Regular expression matching correct attribute names +attr-rgx=[a-z_][a-z0-9_]{2,30}$ + +# Naming hint for attribute names +attr-name-hint=[a-z_][a-z0-9_]{2,30}$ + +# Regular expression matching correct argument names +argument-rgx=[a-z_][a-z0-9_]{2,30}$ + +# Naming hint for argument names +argument-name-hint=[a-z_][a-z0-9_]{2,30}$ + +# Regular expression matching correct class attribute names +class-attribute-rgx=([A-Za-z_][A-Za-z0-9_]{2,30}|(__.*__))$ + +# Naming hint for class attribute names +class-attribute-name-hint=([A-Za-z_][A-Za-z0-9_]{2,30}|(__.*__))$ + +# Regular expression matching correct inline iteration names +inlinevar-rgx=[A-Za-z_][A-Za-z0-9_]*$ + +# Naming hint for inline iteration names +inlinevar-name-hint=[A-Za-z_][A-Za-z0-9_]*$ + +# Regular expression matching correct class names +class-rgx=[A-Z_][a-zA-Z0-9]+$ + +# Naming hint for class names +class-name-hint=[A-Z_][a-zA-Z0-9]+$ + +# Regular expression matching correct module names +module-rgx=(([a-z_][a-z0-9_]*)|([A-Z][a-zA-Z0-9]+))$ + +# Naming hint for module names +module-name-hint=(([a-z_][a-z0-9_]*)|([A-Z][a-zA-Z0-9]+))$ + +# Regular expression matching correct method names +method-rgx=[a-z_][a-z0-9_]{2,30}$ + +# Naming hint for method names +method-name-hint=[a-z_][a-z0-9_]{2,30}$ + +# Regular expression which should only match function or class names that do +# not require a docstring. +no-docstring-rgx=^_ + +# Minimum line length for functions/classes that require docstrings, shorter +# ones are exempt. +docstring-min-length=-1 + + +[ELIF] + +# Maximum number of nested blocks for function / method body +max-nested-blocks=5 + + +[SPELLING] + +# Spelling dictionary name. Available dictionaries: none. To make it working +# install python-enchant package. +spelling-dict= + +# List of comma separated words that should not be checked. +spelling-ignore-words= + +# A path to a file that contains private dictionary; one word per line. +spelling-private-dict-file= + +# Tells whether to store unknown words to indicated private dictionary in +# --spelling-private-dict-file option instead of raising a message. +spelling-store-unknown-words=no + + +[SIMILARITIES] + +# Minimum lines number of a similarity. +min-similarity-lines=4 + +# Ignore comments when computing similarities. +ignore-comments=yes + +# Ignore docstrings when computing similarities. +ignore-docstrings=yes + +# Ignore imports when computing similarities. +ignore-imports=no + + +[DESIGN] + +# Maximum number of arguments for function / method +max-args=5 + +# Argument names that match this expression will be ignored. Default to name +# with leading underscore +ignored-argument-names=_.* + +# Maximum number of locals for function / method body +max-locals=15 + +# Maximum number of return / yield for function / method body +max-returns=6 + +# Maximum number of branch for function / method body +max-branches=12 + +# Maximum number of statements in function / method body +max-statements=50 + +# Maximum number of parents for a class (see R0901). +max-parents=7 + +# Maximum number of attributes for a class (see R0902). +max-attributes=7 + +# Minimum number of public methods for a class (see R0903). +min-public-methods=2 + +# Maximum number of public methods for a class (see R0904). +max-public-methods=20 + +# Maximum number of boolean expressions in a if statement +max-bool-expr=5 + + +[IMPORTS] + +# Deprecated modules which should not be used, separated by a comma +deprecated-modules=regsub,TERMIOS,Bastion,rexec,optparse + +# Create a graph of every (i.e. internal and external) dependencies in the +# given file (report RP0402 must not be disabled) +import-graph= + +# Create a graph of external dependencies in the given file (report RP0402 must +# not be disabled) +ext-import-graph= + +# Create a graph of internal dependencies in the given file (report RP0402 must +# not be disabled) +int-import-graph= + +# Force import order to recognize a module as part of the standard +# compatibility libraries. +known-standard-library= + +# Force import order to recognize a module as part of a third party library. +known-third-party=enchant + +# Analyse import fallback blocks. This can be used to support both Python 2 and +# 3 compatible code, which means that the block might have code that exists +# only in one or another interpreter, leading to false positives when analysed. +analyse-fallback-blocks=no + + +[CLASSES] + +# List of method names used to declare (i.e. assign) instance attributes. +defining-attr-methods=__init__,__new__,setUp + +# List of valid names for the first argument in a class method. +valid-classmethod-first-arg=cls + +# List of valid names for the first argument in a metaclass class method. +valid-metaclass-classmethod-first-arg=mcs + +# List of member names, which should be excluded from the protected access +# warning. +exclude-protected=_asdict,_fields,_replace,_source,_make + + +[EXCEPTIONS] + +# Exceptions that will emit a warning when being caught. Defaults to +# "Exception" +overgeneral-exceptions=Exception diff --git a/README b/README index f247d009..79c3a704 100644 --- a/README +++ b/README @@ -1,3 +1,4 @@ +[![Codacy Badge](https://api.codacy.com/project/badge/Grade/206d0f75e8c64742a4fb4a0bd3015565)](https://www.codacy.com/app/BSC-Earth/earthdiagnostics?utm_source=earth.bsc.es&utm_medium=referral&utm_content=gitlab/es/earthdiagnostics&utm_campaign=Badge_Grade) This tool is a set of diagnostics used at BSC-ES department for NEMO and EC-EARTH models postprocessing. They are based on CDO, NCO and CDFTOOLS 3.0. For CDFTOOLS, a custom build is required. @@ -9,4 +10,4 @@ Check the Earth Diagnostics documentation in PDF format in EarthDiagnostics.pdf CONTACT ======= -For any doubts or suggestions, contact javier.vegas@bsc.es \ No newline at end of file +For any doubts or suggestions, contact javier.vegas@bsc.es diff --git a/environment.yml b/environment.yml new file mode 100644 index 00000000..3a3ca170 --- /dev/null +++ b/environment.yml @@ -0,0 +1,30 @@ +--- + +name: earthdiagnostics +channels: +- conda-forge +#- defaults # in case of missing packages +#- Clyde_Fare #for scientific python + + +dependencies: +- iris +- netcdf4 +- numpy +- cdo +- nco +- python-cdo +- coverage +- pygrib +- psutil +- six +- cf_units +- openpyxl +- mock +- cmake + +- pip: + - bscearth.utils + - futures + - nco + - exrex -- GitLab From 9ee9ca9dc7c4dfe921d3985899a5a938eb69fc39 Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Mon, 20 Nov 2017 14:25:07 +0100 Subject: [PATCH 33/47] fixed codacy config --- .codacy.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.codacy.yml b/.codacy.yml index 3dc3bb8c..c0f0e505 100644 --- a/.codacy.yml +++ b/.codacy.yml @@ -16,7 +16,7 @@ engines: enabled: true pylint: enabled: true - python_version: 3 + python_version: 2 exclude_paths: [ 'doc/sphinx/**', -- GitLab From 87875b93307937098a43fa98ffe914a3c8eba824 Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Mon, 20 Nov 2017 14:26:52 +0100 Subject: [PATCH 34/47] Changed readme extension --- README => README.md | 0 1 file changed, 0 insertions(+), 0 deletions(-) rename README => README.md (100%) diff --git a/README b/README.md similarity index 100% rename from README rename to README.md -- GitLab From 70992937cd85ffccf6bcc8d72b4017eacfbd10a2 Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Mon, 20 Nov 2017 14:28:15 +0100 Subject: [PATCH 35/47] Updated readme --- README.md | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/README.md b/README.md index 79c3a704..b8f950dd 100644 --- a/README.md +++ b/README.md @@ -1,4 +1,5 @@ [![Codacy Badge](https://api.codacy.com/project/badge/Grade/206d0f75e8c64742a4fb4a0bd3015565)](https://www.codacy.com/app/BSC-Earth/earthdiagnostics?utm_source=earth.bsc.es&utm_medium=referral&utm_content=gitlab/es/earthdiagnostics&utm_campaign=Badge_Grade) + This tool is a set of diagnostics used at BSC-ES department for NEMO and EC-EARTH models postprocessing. They are based on CDO, NCO and CDFTOOLS 3.0. For CDFTOOLS, a custom build is required. @@ -10,4 +11,4 @@ Check the Earth Diagnostics documentation in PDF format in EarthDiagnostics.pdf CONTACT ======= -For any doubts or suggestions, contact javier.vegas@bsc.es +For any doubts or suggestions, contact javier.vegas[at]bsc.es -- GitLab From ae60b16e98ce97011eb41d8dac45c988219a46ab Mon Sep 17 00:00:00 2001 From: Javier Vegas-Regidor Date: Mon, 20 Nov 2017 14:31:43 +0100 Subject: [PATCH 36/47] Updated max line length for pylint --- .pylintrc | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.pylintrc b/.pylintrc index 4094c1f4..db7741b9 100644 --- a/.pylintrc +++ b/.pylintrc @@ -99,7 +99,7 @@ evaluation=10.0 - ((float(5 * error + warning + refactor + convention) / stateme [FORMAT] # Maximum number of characters on a single line. -max-line-length=79 +max-line-length=120 # Regexp for a line that is allowed to be longer than the limit. ignore-long-lines=^\s*(# )??$ -- GitLab From 5803bcc31b875d64389226954b4ff08805973d59 Mon Sep 17 00:00:00 2001 From: jvegasbsc Date: Mon, 20 Nov 2017 16:00:27 +0100 Subject: [PATCH 37/47] Fixed environment yml --- earthdiagnostics/ocean/siasiesiv.py | 3 ++- environment.yml | 5 ++--- setup.py | 2 +- 3 files changed, 5 insertions(+), 5 deletions(-) diff --git a/earthdiagnostics/ocean/siasiesiv.py b/earthdiagnostics/ocean/siasiesiv.py index 21adfc0f..bd2c41c8 100644 --- a/earthdiagnostics/ocean/siasiesiv.py +++ b/earthdiagnostics/ocean/siasiesiv.py @@ -2,7 +2,7 @@ import os # noinspection PyUnresolvedReferences -import earthdiagnostics.cdftoolspython as cdftoolspython + import netCDF4 import numpy as np from bscearth.utils.log import Log @@ -117,6 +117,7 @@ class Siasiesiv(Diagnostic): """ Runs the diagnostic """ + import earthdiagnostics.cdftoolspython as cdftoolspython sit_handler = Utils.openCdf(self.sit.local_file) sit = np.asfortranarray(sit_handler.variables[self.sit_varname][:]) timesteps = sit_handler.dimensions['time'].size diff --git a/environment.yml b/environment.yml index 3a3ca170..8de32f66 100644 --- a/environment.yml +++ b/environment.yml @@ -3,9 +3,6 @@ name: earthdiagnostics channels: - conda-forge -#- defaults # in case of missing packages -#- Clyde_Fare #for scientific python - dependencies: - iris @@ -22,9 +19,11 @@ dependencies: - openpyxl - mock - cmake +- cfunits - pip: - bscearth.utils - futures - nco - exrex + - xxhash diff --git a/setup.py b/setup.py index 0e68a089..a9ff71b6 100644 --- a/setup.py +++ b/setup.py @@ -27,7 +27,7 @@ setup( keywords=['climate', 'weather', 'diagnostic'], setup_requires=['pyproj'], install_requires=['numpy', 'netCDF4', 'bscearth.utils', 'cdo>=1.3.4', 'nco>=0.0.3', 'iris>=1.12.0', 'coverage', - 'pygrib', 'openpyxl', 'mock', 'futures', 'cf_units', 'cfunits', 'xxhash', 'six', 'psutil', + 'pygrib', 'openpyxl', 'mock', 'futures', 'cf_units', 'xxhash', 'six', 'psutil', 'exrex'], packages=find_packages(), include_package_data=True, -- GitLab From bdaaac2579a7f171e5a311d9250b6904a12aca31 Mon Sep 17 00:00:00 2001 From: jvegasbsc Date: Mon, 20 Nov 2017 18:21:24 +0100 Subject: [PATCH 38/47] Setting automated tests --- .gitlab-ci.yml | 8 ++++++++ 1 file changed, 8 insertions(+) create mode 100644 .gitlab-ci.yml diff --git a/.gitlab-ci.yml b/.gitlab-ci.yml new file mode 100644 index 00000000..61b71586 --- /dev/null +++ b/.gitlab-ci.yml @@ -0,0 +1,8 @@ +test: + script: + - module purge + - module load Miniconda2 + - conda env update -n environment.yml + - source activate earthdiagnostics + - unittest test + -- GitLab From 9bf7ae39f4d17b9abd8770ccd93f2299bab304df Mon Sep 17 00:00:00 2001 From: jvegasbsc Date: Mon, 20 Nov 2017 18:29:55 +0100 Subject: [PATCH 39/47] Added coverage support for codacy --- .gitlab-ci.yml | 6 ++++-- environment.yml | 1 + 2 files changed, 5 insertions(+), 2 deletions(-) diff --git a/.gitlab-ci.yml b/.gitlab-ci.yml index 61b71586..74c23b89 100644 --- a/.gitlab-ci.yml +++ b/.gitlab-ci.yml @@ -1,8 +1,10 @@ test: script: - - module purge - - module load Miniconda2 + - echo $USER - conda env update -n environment.yml + - pip install codacy-coverage - source activate earthdiagnostics - unittest test + - coverage xml + - python-codacy-coverage -r coverage.xml diff --git a/environment.yml b/environment.yml index 8de32f66..772ab619 100644 --- a/environment.yml +++ b/environment.yml @@ -20,6 +20,7 @@ dependencies: - mock - cmake - cfunits +- coverage - pip: - bscearth.utils -- GitLab From dcc9c8bac4f964d6a36db15918496b7523eed2cf Mon Sep 17 00:00:00 2001 From: jvegasbsc Date: Wed, 22 Nov 2017 09:48:34 +0100 Subject: [PATCH 40/47] Update to gitlab-runner --- .gitlab-ci.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.gitlab-ci.yml b/.gitlab-ci.yml index 74c23b89..9085bfeb 100644 --- a/.gitlab-ci.yml +++ b/.gitlab-ci.yml @@ -1,6 +1,7 @@ test: script: - echo $USER + - echo $PATH - conda env update -n environment.yml - pip install codacy-coverage - source activate earthdiagnostics -- GitLab From 99ce3bd09954b7f662c757a0620eadab295ba2c8 Mon Sep 17 00:00:00 2001 From: jvegasbsc Date: Wed, 22 Nov 2017 09:52:17 +0100 Subject: [PATCH 41/47] Update to gitlab-runner --- .gitlab-ci.yml | 2 +- environment.yml | 1 + 2 files changed, 2 insertions(+), 1 deletion(-) diff --git a/.gitlab-ci.yml b/.gitlab-ci.yml index 9085bfeb..0b55374d 100644 --- a/.gitlab-ci.yml +++ b/.gitlab-ci.yml @@ -1,9 +1,9 @@ test: script: - echo $USER + - export PATH="$HOME/miniconda2/bin:$PATH" - echo $PATH - conda env update -n environment.yml - - pip install codacy-coverage - source activate earthdiagnostics - unittest test - coverage xml diff --git a/environment.yml b/environment.yml index 772ab619..4fa44d13 100644 --- a/environment.yml +++ b/environment.yml @@ -28,3 +28,4 @@ dependencies: - nco - exrex - xxhash + - codacy-coverage -- GitLab From bec61fce46b36e6638d25117d684d2b281dacd0d Mon Sep 17 00:00:00 2001 From: jvegasbsc Date: Wed, 22 Nov 2017 10:08:22 +0100 Subject: [PATCH 42/47] Update to gitlab-runner --- .coveragerc | 2 ++ .gitlab-ci.yml | 2 +- .prospector.yml | 1 + 3 files changed, 4 insertions(+), 1 deletion(-) create mode 100644 .coveragerc diff --git a/.coveragerc b/.coveragerc new file mode 100644 index 00000000..398ff08a --- /dev/null +++ b/.coveragerc @@ -0,0 +1,2 @@ +[run] +branch = True diff --git a/.gitlab-ci.yml b/.gitlab-ci.yml index 0b55374d..987d6ec3 100644 --- a/.gitlab-ci.yml +++ b/.gitlab-ci.yml @@ -5,7 +5,7 @@ test: - echo $PATH - conda env update -n environment.yml - source activate earthdiagnostics - - unittest test + - echo $PWD - coverage xml - python-codacy-coverage -r coverage.xml diff --git a/.prospector.yml b/.prospector.yml index 58d4946d..b5652ca3 100644 --- a/.prospector.yml +++ b/.prospector.yml @@ -25,4 +25,5 @@ pep257: D212, # Multi-line docstring summary should start at the first line D213, # Multi-line docstring summary should start at the second line D404, # First word of the docstring should not be This + E501, # Line-length, already controlled by pylint ] -- GitLab From d713e456ea7345d7aee0d784bc92513e11a6938b Mon Sep 17 00:00:00 2001 From: jvegasbsc Date: Wed, 22 Nov 2017 10:11:29 +0100 Subject: [PATCH 43/47] Fixed environment error --- .gitlab-ci.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.gitlab-ci.yml b/.gitlab-ci.yml index 987d6ec3..27e0c7d7 100644 --- a/.gitlab-ci.yml +++ b/.gitlab-ci.yml @@ -3,7 +3,7 @@ test: - echo $USER - export PATH="$HOME/miniconda2/bin:$PATH" - echo $PATH - - conda env update -n environment.yml + - conda env update -f environment.yml - source activate earthdiagnostics - echo $PWD - coverage xml -- GitLab From 6b6d5da9ae1b592f7d87dd4946ae7bea3a5fe9b5 Mon Sep 17 00:00:00 2001 From: jvegasbsc Date: Wed, 22 Nov 2017 10:18:16 +0100 Subject: [PATCH 44/47] Getting gitlabb-ci to work --- .gitlab-ci.yml | 1 + 1 file changed, 1 insertion(+) diff --git a/.gitlab-ci.yml b/.gitlab-ci.yml index 27e0c7d7..f0b6fe74 100644 --- a/.gitlab-ci.yml +++ b/.gitlab-ci.yml @@ -6,6 +6,7 @@ test: - conda env update -f environment.yml - source activate earthdiagnostics - echo $PWD + - coverage run - coverage xml - python-codacy-coverage -r coverage.xml -- GitLab From 08e008b56c8e19ba404133ebb908330386f88107 Mon Sep 17 00:00:00 2001 From: jvegasbsc Date: Wed, 22 Nov 2017 10:30:47 +0100 Subject: [PATCH 45/47] Getting gitlabb-ci to work --- .coveragerc | 3 +++ .gitlab-ci.yml | 2 +- 2 files changed, 4 insertions(+), 1 deletion(-) diff --git a/.coveragerc b/.coveragerc index 398ff08a..e41ecaeb 100644 --- a/.coveragerc +++ b/.coveragerc @@ -1,2 +1,5 @@ [run] branch = True +source = earthdiagnostics + + diff --git a/.gitlab-ci.yml b/.gitlab-ci.yml index f0b6fe74..cc29806a 100644 --- a/.gitlab-ci.yml +++ b/.gitlab-ci.yml @@ -6,7 +6,7 @@ test: - conda env update -f environment.yml - source activate earthdiagnostics - echo $PWD - - coverage run + - coverage run -m unittest discover - coverage xml - python-codacy-coverage -r coverage.xml -- GitLab From b08e625c68abd24437a6947ffcc85852a3f5ba74 Mon Sep 17 00:00:00 2001 From: jvegasbsc Date: Wed, 22 Nov 2017 11:36:00 +0100 Subject: [PATCH 46/47] Fixed tests --- test/unit/general/test_simplify_dimensions.py | 15 ++++++++------- test/unit/general/test_verticalmeanmetersiris.py | 15 ++++++++------- test/unit/ocean/test_interpolatecdo.py | 6 ++++-- test/unit/ocean/test_siasiesiv.py | 3 ++- test/unit/statistics/test_daysoverpercentile.py | 5 +++-- test/unit/test_config.py | 7 +------ test/unit/test_diagnostic.py | 2 +- 7 files changed, 27 insertions(+), 26 deletions(-) diff --git a/test/unit/general/test_simplify_dimensions.py b/test/unit/general/test_simplify_dimensions.py index 429ad6f2..48ac6f7c 100644 --- a/test/unit/general/test_simplify_dimensions.py +++ b/test/unit/general/test_simplify_dimensions.py @@ -19,6 +19,7 @@ class TestSimplifyDimensions(TestCase): self.diags.config.experiment.get_chunk_list.return_value = (('20010101', 0, 0), ('20010101', 0, 1)) self.diags.config.experiment.startdates = ['20010101', ] self.diags.config.frequency = Frequencies.monthly + self.diags.config.data_convention = 'convention' self.box = Box() self.box.min_depth = 0 @@ -32,24 +33,24 @@ class TestSimplifyDimensions(TestCase): jobs = SimplifyDimensions.generate_jobs(self.diags, ['diagnostic', 'atmos', 'var']) self.assertEqual(len(jobs), 2) self.assertEqual(jobs[0], SimplifyDimensions(self.data_manager, '20010101', 0, 0, - ModelingRealms.atmos, 'var', '')) + ModelingRealms.atmos, 'var', '', 'convention')) self.assertEqual(jobs[1], SimplifyDimensions(self.data_manager, '20010101', 0, 1, - ModelingRealms.atmos, 'var', '')) + ModelingRealms.atmos, 'var', '', 'convention')) jobs = SimplifyDimensions.generate_jobs(self.diags, ['diagnostic', 'atmos', 'var', 'grid']) self.assertEqual(len(jobs), 2) self.assertEqual(jobs[0], SimplifyDimensions(self.data_manager, '20010101', 0, 0, - ModelingRealms.atmos, 'var', 'grid')) + ModelingRealms.atmos, 'var', 'grid', 'convention')) self.assertEqual(jobs[1], SimplifyDimensions(self.data_manager, '20010101', 0, 1, - ModelingRealms.atmos, 'var', 'grid')) + ModelingRealms.atmos, 'var', 'grid', 'convention')) with self.assertRaises(DiagnosticOptionError): SimplifyDimensions.generate_jobs(self.diags, ['diagnostic']) - with self.assertRaises(DiagnosticOptionError): - SimplifyDimensions.generate_jobs(self.diags, ['diagnostic', 'atmos', 'var', 'grid', 'extra']) + with self.assertRaises(DiagnosticOptionError): + SimplifyDimensions.generate_jobs(self.diags, ['diagnostic', 'atmos', 'var', 'grid', 'extra']) def test_str(self): - mixed = SimplifyDimensions(self.data_manager, '20010101', 0, 0, ModelingRealms.atmos, 'var', 'grid') + mixed = SimplifyDimensions(self.data_manager, '20010101', 0, 0, ModelingRealms.atmos, 'var', 'grid', 'convention') self.assertEquals(str(mixed), 'Simplify dimension Startdate: 20010101 Member: 0 Chunk: 0 Variable: atmos:var ' 'Grid: grid') diff --git a/test/unit/general/test_verticalmeanmetersiris.py b/test/unit/general/test_verticalmeanmetersiris.py index cd2876fe..179b54fa 100644 --- a/test/unit/general/test_verticalmeanmetersiris.py +++ b/test/unit/general/test_verticalmeanmetersiris.py @@ -1,7 +1,7 @@ # coding=utf-8 from unittest import TestCase -from earthdiagnostics.diagnostic import DiagnosticVariableOption, DiagnosticOptionError +from earthdiagnostics.diagnostic import DiagnosticVariableListOption, DiagnosticOptionError from earthdiagnostics.box import Box from earthdiagnostics.general.verticalmeanmetersiris import VerticalMeanMetersIris from earthdiagnostics.frequency import Frequencies @@ -27,14 +27,14 @@ class TestVerticalMeanMetersIris(TestCase): def fake_parse(self, value): if not value: raise DiagnosticOptionError - return value + return [value] - @patch.object(DiagnosticVariableOption, 'parse', fake_parse) + @patch.object(DiagnosticVariableListOption, 'parse', fake_parse) def test_generate_jobs(self): box = Box(True) - jobs = VerticalMeanMetersIris.generate_jobs(self.diags, ['diagnostic', 'var']) + jobs = VerticalMeanMetersIris.generate_jobs(self.diags, ['diagnostic', 'ocean', 'var']) self.assertEqual(len(jobs), 2) self.assertEqual(jobs[0], VerticalMeanMetersIris(self.data_manager, '20010101', 0, 0, ModelingRealms.ocean, 'var', box)) @@ -45,14 +45,14 @@ class TestVerticalMeanMetersIris(TestCase): box.min_depth = 0 box.max_depth = 100 - jobs = VerticalMeanMetersIris.generate_jobs(self.diags, ['diagnostic', 'var', '0', '100']) + jobs = VerticalMeanMetersIris.generate_jobs(self.diags, ['diagnostic', 'ocean', 'var', '0', '100']) self.assertEqual(len(jobs), 2) self.assertEqual(jobs[0], VerticalMeanMetersIris(self.data_manager, '20010101', 0, 0, ModelingRealms.ocean, 'var', box)) self.assertEqual(jobs[1], VerticalMeanMetersIris(self.data_manager, '20010101', 0, 1, ModelingRealms.ocean, 'var', box)) - jobs = VerticalMeanMetersIris.generate_jobs(self.diags, ['diagnostic', 'var', '0', '100', 'seaIce']) + jobs = VerticalMeanMetersIris.generate_jobs(self.diags, ['diagnostic', 'seaice', 'var', '0', '100']) self.assertEqual(len(jobs), 2) self.assertEqual(jobs[0], VerticalMeanMetersIris(self.data_manager, '20010101', 0, 0, ModelingRealms.seaIce, 'var', box)) @@ -63,7 +63,8 @@ class TestVerticalMeanMetersIris(TestCase): VerticalMeanMetersIris.generate_jobs(self.diags, ['diagnostic']) with self.assertRaises(DiagnosticOptionError): - VerticalMeanMetersIris.generate_jobs(self.diags, ['diagnostic', 'var', '0', '100', 'seaIce', 'extra']) + VerticalMeanMetersIris.generate_jobs(self.diags, ['diagnostic', 'ocean', 'var', '0', '100', 'seaIce', + 'extra']) def test_str(self): box = Box(True) diff --git a/test/unit/ocean/test_interpolatecdo.py b/test/unit/ocean/test_interpolatecdo.py index 04b08552..ba238f28 100644 --- a/test/unit/ocean/test_interpolatecdo.py +++ b/test/unit/ocean/test_interpolatecdo.py @@ -24,9 +24,11 @@ class TestInterpolate(TestCase): raise DiagnosticOptionError return value.split('-') - @patch('earthdiagnostics.ocean.interpolatecdo.InterpolateCDO._compute_weights') + @patch('earthdiagnostics.ocean.interpolatecdo.InterpolateCDO.compute_weights') + @patch('earthdiagnostics.ocean.interpolatecdo.InterpolateCDO.get_sample_grid_file') @patch.object(DiagnosticVariableListOption, 'parse', fake_parse) - def test_generate_jobs(self, mock_weights): + @patch('os.remove') + def test_generate_jobs(self, mock_weights, mock_grid_file, mock_remove): mock_weights.return_value = None jobs = InterpolateCDO.generate_jobs(self.diags, ['interpcdo', 'ocean', 'var']) diff --git a/test/unit/ocean/test_siasiesiv.py b/test/unit/ocean/test_siasiesiv.py index 00f7c68c..2457b72d 100644 --- a/test/unit/ocean/test_siasiesiv.py +++ b/test/unit/ocean/test_siasiesiv.py @@ -15,7 +15,8 @@ class TestSiasiesiv(TestCase): self.diags.config.experiment.get_chunk_list.return_value = (('20010101', 0, 0), ('20010101', 0, 1)) self.mask = Mock() - self.psi = Siasiesiv(self.data_manager, '20000101', 1, 1, Basins().Global, self.mask) + self.var_manager = Mock() + self.psi = Siasiesiv(self.data_manager, '20000101', 1, 1, Basins().Global, self.mask, self.var_manager) def test_str(self): self.assertEquals(str(self.psi), 'Siasiesiv Startdate: 20000101 Member: 1 Chunk: 1 Basin: Global') diff --git a/test/unit/statistics/test_daysoverpercentile.py b/test/unit/statistics/test_daysoverpercentile.py index cc225cd6..26e0506a 100644 --- a/test/unit/statistics/test_daysoverpercentile.py +++ b/test/unit/statistics/test_daysoverpercentile.py @@ -13,14 +13,15 @@ class TestDaysOverPercentile(TestCase): self.data_manager = Mock() self.diags = Mock() self.diags.config.experiment.get_chunk_list.return_value = (('20011101', 0, 0), ('20011101', 0, 1)) + self.diags.config.experiment.startdates = ('20001101', '20011101') def test_generate_jobs(self): jobs = DaysOverPercentile.generate_jobs(self.diags, ['monpercent', 'ocean', 'var', '2000', '2001', '11']) self.assertEqual(len(jobs), 2) self.assertEqual(jobs[0], DaysOverPercentile(self.data_manager, ModelingRealms.ocean, 'var', 2000, 2001, - 2000, 11)) + '20001101', 11)) self.assertEqual(jobs[1], DaysOverPercentile(self.data_manager, ModelingRealms.ocean, 'var', 2000, 2001, - 2001, 11)) + '20011101', 11)) with self.assertRaises(Exception): DaysOverPercentile.generate_jobs(self.diags, ['monpercent', 'ocean', 'var', '2000', '2001']) diff --git a/test/unit/test_config.py b/test/unit/test_config.py index 419be475..a1c8d25b 100644 --- a/test/unit/test_config.py +++ b/test/unit/test_config.py @@ -273,6 +273,7 @@ class TestReportConfig(TestCase): self.assertEquals(config.path, 'new_path') def test_priority(self): + self.mock_parser.add_value('REPORT', 'MAXIMUM_PRIORITY', 3) config = ReportConfig(self.mock_parser) self.assertEquals(config.maximum_priority, 3) @@ -294,12 +295,6 @@ class TestExperimentConfig(TestCase): self.assertEquals(config.atmos_timestep, 6) self.assertEquals(config.ocean_timestep, 6) - def test_cmor_version_required(self): - self.mock_parser.add_value('CMOR', 'VERSION', '20001101') - self.mock_parser.add_value('EXPERIMENT', 'DATA_CONVENTION', 'Primavera') - config = ExperimentConfig(self.mock_parser) - self.assertEquals(config.path, 'new_path') - def test_startdates(self): self.mock_parser.add_value('EXPERIMENT', 'STARTDATES', '20001101 20011101') config = ExperimentConfig(self.mock_parser) diff --git a/test/unit/test_diagnostic.py b/test/unit/test_diagnostic.py index ae9921fa..e3cdcd83 100644 --- a/test/unit/test_diagnostic.py +++ b/test/unit/test_diagnostic.py @@ -271,7 +271,7 @@ class TestDiagnosticVariableListOption(TestCase): var_manager_mock = Mock() var_manager_mock.get_variable.side_effect = (self.get_var_mock('var1'), self.get_var_mock('var2')) diag = DiagnosticVariableListOption(var_manager_mock, 'variables') - self.assertEqual(['var1', 'var2'], diag.parse('var1-var2')) + self.assertEqual(['var1', 'var2'], diag.parse('var1:var2')) def test_parse_one(self): var_manager_mock = Mock() -- GitLab From 491febd211c478d1a83c4d04a0ba2802cdb9a11a Mon Sep 17 00:00:00 2001 From: jvegasbsc Date: Wed, 22 Nov 2017 12:08:44 +0100 Subject: [PATCH 47/47] Fixed run test script --- .coveragerc | 2 ++ test/run_test.py | 13 ++++++------- 2 files changed, 8 insertions(+), 7 deletions(-) diff --git a/.coveragerc b/.coveragerc index e41ecaeb..6c77e847 100644 --- a/.coveragerc +++ b/.coveragerc @@ -2,4 +2,6 @@ branch = True source = earthdiagnostics +[html] +title = Coverage report for EarthDiagnostics diff --git a/test/run_test.py b/test/run_test.py index 59eec7e9..765057a5 100644 --- a/test/run_test.py +++ b/test/run_test.py @@ -3,16 +3,15 @@ Script to run the tests for EarthDiagnostics and generate the code coverage report """ + +import os +work_path = os.path.abspath(os.path.join(os.path.dirname(__file__), '..')) +os.chdir(work_path) +print(work_path) import coverage import unittest -import os -work_path = os.path.abspath('.') -source_path = os.path.join(work_path, '..', 'earthdiagnostics', '*') -print(source_path) -cov = coverage.Coverage(include=source_path) -cov.set_option("run:branch", True) -cov.set_option("html:title", 'Coverage report for EarthDiagnostics') +cov = coverage.Coverage() cov.start() suite = unittest.TestLoader().discover('.') unittest.TextTestRunner(verbosity=2).run(suite) -- GitLab