Skip to content

Commit 35e0167

Browse files
Merge pull request #164 from aodn/version_1.5
Fix several open issues and improve unit tests
2 parents af80337 + 87e8f72 commit 35e0167

20 files changed

Lines changed: 172 additions & 129 deletions

aodntools/timeseries_products/aggregated_timeseries.py

Lines changed: 18 additions & 19 deletions
Original file line numberDiff line numberDiff line change
@@ -5,15 +5,15 @@
55
import os
66
import shutil
77
import tempfile
8-
from datetime import datetime
98

109
import numpy as np
1110
import xarray as xr
1211
from netCDF4 import Dataset, num2date, stringtochar
1312
from pkg_resources import resource_filename
1413

1514
from aodntools import __version__
16-
from aodntools.timeseries_products.common import NoInputFilesError, check_file, in_water
15+
from aodntools.timeseries_products.common import (NoInputFilesError, check_file, in_water, current_utc_timestamp,
16+
TIMESTAMP_FORMAT, DATESTAMP_FORMAT)
1717

1818
TEMPLATE_JSON = resource_filename(__name__, 'aggregated_timeseries_template.json')
1919

@@ -39,7 +39,7 @@ def get_variable_values(nc, variable):
3939
Get values of the variable and its QC flags.
4040
If variable is not present, nan returned, its QC flags set to 9
4141
If variable present but not its QC flags, QC set to 0
42-
:param nc: dataset
42+
:param nc: xarray dataset
4343
:param variable: name of the variable to get
4444
:return: variable values and variable qc flags
4545
"""
@@ -48,6 +48,8 @@ def get_variable_values(nc, variable):
4848

4949
if variable in file_variables:
5050
variable_values = nc[variable].values
51+
if any(np.isnan(variable_values)):
52+
variable_values = np.ma.masked_array(variable_values, mask=np.isnan(variable_values))
5153
if variable+'_quality_control' in file_variables:
5254
variableQC_values = nc[variable+'_quality_control'].values
5355
else:
@@ -303,28 +305,25 @@ def main_aggregator(files_to_agg, var_to_agg, site_code, input_dir='', output_di
303305
ds['source_file'].setncatts(source_file_attributes(download_url_prefix, opendap_url_prefix))
304306

305307
## set global attrs
306-
timeformat = '%Y-%m-%dT%H:%M:%SZ'
307-
file_timeformat = '%Y%m%d'
308-
309-
time_start = num2date(np.min(TIME[:]), time_units, time_calendar).strftime(timeformat)
310-
time_end = num2date(np.max(TIME[:]), time_units, time_calendar).strftime(timeformat)
311-
time_start_filename = num2date(np.min(TIME[:]), time_units, time_calendar).strftime(file_timeformat)
312-
time_end_filename = num2date(np.max(TIME[:]), time_units, time_calendar).strftime(file_timeformat)
308+
time_start = num2date(np.min(TIME[:]), time_units, time_calendar).strftime(TIMESTAMP_FORMAT)
309+
time_end = num2date(np.max(TIME[:]), time_units, time_calendar).strftime(TIMESTAMP_FORMAT)
310+
time_start_filename = num2date(np.min(TIME[:]), time_units, time_calendar).strftime(DATESTAMP_FORMAT)
311+
time_end_filename = num2date(np.max(TIME[:]), time_units, time_calendar).strftime(DATESTAMP_FORMAT)
313312

314313
add_attribute = {
315314
'title': ("Long Timeseries Velocity Aggregated product: " + var_to_agg + " at " +
316315
site_code + " between " + time_start + " and " + time_end),
317316
'site_code': site_code,
318317
'time_coverage_start': time_start,
319318
'time_coverage_end': time_end,
320-
'geospatial_vertical_min': np.min(ds['DEPTH']),
321-
'geospatial_vertical_max': np.max(ds['DEPTH']),
322-
'geospatial_lat_min': np.min(ds['LATITUDE']),
323-
'geospatial_lat_max': np.max(ds['LATITUDE']),
324-
'geospatial_lon_min': np.min(ds['LONGITUDE']),
325-
'geospatial_lon_max': np.max(ds['LONGITUDE']),
326-
'date_created': datetime.utcnow().strftime(timeformat),
327-
'history': datetime.utcnow().strftime(timeformat) + ': Aggregated file created.',
319+
'geospatial_vertical_min': np.min(ds['DEPTH'][:]),
320+
'geospatial_vertical_max': np.max(ds['DEPTH'][:]),
321+
'geospatial_lat_min': np.min(ds['LATITUDE'][:]),
322+
'geospatial_lat_max': np.max(ds['LATITUDE'][:]),
323+
'geospatial_lon_min': np.min(ds['LONGITUDE'][:]),
324+
'geospatial_lon_max': np.max(ds['LONGITUDE'][:]),
325+
'date_created': current_utc_timestamp(),
326+
'history': current_utc_timestamp() + ': Aggregated file created.',
328327
'keywords': ', '.join([var_to_agg, 'AGGREGATED']),
329328
'rejected_files': "\n".join(rejected_files),
330329
'generating_code_version': __version__}
@@ -346,7 +345,7 @@ def main_aggregator(files_to_agg, var_to_agg, site_code, input_dir='', output_di
346345
file_version = 1
347346
output_name = '_'.join(['IMOS', facility_code, data_code, time_start_filename, site_code, ('FV0'+str(file_version)),
348347
(var_to_agg + "-" + product_type),
349-
('END-'+ time_end_filename), 'C-' + datetime.utcnow().strftime(file_timeformat)]) + '.nc'
348+
('END-'+ time_end_filename), 'C-' + current_utc_timestamp(DATESTAMP_FORMAT)]) + '.nc'
350349
ncout_path = os.path.join(output_dir, output_name)
351350
shutil.move(temp_outfile, os.path.join(output_dir, ncout_path))
352351

aodntools/timeseries_products/aggregated_timeseries_template.json

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -289,8 +289,8 @@
289289
"_global":{
290290
"abstract": "Aggregated Time-series Product: This file contains all measurements of the selected variable from all instruments deployed at the selected site. Timestamps are chronologically ordered, but may not be at uniform intervals. Instrument details are stored as a variable in order to keep a record of the origin of each measurement. The quality control flags of the variable of interest and DEPTH are preserved. Out-of-water measurements have been excluded, but no other filtering has been applied to the input data.",
291291
"acknowledgement": "Any users of IMOS data are required to clearly acknowledge the source of the material derived from IMOS in the format: \"Data was sourced from the Integrated Marine Observing System (IMOS) - IMOS is a national collaborative research infrastructure, supported by the Australian Government.\" If relevant, also credit other organisations involved in collection of this particular datastream (as listed in 'credit' in the metadata record).",
292-
"author": "Klein, Eduardo",
293-
"author_email": "eduardo.kleinsalas@utas.edu.au",
292+
"author": "Australian Ocean Data Network (AODN)",
293+
"author_email": "info@aodn.org.au",
294294
"citation": "The citation in a list of references is: \"IMOS [year-of-data-download], [Title], [data-access-URL], accessed [date-of-access].\".",
295295
"Conventions": "CF-1.6,IMOS-1.4",
296296
"data_centre": "Australian Ocean Data Network (AODN)",

aodntools/timeseries_products/common.py

Lines changed: 11 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,12 @@
11
"""Code shared by all timeseries product generating code"""
2+
from datetime import datetime, timezone
3+
24
import numpy as np
35

6+
# Common date/time format strings
7+
TIMESTAMP_FORMAT = '%Y-%m-%dT%H:%M:%SZ'
8+
DATESTAMP_FORMAT = '%Y%m%d'
9+
410

511
class NoInputFilesError(Exception):
612
"""Exception raised if there are no valid input files to aggregate"""
@@ -183,4 +189,8 @@ def in_water(nc):
183189
:param nc: xarray dataset
184190
:return: xarray dataset
185191
"""
186-
return nc.where(in_water_index(nc), drop=True)
192+
return nc.where(in_water_index(nc), drop=True)
193+
194+
195+
def current_utc_timestamp(format=TIMESTAMP_FORMAT):
196+
return datetime.now(timezone.utc).strftime(format)

aodntools/timeseries_products/gridded_timeseries.py

Lines changed: 8 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -3,14 +3,15 @@
33
import argparse
44
import os.path
55
import json
6-
from datetime import datetime
6+
from datetime import datetime, timezone
77

88
import xarray as xr
99
import pandas as pd
1010

1111
from pkg_resources import resource_filename
1212

1313
from aodntools import __version__
14+
from aodntools.timeseries_products.common import current_utc_timestamp, TIMESTAMP_FORMAT, DATESTAMP_FORMAT
1415
import aodntools.timeseries_products.aggregated_timeseries as TStools
1516

1617

@@ -122,14 +123,12 @@ def generate_netcdf_output_filename(nc, facility_code, data_code, VoI, site_code
122123
:return: name of the output file
123124
"""
124125

125-
file_timeformat = '%Y%m%d'
126-
127126
if '_' in VoI:
128127
VoI = VoI.replace('_', '-')
129-
t_start = pd.to_datetime(nc.TIME.min().values).strftime(file_timeformat)
130-
t_end = pd.to_datetime(nc.TIME.max().values).strftime(file_timeformat)
128+
t_start = pd.to_datetime(nc.TIME.min().values).strftime(DATESTAMP_FORMAT)
129+
t_end = pd.to_datetime(nc.TIME.max().values).strftime(DATESTAMP_FORMAT)
131130

132-
output_name = '_'.join(['IMOS', facility_code, data_code, t_start, site_code, ('FV0'+str(file_version)), (VoI+"-"+product_type), ('END-'+ t_end), 'C-' + datetime.utcnow().strftime(file_timeformat)]) + '.nc'
131+
output_name = '_'.join(['IMOS', facility_code, data_code, t_start, site_code, ('FV0'+str(file_version)), (VoI+"-"+product_type), ('END-'+ t_end), 'C-' + current_utc_timestamp(DATESTAMP_FORMAT)]) + '.nc'
133132

134133
return output_name
135134

@@ -250,10 +249,9 @@ def grid_variable(input_file, VoI, depth_bins=None, max_separation=50, depth_bin
250249
for attr in ('geospatial_lat_min', 'geospatial_lat_max', 'geospatial_lon_min', 'geospatial_lon_max', 'site_code',
251250
'included_values_flagged_as', 'contributor_name', 'contributor_role', 'contributor_email'):
252251
VoI_interpolated.attrs[attr] = input_global_attributes[attr]
253-
timeformat = '%Y-%m-%dT%H:%M:%SZ'
254-
date_start = pd.to_datetime(VoI_interpolated.TIME.values.min()).strftime(timeformat)
255-
date_end = pd.to_datetime(VoI_interpolated.TIME.values.max()).strftime(timeformat)
256-
date_created = datetime.utcnow().strftime(timeformat)
252+
date_start = pd.to_datetime(VoI_interpolated.TIME.values.min()).strftime(TIMESTAMP_FORMAT)
253+
date_end = pd.to_datetime(VoI_interpolated.TIME.values.max()).strftime(TIMESTAMP_FORMAT)
254+
date_created = current_utc_timestamp()
257255
VoI_interpolated.attrs.update(global_attribute_dictionary)
258256
VoI_interpolated.attrs.update({
259257
'source_file': input_file,

aodntools/timeseries_products/gridded_timeseries_template.json

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -77,8 +77,8 @@
7777
"title": "Gridded Time Series Product: {VoI} interpolated at {site_code} to fixed target depths at 1-hour time intervals, between {time_min} and {time_max} and {depth_min} and {depth_max} meters.",
7878
"abstract": "Gridded Time Series Product: This file contains {VoI} readings from all instruments deployed at the {site_code} mooring site. The source of the values is the Hourly Time Series Product where TIME is fixed to 1-hour interval. The variable values are interpolated to a fixed target depths using a linear interpolation between consecutive existing depths. Only values flagged as 1 or 2 are used in the interpolation.",
7979
"acknowledgement": "Any users of IMOS data are required to clearly acknowledge the source of the material derived from IMOS in the format: \"Data was sourced from the Integrated Marine Observing System (IMOS) - IMOS is a national collaborative research infrastructure, supported by the Australian Government.\" If relevant, also credit other organisations involved in collection of this particular datastream (as listed in 'credit' in the metadata record).",
80-
"author": "Klein, Eduardo",
81-
"author_email": "eduardo.kleinsalas@utas.edu.au",
80+
"author": "Australian Ocean Data Network (AODN)",
81+
"author_email": "info@aodn.org.au",
8282
"citation": "The citation in a list of references is: \"IMOS [year-of-data-download], [Title], [data-access-URL], accessed [date-of-access].\".",
8383
"Conventions": "CF-1.6,IMOS-1.4",
8484
"data_centre": "Australian Ocean Data Network (AODN)",

aodntools/timeseries_products/hourly_timeseries.py

Lines changed: 8 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,6 @@
44
import json
55
import os.path
66
from collections import OrderedDict
7-
from datetime import datetime
87

98
import numpy as np
109
import pandas as pd
@@ -14,7 +13,8 @@
1413

1514
from aodntools import __version__
1615
from aodntools.timeseries_products import aggregated_timeseries as utils
17-
from aodntools.timeseries_products.common import NoInputFilesError, check_file, get_qc_variable_names, in_water
16+
from aodntools.timeseries_products.common import (NoInputFilesError, check_file, get_qc_variable_names, in_water,
17+
current_utc_timestamp, TIMESTAMP_FORMAT, DATESTAMP_FORMAT)
1818

1919
TEMPLATE_JSON = resource_filename(__name__, 'hourly_timeseries_template.json')
2020
BINNING_METHOD_JSON = resource_filename(__name__, 'binning_method.json')
@@ -180,8 +180,8 @@ def set_globalattr(nc_aggregated, templatefile, site_code, add_attribute, parame
180180
'geospatial_lat_max': nc_aggregated.LATITUDE.values.max(),
181181
'geospatial_lon_min': nc_aggregated.LONGITUDE.values.min(),
182182
'geospatial_lon_max': nc_aggregated.LONGITUDE.values.max(),
183-
'date_created': datetime.utcnow().strftime(timeformat),
184-
'history': datetime.utcnow().strftime(timeformat) + ': Hourly aggregated file created.',
183+
'date_created': current_utc_timestamp(),
184+
'history': current_utc_timestamp() + ': Hourly aggregated file created.',
185185
'keywords': ', '.join(parameter_names + ['HOURLY', 'AGGREGATED'])}
186186
global_metadata.update(agg_attr)
187187
global_metadata.update(add_attribute)
@@ -259,14 +259,12 @@ def generate_netcdf_output_filename(nc, facility_code, data_code, site_code, pro
259259
:return: name of the output file
260260
"""
261261

262-
file_timeformat = '%Y%m%d'
263-
264-
t_start = pd.to_datetime(nc.TIME.min().values).strftime(file_timeformat)
265-
t_end = pd.to_datetime(nc.TIME.max().values).strftime(file_timeformat)
262+
t_start = pd.to_datetime(nc.TIME.min().values).strftime(DATESTAMP_FORMAT)
263+
t_end = pd.to_datetime(nc.TIME.max().values).strftime(DATESTAMP_FORMAT)
266264

267265
output_name = '_'.join(
268266
['IMOS', facility_code, data_code, t_start, site_code, ('FV0' + str(file_version)), product_type,
269-
('END-' + t_end), 'C-' + datetime.utcnow().strftime(file_timeformat)]) + '.nc'
267+
('END-' + t_end), 'C-' + current_utc_timestamp(DATESTAMP_FORMAT)]) + '.nc'
270268

271269
return output_name
272270

@@ -567,4 +565,4 @@ def hourly_aggregator(files_to_aggregate, site_code, qcflags, input_dir='', outp
567565
qcflags = [int(i) for i in args.qcflags]
568566

569567
hourly_aggregator(files_to_aggregate=files_to_aggregate, site_code=args.site_code, qcflags=qcflags,
570-
input_dir=args.input_dir, output_dir=args.output_path)
568+
input_dir=args.input_dir, output_dir=args.output_dir)

aodntools/timeseries_products/hourly_timeseries_template.json

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -368,8 +368,8 @@
368368
"_global":{
369369
"abstract": "Hourly Time Series Product: This file contains selected variables from all instruments deployed at the {site_code} mooring site. The values are binned to a fixed 1-hour interval. Instrument details are stored as variables in order to keep a record of the origin of each measurement. Out-of-water measurements have been excluded. Only values flagged as {flags} are retained in the aggregation.",
370370
"acknowledgement": "Any users of IMOS data are required to clearly acknowledge the source of the material derived from IMOS in the format: \"Data was sourced from the Integrated Marine Observing System (IMOS) - IMOS is a national collaborative research infrastructure, supported by the Australian Government.\" If relevant, also credit other organisations involved in collection of this particular datastream (as listed in 'credit' in the metadata record).",
371-
"author": "Klein, Eduardo",
372-
"author_email": "eduardo.kleinsalas@utas.edu.au",
371+
"author": "Australian Ocean Data Network (AODN)",
372+
"author_email": "info@aodn.org.au",
373373
"citation": "The citation in a list of references is: \"IMOS [year-of-data-download], [Title], [data-access-URL], accessed [date-of-access].\".",
374374
"Conventions": "CF-1.6,IMOS-1.4",
375375
"data_centre": "Australian Ocean Data Network (AODN)",

aodntools/timeseries_products/velocity_aggregated_timeseries.py

Lines changed: 10 additions & 13 deletions
Original file line numberDiff line numberDiff line change
@@ -4,15 +4,15 @@
44
from netCDF4 import Dataset, num2date, stringtochar
55
import numpy as np
66
import json
7-
from datetime import datetime
87
import argparse
98
from pkg_resources import resource_filename
109
from aodntools import __version__
1110

1211
import xarray as xr
1312

1413
from aodntools.timeseries_products import aggregated_timeseries as utils
15-
from aodntools.timeseries_products.common import NoInputFilesError, check_velocity_file
14+
from aodntools.timeseries_products.common import (NoInputFilesError, check_velocity_file, current_utc_timestamp,
15+
TIMESTAMP_FORMAT, DATESTAMP_FORMAT)
1616

1717
TEMPLATE_JSON = resource_filename(__name__, 'velocity_aggregated_timeseries_template.json')
1818

@@ -144,7 +144,7 @@ def velocity_aggregated(files_to_agg, site_code, input_dir='', output_dir='./',
144144
WCUR[start:end] = flat_variable(nc, 'WCUR')
145145
WCURqc[start:end] = flat_variable(nc, 'WCUR_quality_control')
146146
else:
147-
WCUR[start:end] = np.full(n_obs, np.nan)
147+
WCUR[start:end] = np.ma.masked
148148
WCURqc[start:end] = np.full(n_obs, 9)
149149

150150
##calculate depth and add CELL_INDEX
@@ -188,13 +188,10 @@ def velocity_aggregated(files_to_agg, site_code, input_dir='', output_dir='./',
188188
ds['source_file'].setncatts(utils.source_file_attributes(download_url_prefix, opendap_url_prefix))
189189

190190
## set global attrs
191-
timeformat = '%Y-%m-%dT%H:%M:%SZ'
192-
file_timeformat = '%Y%m%d'
193-
194-
time_start = num2date(np.min(TIME[:]), time_units, time_calendar).strftime(timeformat)
195-
time_end = num2date(np.max(TIME[:]), time_units, time_calendar).strftime(timeformat)
196-
time_start_filename = num2date(np.min(TIME[:]), time_units, time_calendar).strftime(file_timeformat)
197-
time_end_filename = num2date(np.max(TIME[:]), time_units, time_calendar).strftime(file_timeformat)
191+
time_start = num2date(np.min(TIME[:]), time_units, time_calendar).strftime(TIMESTAMP_FORMAT)
192+
time_end = num2date(np.max(TIME[:]), time_units, time_calendar).strftime(TIMESTAMP_FORMAT)
193+
time_start_filename = num2date(np.min(TIME[:]), time_units, time_calendar).strftime(DATESTAMP_FORMAT)
194+
time_end_filename = num2date(np.max(TIME[:]), time_units, time_calendar).strftime(DATESTAMP_FORMAT)
198195

199196
add_attribute = {
200197
'title': ("Long Timeseries Velocity Aggregated product: " + ', '.join(varlist) + " at " +
@@ -208,8 +205,8 @@ def velocity_aggregated(files_to_agg, site_code, input_dir='', output_dir='./',
208205
'geospatial_lat_max': np.max(ds['LATITUDE']),
209206
'geospatial_lon_min': np.min(ds['LONGITUDE']),
210207
'geospatial_lon_max': np.max(ds['LONGITUDE']),
211-
'date_created': datetime.utcnow().strftime(timeformat),
212-
'history': datetime.utcnow().strftime(timeformat) + ': Aggregated file created.',
208+
'date_created': current_utc_timestamp(),
209+
'history': current_utc_timestamp() + ': Aggregated file created.',
213210
'keywords': ', '.join(varlist + ['AGGREGATED']),
214211
'rejected_files': "\n".join(bad_files.keys()),
215212
'generating_code_version': __version__
@@ -235,7 +232,7 @@ def velocity_aggregated(files_to_agg, site_code, input_dir='', output_dir='./',
235232
file_version = 1
236233
output_name = '_'.join(['IMOS', facility_code, data_code, time_start_filename, site_code, ('FV0'+str(file_version)),
237234
("velocity-"+product_type),
238-
('END-'+ time_end_filename), 'C-' + datetime.utcnow().strftime(file_timeformat)]) + '.nc'
235+
('END-'+ time_end_filename), 'C-' + current_utc_timestamp(DATESTAMP_FORMAT)]) + '.nc'
239236
ncout_path = os.path.join(output_dir, output_name)
240237
shutil.move(temp_outfile, ncout_path)
241238

0 commit comments

Comments (0)