Source code for temporal.mapcalc

"""
Raster and 3d raster mapcalculation functions

(C) 2012-2013 by the GRASS Development Team
This program is free software under the GNU General Public
License (>=v2). Read the file COPYING that comes with GRASS
for details.

:authors: Soeren Gebbert
"""

import copy
import sys
from datetime import datetime
from multiprocessing import Process

import grass.script as gs
from grass.exceptions import CalledModuleError

from .core import (
    SQLDatabaseInterfaceConnection,
    get_current_mapset,
    get_tgis_message_interface,
)
from .datetime_math import time_delta_to_relative_time
from .open_stds import check_new_stds, open_new_stds, open_old_stds

# Message template used when an absolute-time-only operator is found in an
# expression evaluated against relative time. The "%s" placeholder receives
# the operator family, e.g. "start_*" or "end_*".
_TEMPORAL_OPERATOR_SUPPORTS_ONLY_ABSOLUTE_TIME = (
    "The temporal operators <%s> support only absolute time."
)
############################################################################


def dataset_mapcalculator(
    inputs,
    output,
    type,
    expression,
    base,
    method,
    nprocs: int = 1,
    register_null: bool = False,
    spatial: bool = False,
):
    """Perform map-calculations of maps from different space time
    raster/raster3d datasets, using a specific sampling method
    to select temporal related maps.

    A mapcalc expression must be provided to process the temporal
    selected maps. Temporal operators are available in addition to
    the r.mapcalc operators:

    Supported operators for relative and absolute time are:

    - td() - the time delta of the current interval in days
      and fractions of days or the unit in case of relative time
    - start_time() - The start time of the interval from the begin of
      the time series in days and fractions of days or the unit in
      case of relative time
    - end_time() - The end time of the current interval from the begin
      of the time series in days and fractions of days or the unit in
      case of relative time

    Supported operators for absolute time:

    - start_doy() - Day of year (doy) from the start time [1 - 366]
    - start_dow() - Day of week (dow) from the start time [1 - 7],
      the start of the week is monday == 1
    - start_year() - The year of the start time [0 - 9999]
    - start_month() - The month of the start time [1 - 12]
    - start_week() - Week of year of the start time [1 - 54]
    - start_day() - Day of month from the start time [1 - 31]
    - start_hour() - The hour of the start time [0 - 23]
    - start_minute() - The minute of the start time [0 - 59]
    - start_second() - The second of the start time [0 - 59]
    - end_doy() - Day of year (doy) from the end time [1 - 366]
    - end_dow() - Day of week (dow) from the end time [1 - 7],
      the start of the week is monday == 1
    - end_year() - The year of the end time [0 - 9999]
    - end_month() - The month of the end time [1 - 12]
    - end_week() - Week of year of the end time [1 - 54]
    - end_day() - Day of month from the end time [1 - 31]
    - end_hour() - The hour of the end time [0 - 23]
    - end_minute() - The minute of the end time [0 - 59]
    - end_second() - The second of the end time [0 - 59]

    :param inputs: The names of the input space time raster/raster3d
                   datasets, separated by commas
    :param output: The name of the extracted new space time raster(3d)
                   dataset
    :param type: The type of the dataset: "raster" or "raster3d"
    :param expression: The r(3).mapcalc expression
    :param base: The base name of the new created maps in case a
                 mapcalc expression is provided
    :param method: The method to be used for temporal sampling
    :param nprocs: The number of parallel processes to be used for
                   mapcalc processing
    :param register_null: Set this to True to register empty maps
    :param spatial: Check spatial overlap
    :return: 0 when no samples or no registered maps were found,
             otherwise None
    """

    # We need a database interface for fast computation
    dbif = SQLDatabaseInterfaceConnection()
    dbif.connect()

    mapset = get_current_mapset()
    msgr = get_tgis_message_interface()

    input_name_list = inputs.split(",")

    first_input = open_old_stds(input_name_list[0], type, dbif)

    # Skip sampling when only one dataset is specified (with different
    # band filters)
    input_name_list_uniq = []
    for input_name in input_name_list:
        ds = open_old_stds(input_name, type, dbif)
        ds_name = ds.get_name(semantic_label=False)
        if ds_name not in input_name_list_uniq:
            input_name_list_uniq.append(ds_name)
    do_sampling = len(input_name_list_uniq) > 1

    # All additional inputs in reverse sorted order to avoid
    # wrong name substitution
    input_list = [
        copy.copy(open_old_stds(input_name, type, dbif))
        for input_name in sorted(input_name_list[1:], reverse=True)
    ]

    new_sp = check_new_stds(output, type, dbif, gs.overwrite())

    # Sample all inputs by the first input and create a sample matrix
    if spatial:
        msgr.message(_("Starting spatio-temporal sampling..."))
    else:
        msgr.message(_("Starting temporal sampling..."))
    # One row of map names per dataset; id_list holds the matching
    # dataset names that get substituted in the expression
    map_matrix = []
    id_list = []
    sample_map_list = []

    if len(input_list) > 0 and do_sampling:
        # First entry is the first dataset id
        id_list.append(first_input.get_name())

        has_samples = False
        for dataset in input_list:
            samples = dataset.sample_by_dataset(
                stds=first_input, method=method, spatial=spatial, dbif=dbif
            )

            # In case samples are not found
            if not samples:
                dbif.close()
                msgr.message(_("No samples found for map calculation"))
                return 0

            # The first entries are the samples (granules of the first
            # input); gaps are not considered
            if not has_samples:
                granules = [
                    entry["granule"]
                    for entry in samples
                    if entry["granule"].get_id() is not None
                ]
                sample_map_list.extend(granules)
                # Attach the map names
                map_matrix.append([granule.get_name() for granule in granules])
                has_samples = True

            map_name_list = []
            for entry in samples:
                maplist = entry["samples"]
                granule = entry["granule"]

                # Do not consider gaps in the sampler
                if granule.get_id() is None:
                    continue

                if len(maplist) > 1:
                    msgr.warning(
                        _(
                            "Found more than a single map in a sample "
                            "granule. Only the first map is used for "
                            "computation. Use t.rast.aggregate.ds to "
                            "create synchronous raster datasets."
                        )
                    )

                # Store all maps! This includes non existent maps,
                # identified by id == None
                map_name_list.append(maplist[0].get_name())

            # Attach the map names
            map_matrix.append(map_name_list)

            id_list.append(dataset.get_name())
    else:
        input_list.insert(0, first_input)
        for dataset in input_list:
            registered_maps = dataset.get_registered_maps_as_objects(dbif=dbif)

            if not registered_maps:
                dbif.close()
                msgr.message(
                    _("No maps registered in input dataset <{}>").format(
                        dataset.get_name()
                    )
                )
                return 0

            sample_map_list.extend(registered_maps)

            # Attach the map names
            map_matrix.append(
                [registered_map.get_name() for registered_map in registered_maps]
            )

            id_list.append(dataset.get_name())

    # Needed for map registration
    map_list = []

    if len(map_matrix) > 0:
        msgr.message(_("Starting mapcalc computation..."))

        count = 0
        # Get the number of samples
        num = len(map_matrix[0])

        # Parallel processing
        proc_list = []
        mapcalc_runner = _run_mapcalc2d if type == "raster" else _run_mapcalc3d

        # For all samples
        for i in range(num):
            count += 1
            msgr.percent(count, num, 10)

            # Create the r.mapcalc statement for the current time step
            map_name = "{base}_{suffix}".format(
                base=base, suffix=gs.get_num_suffix(count, num)
            )
            # Remove spaces and new lines
            expr = expression.replace(" ", "")

            # Check that all maps are in the sample
            valid_maps = True
            # Replace all dataset names with their map names of the
            # current time step
            for dataset_name, map_names in zip(id_list, map_matrix):
                if map_names[i] is None:
                    valid_maps = False
                    break
                # Substitute the dataset name with the map name
                expr = expr.replace(dataset_name, map_names[i])

            # Proceed with the next sample
            if not valid_maps:
                continue

            # Create the new map id and check if the map is already
            # in the database
            map_id = map_name + "@" + mapset

            new_map = first_input.get_new_map_instance(map_id)

            # Check if new map is in the temporal database
            if new_map.is_in_db(dbif):
                if gs.overwrite():
                    # Remove the existing temporal database entry
                    new_map.delete(dbif)
                    new_map = first_input.get_new_map_instance(map_id)
                else:
                    msgr.error(
                        _(
                            "Map <%s> is already in temporal database, "
                            "use overwrite flag to overwrite"
                        )
                        % map_id
                    )
                    continue

            sample_map = sample_map_list[i]

            # Set the time stamp
            if sample_map.is_time_absolute():
                start, end = sample_map.get_absolute_time()
                new_map.set_absolute_time(start, end)
            else:
                start, end, unit = sample_map.get_relative_time()
                new_map.set_relative_time(start, end, unit)

            # Set the semantic label
            semantic_label = sample_map.metadata.get_semantic_label()
            if semantic_label is not None:
                new_map.set_semantic_label(semantic_label)

            # Parse the temporal expressions
            expr = _operator_parser(expr, sample_map_list[0], sample_map)
            # Add the output map name
            expr = "%s=%s" % (map_name, expr)

            map_list.append(new_map)

            msgr.verbose(_('Apply mapcalc expression: "%s"') % expr)

            # Start the parallel r.mapcalc computation
            proc = Process(target=mapcalc_runner, args=(expr,))
            proc_list.append(proc)
            proc.start()

            # Wait for the batch as soon as nprocs processes are running
            if len(proc_list) == nprocs:
                _finish_mapcalc_batch(proc_list, dbif, msgr)
                proc_list = []

        # A partial batch remains when the sample count is not a multiple
        # of nprocs or when trailing samples were skipped; it must be
        # finished before the maps are read for registration
        if proc_list:
            _finish_mapcalc_batch(proc_list, dbif, msgr)
            proc_list = []

        # Register the new maps in the output space time dataset
        msgr.message(_("Starting map registration in temporal database..."))

        (
            temporal_type,
            semantic_type,
            title,
            description,
        ) = first_input.get_initial_values()

        new_sp = open_new_stds(
            output,
            type,
            temporal_type,
            title,
            description,
            semantic_type,
            dbif,
            gs.overwrite(),
        )
        count = 0

        # collect empty maps to remove them
        empty_maps = []

        # Insert maps in the temporal database and in the new space time
        # dataset
        for new_map in map_list:
            count += 1
            msgr.percent(count, num, 10)

            # Read the map data
            new_map.load()

            # In case of a null map continue, do not register null maps
            if (
                new_map.metadata.get_min() is None
                and new_map.metadata.get_max() is None
            ):
                if not register_null:
                    empty_maps.append(new_map)
                    continue

            # Insert map in temporal database
            new_map.insert(dbif)

            new_sp.register_map(new_map, dbif)

        # Update the spatio-temporal extent and the metadata table entries
        new_sp.update_from_registered_maps(dbif)

        # Remove empty maps
        if len(empty_maps) > 0:
            n_empty, n_tot = len(empty_maps), len(map_list)
            msgr.warning(
                _("Removing {}/{} ({}%) maps because empty...").format(
                    n_empty, n_tot, n_empty * 100.0 / n_tot
                )
            )
            names = ",".join(str(empty_map.get_name()) for empty_map in empty_maps)
            if type == "raster":
                gs.run_command(
                    "g.remove", flags="f", type="raster", name=names, quiet=True
                )
            elif type == "raster3d":
                gs.run_command(
                    "g.remove", flags="f", type="raster_3d", name=names, quiet=True
                )

    dbif.close()


def _finish_mapcalc_batch(processes, dbif, msgr) -> None:
    """Join all started mapcalc processes and abort if any of them failed.

    Every process is joined before the exit codes are evaluated. Each exit
    code is checked on its own so that a negative code (termination by
    signal) cannot cancel out a positive one.

    :param processes: The started multiprocessing.Process objects
    :param dbif: The database interface that is closed before aborting
    :param msgr: The message interface used to report the fatal error
    """
    failed = False
    for proc in processes:
        proc.join()
        if proc.exitcode != 0:
            failed = True

    if failed:
        dbif.close()
        msgr.fatal(_("Error while mapcalc computation"))
###############################################################################


def _run_mapcalc2d(expr) -> None:
    """Helper function to run r.mapcalc in parallel

    The process exits with status 1 when the module call fails, so that the
    parent can detect the failure through the process exit code.

    :param expr: The complete r.mapcalc expression ("output=...")
    """
    try:
        gs.run_command(
            "r.mapcalc", expression=expr, overwrite=gs.overwrite(), quiet=True
        )
    except CalledModuleError:
        sys.exit(1)


###############################################################################


def _run_mapcalc3d(expr) -> None:
    """Helper function to run r3.mapcalc in parallel

    The process exits with status 1 when the module call fails, so that the
    parent can detect the failure through the process exit code.

    :param expr: The complete r3.mapcalc expression ("output=...")
    """
    try:
        gs.run_command(
            "r3.mapcalc", expression=expr, overwrite=gs.overwrite(), quiet=True
        )
    except CalledModuleError:
        sys.exit(1)


###############################################################################


def _operator_parser(expr, first, current):
    """This method parses the expression string and substitutes
    the temporal operators with numerical values.

    Supported operators for relative and absolute time are:

    - td() - the time delta of the current interval in days
      and fractions of days or the unit in case of relative time
    - start_time() - The start time of the interval from the begin of
      the time series in days and fractions of days or the unit in
      case of relative time
    - end_time() - The end time of the current interval from the begin
      of the time series in days and fractions of days or the unit in
      case of relative time

    Supported operators for absolute time:

    - start_doy() - Day of year (doy) from the start time [1 - 366]
    - start_dow() - Day of week (dow) from the start time [1 - 7],
      the start of the week is monday == 1
    - start_year() - The year of the start time [0 - 9999]
    - start_month() - The month of the start time [1 - 12]
    - start_week() - Week of year of the start time [1 - 54]
    - start_day() - Day of month from the start time [1 - 31]
    - start_hour() - The hour of the start time [0 - 23]
    - start_minute() - The minute of the start time [0 - 59]
    - start_second() - The second of the start time [0 - 59]
    - end_doy() - Day of year (doy) from the end time [1 - 366]
    - end_dow() - Day of week (dow) from the end time [1 - 7],
      the start of the week is monday == 1
    - end_year() - The year of the end time [0 - 9999]
    - end_month() - The month of the end time [1 - 12]
    - end_week() - Week of year of the end time [1 - 54]
    - end_day() - Day of month from the end time [1 - 31]
    - end_hour() - The hour of the end time [0 - 23]
    - end_minute() - The minute of the end time [0 - 59]
    - end_second() - The second of the end time [0 - 59]

    :param expr: The mapcalc expression to process
    :param first: The first sample map, it defines the temporal type and
                  the begin of the time series
    :param current: The sample map of the current time step
    :return: The modified expression
    """
    is_time_absolute = first.is_time_absolute()

    expr = _parse_td_operator(expr, is_time_absolute, first, current)
    expr = _parse_start_time_operator(expr, is_time_absolute, first, current)
    expr = _parse_end_time_operator(expr, is_time_absolute, first, current)
    expr = _parse_start_operators(expr, is_time_absolute, current)
    return _parse_end_operators(expr, is_time_absolute, current)


###############################################################################


def _day_of_year(timestamp):
    """Return the day of year [1 - 366] of a datetime object"""
    return (timestamp - datetime(timestamp.year, 1, 1)).days + 1


# Operator suffix -> function extracting the value from a datetime object.
# The same table serves the start_*() and the end_*() operators.
_ABSOLUTE_TIME_FIELDS = (
    ("year", lambda timestamp: timestamp.year),
    ("month", lambda timestamp: timestamp.month),
    ("week", lambda timestamp: timestamp.isocalendar()[1]),
    ("day", lambda timestamp: timestamp.day),
    ("hour", lambda timestamp: timestamp.hour),
    ("minute", lambda timestamp: timestamp.minute),
    ("second", lambda timestamp: timestamp.second),
    ("dow", lambda timestamp: timestamp.isoweekday()),
    ("doy", _day_of_year),
)


def _replace_absolute_time_operators(expr, prefix, timestamp, is_time_absolute):
    """Substitute all <prefix>_*() operators found in the expression.

    A fatal error is issued through the message interface when an operator
    is present but the time is not absolute. A missing (None) timestamp is
    substituted by null().

    :param expr: The mapcalc expression to process
    :param prefix: The operator family prefix, "start" or "end"
    :param timestamp: The datetime object the values are taken from or None
    :param is_time_absolute: True if the sample maps have absolute time
    :return: The modified expression
    """
    for field, extract in _ABSOLUTE_TIME_FIELDS:
        operator = "%s_%s()" % (prefix, field)
        if operator not in expr:
            continue
        if not is_time_absolute:
            # The message interface is only needed on this error path
            get_tgis_message_interface().fatal(
                _(_TEMPORAL_OPERATOR_SUPPORTS_ONLY_ABSOLUTE_TIME) % (prefix + "_*")
            )
        value = "null()" if timestamp is None else str(extract(timestamp))
        expr = expr.replace(operator, value)

    return expr


def _parse_start_operators(expr, is_time_absolute: bool, current):
    """
    Supported operators for absolute time:

    - start_doy() - Day of year (doy) from the start time [1 - 366]
    - start_dow() - Day of week (dow) from the start time [1 - 7],
      the start of the week is monday == 1
    - start_year() - The year of the start time [0 - 9999]
    - start_month() - The month of the start time [1 - 12]
    - start_week() - Week of year of the start time [1 - 54]
    - start_day() - Day of month from the start time [1 - 31]
    - start_hour() - The hour of the start time [0 - 23]
    - start_minute() - The minute of the start time [0 - 59]
    - start_second() - The second of the start time [0 - 59]

    :param expr: The mapcalc expression to process
    :param is_time_absolute: True if the sample maps have absolute time
    :param current: The sample map of the current time step
    :return: The modified expression
    """
    start, end = current.get_absolute_time()
    return _replace_absolute_time_operators(expr, "start", start, is_time_absolute)


###############################################################################


def _parse_end_operators(expr, is_time_absolute: bool, current):
    """
    Supported operators for absolute time:

    - end_doy() - Day of year (doy) from the end time [1 - 366]
    - end_dow() - Day of week (dow) from the end time [1 - 7],
      the start of the week is monday == 1
    - end_year() - The year of the end time [0 - 9999]
    - end_month() - The month of the end time [1 - 12]
    - end_week() - Week of year of the end time [1 - 54]
    - end_day() - Day of month from the end time [1 - 31]
    - end_hour() - The hour of the end time [0 - 23]
    - end_minute() - The minute of the end time [0 - 59]
    - end_second() - The second of the end time [0 - 59]

    In case of time instances the end* expression will be replaced by
    null()

    :param expr: The mapcalc expression to process
    :param is_time_absolute: True if the sample maps have absolute time
    :param current: The sample map of the current time step
    :return: The modified expression
    """
    start, end = current.get_absolute_time()
    return _replace_absolute_time_operators(expr, "end", end, is_time_absolute)


###############################################################################


def _parse_td_operator(expr, is_time_absolute: bool, first, current):
    """Parse the time delta operator td(). This operator
    represents the size of the current sample time interval
    in days and fraction of days for absolute time,
    and in relative units in case of relative time.

    In case of time instances, the td() operator will be of type null().

    :param expr: The mapcalc expression to process
    :param is_time_absolute: True if the sample maps have absolute time
    :param first: The first sample map (not used by this operator)
    :param current: The sample map of the current time step
    :return: The modified expression
    """
    if "td()" not in expr:
        return expr

    td = "null()"
    if is_time_absolute:
        start, end = current.get_absolute_time()
        if end is not None:
            td = time_delta_to_relative_time(end - start)
    else:
        start, end, unit = current.get_relative_time()
        if end is not None:
            td = end - start

    return expr.replace("td()", str(td))


###############################################################################


def _parse_start_time_operator(expr, is_time_absolute: bool, first, current):
    """Parse the start_time() operator. This operator represent
    the time difference between the start time of the sample space time
    raster dataset and the start time of the current sample interval or
    instance. The time is measured in days and fraction of days for absolute
    time, and in relative units in case of relative time.

    :param expr: The mapcalc expression to process
    :param is_time_absolute: True if the sample maps have absolute time
    :param first: The first sample map, the begin of the time series
    :param current: The sample map of the current time step
    :return: The modified expression
    """
    if "start_time()" not in expr:
        return expr

    if is_time_absolute:
        first_start, end = first.get_absolute_time()
        start, end = current.get_absolute_time()
        offset = time_delta_to_relative_time(start - first_start)
    else:
        first_start, end, unit = first.get_relative_time()
        start, end, unit = current.get_relative_time()
        offset = start - first_start

    return expr.replace("start_time()", str(offset))


###############################################################################


def _parse_end_time_operator(expr, is_time_absolute: bool, first, current):
    """Parse the end_time() operator. This operator represent
    the time difference between the start time of the sample space time
    raster dataset and the end time of the current sample interval. The time
    is measured in days and fraction of days for absolute time,
    and in relative units in case of relative time.

    The end_time() will be represented by null() in case of a time instance.

    :param expr: The mapcalc expression to process
    :param is_time_absolute: True if the sample maps have absolute time
    :param first: The first sample map, the begin of the time series
    :param current: The sample map of the current time step
    :return: The modified expression
    """
    if "end_time()" not in expr:
        return expr

    offset = "null()"
    if is_time_absolute:
        first_start, end = first.get_absolute_time()
        start, end = current.get_absolute_time()
        if end is not None:
            offset = time_delta_to_relative_time(end - first_start)
    else:
        first_start, end, unit = first.get_relative_time()
        start, end, unit = current.get_relative_time()
        # Compare against None: a relative end time of 0 is a valid
        # interval end and must not be treated as a time instance
        if end is not None:
            offset = end - first_start

    return expr.replace("end_time()", str(offset))