Source code for psyclone.psyir.transformations.extract_trans

# -----------------------------------------------------------------------------
# BSD 3-Clause License
#
# Copyright (c) 2019-2024, Science and Technology Facilities Council.
# All rights reserved.
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions are met:
#
# * Redistributions of source code must retain the above copyright notice, this
#   list of conditions and the following disclaimer.
#
# * Redistributions in binary form must reproduce the above copyright notice,
#   this list of conditions and the following disclaimer in the documentation
#   and/or other materials provided with the distribution.
#
# * Neither the name of the copyright holder nor the names of its
#   contributors may be used to endorse or promote products derived from
#   this software without specific prior written permission.
#
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
# "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
# LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
# FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
# COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
# INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
# BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
# LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
# CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
# LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
# ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
# POSSIBILITY OF SUCH DAMAGE.
# -----------------------------------------------------------------------------
# Authors: I. Kavcic, Met Office
#          A. R. Porter and N. Nobre, STFC Daresbury Lab
#          J. Henrichs, Bureau of Meteorology

'''This module contains the base class for extracting extracting a region
of an Invoke into a stand-alone application."
'''

from psyclone.configuration import Config
from psyclone.psyGen import BuiltIn, Kern, HaloExchange, GlobalSum
from psyclone.psyir.nodes import (CodeBlock, ExtractNode, Loop, Schedule,
                                  Directive, OMPParallelDirective,
                                  ACCParallelDirective)
from psyclone.psyir.transformations.psy_data_trans import PSyDataTrans
from psyclone.psyir.transformations.transformation_error \
    import TransformationError


[docs]class ExtractTrans(PSyDataTrans): '''This transformation inserts an ExtractNode or a node derived from ExtractNode into the PSyIR of a schedule. At code creation time this node will use the PSyData API to create code that can write the input and output parameters to a file. The node might also create a stand-alone driver program that can read the created file and then execute the instrumented region. Examples are given in the derived classes DynamoExtractTrans and GOceanExtractTrans. After applying the transformation the Nodes marked for extraction are children of the ExtractNode. Nodes to extract can be individual constructs within an Invoke (e.g. Loops containing a Kernel or BuiltIn call) or entire Invokes. This functionality does not support distributed memory. :param node_class: The Node class of which an instance will be inserted \ into the tree (defaults to ExtractNode), but can be any derived class. :type node_class: :py:class:`psyclone.psyir.nodes.ExtractNode` or \ derived class ''' # The types of node that this transformation cannot enclose excluded_node_types = (CodeBlock, ExtractNode, HaloExchange, GlobalSum) def __init__(self, node_class=ExtractNode): # This function is required to provide the appropriate default # node class. super().__init__(node_class=node_class) # ------------------------------------------------------------------------- def get_default_options(self): '''Returns a new dictionary with additional options, specific to the transformation, that will be added to the user option. Any values specified by the user will take precedence. For the extract transformation, by default we want VariablesAccessInformation to report array arguments to lbound, ubound and size as read accesses, so we are certain these arrays will be included in the extraction. :returns: a dictionary with additional options. :rtype: Dict[str, Any] ''' return {"COLLECT-ARRAY-SHAPE-READS": True} # ------------------------------------------------------------------------- @staticmethod def determine_postfix(read_write_info, postfix="_post"): ''' This function prevents any name clashes that can occur when adding the postfix to output variable names. For example, if there is an output variable 'a', the driver (and the output file) will contain two variables: 'a' and 'a_post'. But if there is also another variable called 'a_post', a name clash would occur (two identical keys in the output file, and two identical local variables in the driver). In order to avoid this, the suffix 'post' is changed (to 'post0', 'post1', ...) until any name clashes are avoided. This works for structured and non-structured types. :param read_write_info: information about all input and output \ parameters. :type read_write_info: :py:class:`psyclone.psyir.tools.ReadWriteInfo` :param str postfix: the postfix to append to each output variable. :returns: a postfix that can be added to each output variable without generating a name clash. :rtype: str ''' suffix = "" # Create the a set of all input and output variables (to avoid # checking input+output variables more than once) all_vars = read_write_info.set_of_all_used_vars # The signatures in the input/output list need to be converted # back to strings to easily append the suffix. all_vars_string = [str(input_var) for _, input_var in all_vars] while any(str(out_sig)+postfix+str(suffix) in all_vars_string for out_sig in read_write_info.signatures_written): if suffix == "": suffix = 0 else: suffix += 1 return postfix+str(suffix) # ------------------------------------------------------------------------- def validate(self, node_list, options=None): # pylint: disable=arguments-renamed '''Performs validation checks specific to extract-based transformations. :param node_list: the list of Node(s) we are checking. :type node_list: list of :py:class:`psyclone.psyir.nodes.Node` :param options: a dictionary with options for transformations. :type options: Optional[Dict[str, Any]] :raises TransformationError: if distributed memory is configured. :raises TransformationError: if transformation is applied to a \ Kernel or a BuiltIn call without its \ parent Loop. :raises TransformationError: if transformation is applied to a Loop \ without its parent Directive when \ optimisations are applied. :raises TransformationError: if transformation is applied to an \ orphaned Directive without its parent \ Directive. ''' # Check ExtractTrans specific constraints. # Extracting distributed memory code is not supported due to # generation of infrastructure calls to set halos dirty or clean. # This constraint covers the presence of HaloExchange and # GlobalSum classes as they are only generated when distributed # memory is enabled. But in case of the Nemo API, we don't even # support distributed memory, so ignore the setting of distributed # memory in this case: config = Config.get() if config.distributed_memory and config.api != "nemo": raise TransformationError( f"Error in {self.name}: Distributed memory is not supported.") # Check constraints not covered by excluded_node_types for # individual Nodes in node_list. for node in node_list: # Check that ExtractNode is not inserted between a Kernel or # a BuiltIn call and its parent Loop. if isinstance(node, (Kern, BuiltIn)) and \ isinstance(node.parent.parent, Loop): raise TransformationError( f"Error in {self.name}: Application to a Kernel or a " f"Built-in call without its parent Loop is not allowed.") # Check that ExtractNode is not inserted between a Loop and its # parent Directive when optimisations are applied, as this may # result in including the end Directive for extraction but # not the beginning. if isinstance(node, Loop) and isinstance(node.parent, Schedule) \ and isinstance(node.parent.parent, Directive): raise TransformationError( f"Error in {self.name}: Application to a Loop without its " f"parent Directive is not allowed.") # Check that ExtractNode is not inserted within a thread # parallel region when optimisations are applied. For instance, # this may be between an orphaned Directive (e.g. OMPDoDirective, # ACCLoopDirective) and its ancestor Directive (e.g. ACC or OMP # Parallel Directive) or within an OMPParallelDoDirective. if node.ancestor((OMPParallelDirective, ACCParallelDirective)): raise TransformationError( f"Error in {self.name}: Application to Nodes enclosed " f"within a thread-parallel region is not allowed.") # Performs validation checks specific to PSyData-based # transformations. super().validate(node_list, options)