Skip to content

Commit

Permalink
Merge pull request #191 from ecmwf-ifs/naml-transformation-config
Browse files Browse the repository at this point in the history
Transformation configuration and SchedulerConfig update
  • Loading branch information
reuterbal authored Dec 19, 2023
2 parents 37d0033 + ffb6330 commit 2f5158a
Show file tree
Hide file tree
Showing 22 changed files with 426 additions and 268 deletions.
4 changes: 2 additions & 2 deletions .pylintrc
Original file line number Diff line number Diff line change
Expand Up @@ -518,5 +518,5 @@ min-public-methods=2

# Exceptions that will emit a warning when being caught. Defaults to
# "BaseException, Exception".
overgeneral-exceptions=BaseException,
Exception
overgeneral-exceptions=builtin.BaseException,
builtin.Exception
19 changes: 2 additions & 17 deletions loki/build/builder.py
Original file line number Diff line number Diff line change
Expand Up @@ -5,15 +5,13 @@
# granted to it by virtue of its status as an intergovernmental organisation
# nor does it submit to any jurisdiction.

import sys
from pathlib import Path
from collections import deque
from importlib import import_module, reload, invalidate_caches
from operator import attrgetter
import networkx as nx

from loki.logging import default_logger
from loki.tools import as_tuple, delete
from loki.tools import as_tuple, delete, load_module
from loki.build.compiler import _default_compiler
from loki.build.obj import Obj
from loki.build.header import Header
Expand Down Expand Up @@ -150,20 +148,7 @@ def load_module(self, module):
"""
Handle import paths and load the compiled module
"""
if str(self.build_dir.absolute()) not in sys.path:
sys.path.insert(0, str(self.build_dir.absolute()))
if module in sys.modules:
reload(sys.modules[module])
return sys.modules[module]

try:
# Attempt to load module directly
return import_module(module)
except ModuleNotFoundError:
# If module caching interferes, try again with clean caches
invalidate_caches()
return import_module(module)

return load_module(module, path=self.build_dir.absolute())

def wrap_and_load(self, sources, modname=None, build=True,
libs=None, lib_dirs=None, incl_dirs=None,
Expand Down
1 change: 1 addition & 0 deletions loki/bulk/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,3 +7,4 @@

from loki.bulk.scheduler import * # noqa
from loki.bulk.item import * # noqa
from loki.bulk.configure import * # noqa
170 changes: 170 additions & 0 deletions loki/bulk/configure.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,170 @@
# (C) Copyright 2018- ECMWF.
# This software is licensed under the terms of the Apache Licence Version 2.0
# which can be obtained at http://www.apache.org/licenses/LICENSE-2.0.
# In applying this licence, ECMWF does not waive the privileges and immunities
# granted to it by virtue of its status as an intergovernmental organisation
# nor does it submit to any jurisdiction.

import re
from pathlib import Path

from loki.dimension import Dimension
from loki.tools import as_tuple, CaseInsensitiveDict, load_module
from loki.logging import error


__all__ = ['SchedulerConfig', 'TransformationConfig']


class SchedulerConfig:
"""
Configuration object for the transformation :any:`Scheduler` that
encapsulates default behaviour and item-specific behaviour. Can
be create either from a raw dictionary or configration file.
Parameters
----------
default : dict
Default options for each item
routines : dict of dicts or list of dicts
Dicts with routine-specific options.
dimensions : dict of dicts or list of dicts
Dicts with options to define :any`Dimension` objects.
disable : list of str
Subroutine names that are entirely disabled and will not be
added to either the callgraph that we traverse, nor the
visualisation. These are intended for utility routines that
pop up in many routines but can be ignored in terms of program
control flow, like ``flush`` or ``abort``.
enable_imports : bool
Disable the inclusion of module imports as scheduler dependencies.
"""

def __init__(
self, default, routines, disable=None, dimensions=None,
transformation_configs=None, enable_imports=False
):
self.default = default
self.disable = as_tuple(disable)
self.dimensions = dimensions
self.enable_imports = enable_imports

self.routines = CaseInsensitiveDict(routines)
self.transformation_configs = transformation_configs

# Resolve the dimensions for trafo configurations
for cfg in self.transformation_configs.values():
cfg.resolve_dimensions(dimensions)

# Instantiate Transformation objects
self.transformations = {
name: config.instantiate() for name, config in self.transformation_configs.items()
}

@classmethod
def from_dict(cls, config):
default = config['default']
routines = config.get('routines', [])
disable = default.get('disable', None)
enable_imports = default.get('enable_imports', False)

# Add any dimension definitions contained in the config dict
dimensions = config.get('dimensions', {})
dimensions = {k: Dimension(**d) for k, d in dimensions.items()}

# Create config objects for Transformation configurations
transformation_configs = config.get('transformations', {})
transformation_configs = {
name: TransformationConfig(name=name, **cfg)
for name, cfg in transformation_configs.items()
}

return cls(
default=default, routines=routines, disable=disable, dimensions=dimensions,
transformation_configs=transformation_configs, enable_imports=enable_imports
)

@classmethod
def from_file(cls, path):
import toml # pylint: disable=import-outside-toplevel
# Load configuration file and process options
with Path(path).open('r') as f:
config = toml.load(f)

return cls.from_dict(config)


class TransformationConfig:
"""
Configuration object for :any:`Transformation` instances that can
be used to create :any:`Transformation` objects from dictionaries
or a config file.
Parameters
----------
name : str
Name of the transformation object
module : str
Python module from which to load the transformation class
classname : str, optional
Name of the class to look for when instantiating the transformation.
If not provided, ``name`` will be used instead.
path : str or Path, optional
Path to add to the sys.path before attempting to load the ``module``
options : dict
Dicts of options that define the transformation behaviour.
These options will be passed as constructor arguments using
keyword-argument notation.
"""

_re_dimension = re.compile(r'\%dimensions\.(.*?)\%')

def __init__(self, name, module, classname=None, path=None, options=None):
self.name = name
self.module = module
self.classname = classname or self.name
self.path = path
self.options = dict(options)

def resolve_dimensions(self, dimensions):
"""
Substitute :any:`Dimension` objects for placeholder strings.
The format of the string replacement matches the TOML
configuration. It will attempt to replace ``%dimensions.dim_name%``
with a :any:`Dimension` found in :data:`dimensions`:
Parameters
----------
dimensions : dict
Dict matching string to pre-configured :any:`Dimension` objects.
"""
for key, val in self.options.items():
if not isinstance(val, str):
continue

matches = self._re_dimension.findall(val)
matches = tuple(dimensions[m] for m in as_tuple(matches))
if matches:
self.options[key] = matches[0] if len(matches) == 1 else matches

def instantiate(self):
"""
Creates instantiated :any:`Transformation` object from stored config options.
"""
# Load the module that contains the transformations
mod = load_module(self.module, path=self.path)

# Check for and return Transformation class
if not hasattr(mod, self.classname):
raise RuntimeError(f'Failed to load Transformation class: {self.classname}')

# Attempt to instantiate transformation from config
try:
transformation = getattr(mod, self.classname)(**self.options)
except TypeError as e:
error(f'[Loki::Transformation] Failed to instiate {self.classname} from configuration')
error(f' Options passed: {self.options}')
raise e

return transformation
90 changes: 4 additions & 86 deletions loki/bulk/scheduler.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,103 +7,21 @@

from os.path import commonpath
from pathlib import Path
from collections import deque, OrderedDict, defaultdict
from collections import deque, defaultdict
import networkx as nx
from codetiming import Timer

from loki.bulk.item import ProcedureBindingItem, SubroutineItem, GlobalVarImportItem, GenericImportItem
from loki.bulk.configure import SchedulerConfig
from loki.frontend import FP, REGEX, RegexParserClass
from loki.sourcefile import Sourcefile
from loki.dimension import Dimension
from loki.tools import as_tuple, CaseInsensitiveDict, flatten
from loki.logging import info, perf, warning, debug
from loki.bulk.item import ProcedureBindingItem, SubroutineItem, GlobalVarImportItem, GenericImportItem
from loki.subroutine import Subroutine
from loki.module import Module


__all__ = ['Scheduler', 'SchedulerConfig']


class SchedulerConfig:
"""
Configuration object for the transformation :any:`Scheduler` that
encapsulates default behaviour and item-specific behaviour. Can
be create either from a raw dictionary or configration file.
Parameters
----------
default : dict
Default options for each item
routines : dict of dicts or list of dicts
Dicts with routine-specific options.
dimensions : dict of dicts or list of dicts
Dicts with options to define :any`Dimension` objects.
disable : list of str
Subroutine names that are entirely disabled and will not be
added to either the callgraph that we traverse, nor the
visualisation. These are intended for utility routines that
pop up in many routines but can be ignored in terms of program
control flow, like ``flush`` or ``abort``.
enable_imports : bool
Disable the inclusion of module imports as scheduler dependencies.
"""

def __init__(self, default, routines, disable=None, dimensions=None, dic2p=None, derived_types=None,
enable_imports=False):
self.default = default
if isinstance(routines, dict):
self.routines = CaseInsensitiveDict(routines)
else:
self.routines = CaseInsensitiveDict((r.name, r) for r in as_tuple(routines))
self.disable = as_tuple(disable)
self.dimensions = dimensions
self.enable_imports = enable_imports

if dic2p is not None:
self.dic2p = dic2p
else:
self.dic2p = {}
if derived_types is not None:
self.derived_types = derived_types
else:
self.derived_types = ()

@classmethod
def from_dict(cls, config):
default = config['default']
if 'routine' in config:
config['routines'] = OrderedDict((r['name'], r) for r in config.get('routine', []))
else:
config['routines'] = []
routines = config['routines']
disable = default.get('disable', None)
enable_imports = default.get('enable_imports', False)

# Add any dimension definitions contained in the config dict
dimensions = {}
if 'dimension' in config:
dimensions = [Dimension(**d) for d in config['dimension']]
dimensions = {d.name: d for d in dimensions}

dic2p = {}
if 'dic2p' in config:
dic2p = config['dic2p']

derived_types = ()
if 'derived_types' in config:
derived_types = config['derived_types']

return cls(default=default, routines=routines, disable=disable, dimensions=dimensions, dic2p=dic2p,
derived_types=derived_types, enable_imports=enable_imports)

@classmethod
def from_file(cls, path):
import toml # pylint: disable=import-outside-toplevel
# Load configuration file and process options
with Path(path).open('r') as f:
config = toml.load(f)

return cls.from_dict(config)
__all__ = ['Scheduler']


class Scheduler:
Expand Down
23 changes: 22 additions & 1 deletion loki/tools/files.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,13 +7,15 @@

import os
import re
import sys
import pickle
import shutil
import fnmatch
import tempfile
from functools import wraps
from hashlib import md5
from pathlib import Path
from importlib import import_module, reload, invalidate_caches

from loki.logging import debug, info
from loki.tools.util import as_tuple, flatten
Expand All @@ -22,7 +24,7 @@

__all__ = [
'gettempdir', 'filehash', 'delete', 'find_paths', 'find_files',
'disk_cached'
'disk_cached', 'load_module'
]


Expand Down Expand Up @@ -146,3 +148,22 @@ def cached(*args, **kwargs):
return res
return cached
return decorator


def load_module(module, path=None):
"""
Handle import paths and load the compiled module
"""
if path and str(path) not in sys.path:
sys.path.insert(0, str(path))
if module in sys.modules:
reload(sys.modules[module])
return sys.modules[module]

try:
# Attempt to load module directly
return import_module(module)
except ModuleNotFoundError:
# If module caching interferes, try again with clean caches
invalidate_caches()
return import_module(module)
Loading

0 comments on commit 2f5158a

Please sign in to comment.