Source code for smif.controller.modelrun

"""The Model Run collects scenarios, timesteps, narratives, and
model collection into a package which can be built and passed to
the ModelRunner to run.

The ModelRunner is responsible for running a ModelRun, including passing
in the correct data to the model between timesteps and calling to the
DecisionManager to obtain decisions.

ModelRun has attributes:
- name
- timestamp
- description
- sos_model
- model_horizon
- scenarios
- narratives
- strategies
- status

"""
from logging import getLogger

import networkx as nx
from smif.decision.decision import DecisionManager
from smif.exception import SmifModelRunError, SmifTimestepResolutionError
from smif.metadata import RelativeTimestep
from smif.model import ModelOperation, ScenarioModel


class ModelRun(object):
    """Collects timesteps, scenarios, narratives and a SosModel together

    Attributes
    ----------
    name: str
        The unique name of the model run
    timestamp: :class:`datetime.datetime`
        An ISO8601 compatible timestamp of model run creation time
    description: str
        A friendly description of the model run
    sos_model: :class:`smif.model.sos_model.SosModel`
        The contained SosModel
    scenarios: dict
        For each scenario set, a mapping to a valid scenario within that set
    narratives: list
        A list of :class:`smif.parameters.Narrative` objects
    strategies: dict
        Strategy configuration, ``None`` until it has been set
    status: str
        Lifecycle marker: 'Empty' on construction, 'Built' after `from_dict`, then
        'Running' and finally 'Successful' or 'Failed' as set by `run`
    initialised: bool
        ``False`` until :meth:`ModelRunner.build_job_graph` has added the
        before_model_run jobs for this model run
    logger: logging.Logger
    results: dict
    """

    def __init__(self):
        self.name = ""
        self.timestamp = None
        self.description = ""
        self.sos_model = None
        self._model_horizon = []

        self.scenarios = {}
        self.narratives = []
        self.strategies = None
        self.status = 'Empty'
        # Always defined so that ModelRunner.build_job_graph can read it even when the
        # model run was not created through `from_dict`
        self.initialised = False

        self.logger = getLogger(__name__)

        self.results = {}

    def as_dict(self):
        """Serialises :class:`smif.controller.modelrun.ModelRun`

        Returns a dictionary definition of a ModelRun using the same keys that
        `from_dict` reads. Note that ``sos_model`` is serialised as the name of the
        contained SosModel, whereas `from_dict` stores the ``sos_model`` entry as given
        and validates it through its ``scenario_models`` attribute.

        Returns
        -------
        dict
        """
        return {
            'name': self.name,
            'description': self.description,
            'stamp': self.timestamp,
            # the property returns a copy, so callers cannot mutate the stored horizon
            'timesteps': self.model_horizon,
            'sos_model': self.sos_model.name,
            'scenarios': self.scenarios,
            'narratives': self.narratives,
            'strategies': self.strategies
        }

    @classmethod
    def from_dict(cls, config):
        """Create a :class:`smif.controller.modelrun.ModelRun` from a dictionary

        Arguments
        ---------
        config : dict
            Must contain the keys 'name', 'description', 'stamp', 'timesteps',
            'sos_model', 'scenarios', 'narratives' and 'strategies'

        Returns
        -------
        :class:`smif.controller.modelrun.ModelRun`
            A validated model run with status 'Built'

        Raises
        ------
        KeyError
            If a required key is missing from `config`
        SmifModelRunError
            If validation of the scenario selection fails
        """
        model_run = cls()
        model_run.name = config['name']
        model_run.description = config['description']
        model_run.timestamp = config['stamp']
        model_run.initialised = False
        # goes through the property setter: de-duplicated and sorted
        model_run.model_horizon = config['timesteps']
        model_run.sos_model = config['sos_model']
        model_run.scenarios = config['scenarios']
        model_run.narratives = config['narratives']
        model_run.strategies = config['strategies']
        model_run.status = 'Built'
        model_run.validate()
        return model_run

    def validate(self):
        """Validate that this ModelRun has been set up with sufficient data
        to run

        Every key of `scenarios` must match the name of one of the scenario models
        of the contained SosModel.

        Raises
        ------
        SmifModelRunError
            If a selected scenario set is not found in the SosModel
        """
        selected = set(self.scenarios)
        available = {scenario.name for scenario in self.sos_model.scenario_models}
        missing_scenarios = selected - available
        if missing_scenarios:
            raise SmifModelRunError("ScenarioSets {} are selected in the ModelRun "
                                    "configuration but not found in the SosModel "
                                    "configuration".format(missing_scenarios))

    @property
    def model_horizon(self):
        """Returns the list of timesteps

        Returns
        -------
        list
            A copy of the list of timesteps, distinct and sorted in ascending order
        """
        return self._model_horizon.copy()

    @model_horizon.setter
    def model_horizon(self, value):
        # drop duplicates, then order ascending
        self._model_horizon = sorted(set(value))

    def run(self, store, job_scheduler, warm_start_timestep=None, dry_run=False):
        """Builds all the objects and passes them to the ModelRunner

        The idea is that this will add ModelRuns to a queue for asynchronous
        processing

        Arguments
        ---------
        store
            Results store; `clear_results` is called on it unless warm starting, and
            it is passed on to :meth:`ModelRunner.solve_model`
        job_scheduler
            Scheduler passed on to :meth:`ModelRunner.solve_model`
        warm_start_timestep : optional
            If not ``None``, the model horizon is truncated to start at this timestep
            and existing results are kept
        dry_run : bool, optional
            Passed on to :meth:`ModelRunner.solve_model`

        Raises
        ------
        SmifModelRunError
            If the model run is not 'Built' or has no timesteps
        ValueError
            If `warm_start_timestep` is not one of the model horizon timesteps
        """
        self.logger.debug("Running model run %s", self.name)
        # Use the profiling hooks when the logger provides them, else plain info logging
        try:
            self.logger.profiling_start('modelrun.run', self.name)
        except AttributeError:
            self.logger.info('START modelrun.run %s', self.name)

        if self.status != 'Built':
            raise SmifModelRunError("Model is not yet built.")

        horizon = self.model_horizon
        if not horizon:
            raise SmifModelRunError("No timesteps specified for model run")

        # Either avoid rework (if warm_start) or else make sure to clear stale results
        warm_start = warm_start_timestep is not None
        if warm_start:
            idx = horizon.index(warm_start_timestep)
            self.model_horizon = horizon[idx:]
        else:
            self.logger.debug("Clearing results for %s", self.name)
            store.clear_results(self.name)

        self.status = 'Running'
        try:
            modelrunner = ModelRunner(warm_start)
            modelrunner.solve_model(self, job_scheduler, store, dry_run)
        except Exception:
            # do not leave a failed run reporting itself as still running
            self.status = 'Failed'
            raise
        self.status = 'Successful'

        try:
            self.logger.profiling_stop('modelrun.run', self.name)
        except AttributeError:
            self.logger.info('STOP modelrun.run %s', self.name)


class ModelRunner(object):
    """The ModelRunner orchestrates the simulation of a SoSModel over decision iterations and
    timesteps as provided by a DecisionManager.

    Arguments
    ---------
    warm_start : bool, optional
        If true, jobs reported as complete by the store are removed from each job graph
        before it is submitted
    """
    def __init__(self, warm_start=False):
        self.logger = getLogger(__name__)
        self.warm_start = warm_start

    def solve_model(self, model_run, job_scheduler, store, dry_run=False):
        """Solve a ModelRun

        This method steps through the model horizon, building
        a job graph and submitting this to the scheduler
        at each decision loop.

        Arguments
        ---------
        model_run : :class:`smif.controller.modelrun.ModelRun`
        job_scheduler
            Scheduler whose `add` method accepts a job graph and the `dry_run` flag and
            returns a ``(job_id, err)`` pair
        store : :class:`smif.data_layer.Store`
        dry_run : bool, optional
            Passed through unchanged to `job_scheduler.add`

        Raises
        ------
        Exception
            Whatever error object the scheduler returns for a submitted job graph
        """
        # Solve the model run: decision loop generates a series of bundles of independent
        # decision iterations, each with a number of timesteps to run
        self.logger.debug("Solving the models over all timesteps: %s", model_run.model_horizon)

        # Initialise the decision manager (and hence decision modules)
        self.logger.debug("Initialising the decision manager")
        decision_manager = DecisionManager(store,
                                           model_run.model_horizon,
                                           model_run.name,
                                           model_run.sos_model)

        for bundle in decision_manager.decision_loop():
            # each iteration is independent at this point, so the following loop is a
            # candidate for running in parallel
            job_graph = self.build_job_graph(model_run, bundle)

            if self.warm_start:
                # filter graph to exclude already-available results
                complete_jobs = store.completed_jobs(model_run.name)
                job_graph = self.filter_job_graph(model_run.name, job_graph, complete_jobs)

            job_id, err = job_scheduler.add(job_graph, dry_run)
            self.logger.debug("Running job %s", job_id)
            if err is not None:
                status = job_scheduler.get_status(job_id)
                self.logger.debug("Job %s %s", job_id, status['status'])
                raise err

    def build_job_graph(self, model_run, bundle):
        """ Build a job graph

        Build and return the job graph for an entire bundle, including before_model_run jobs
        when the models were not yet initialised.

        Constraints:
        - Bundle must have keys: 'decision_iterations' and 'timesteps'
        - Running a bundle runs each (decision iteration, timestep) pair specified by the
          combinations of decision iterations and timesteps
        - (decision iteration, timestep) pairs must be unique over an entire model run
        - In a single bundle, timesteps must be a consecutive subset of the model horizon
          timesteps

        The first timestep in each decision iteration of a bundle is either:
        - the first timestep in the model horizon and initialised from the model run starting
          point with scenario data and initial-timestep interventions only
        - or another timestep, picking up from where some previous (timestep, decision
          iteration) left off, which is explicitly included in the bundle.

        If a bundle's timesteps start from a timestep after the first one in the model horizon,
        the bundle must provide 'decision_links', and bundle must start from the very next
        timestep available in the model horizon.

        Jobs need to be able to identify a point to pick up from, namely the (timestep,
        decision iteration) which identifies the immediately preceding simulation state.

        E.g. request running first two timesteps::

            {
                'decision_iterations': [0, 1],
                'timesteps': [0, 1]
            }

        Run first two timesteps again, with an updated decision::

            {
                'decision_iterations': [1, 2],
                'timesteps': [0, 1]
            }

        Results meet decision requirements, so run next two timesteps, linking this bundle's
        decision iterations to previous decision iterations::

            {
                'decision_iterations': [3, 4],
                'timesteps': [2, 3],
                'decision_links': {3: 1, 4: 2}
            }


        Arguments
        ---------
        model_run : :class:`smif.controller.modelrun.ModelRun`
            Its `initialised` flag is set to ``True`` once before_model_run jobs are added
        bundle : :class:`dict`

        Returns
        -------
        :class:`networkx.DiGraph`
            A populated job graph with edges showing dependencies between
            different operations and timesteps

        Raises
        ------
        KeyError
            If the first timestep of the bundle has a previous timestep in the model
            horizon but the bundle has no 'decision_links' entry for a decision iteration
        NotImplementedError
            If the resulting job graph contains a cycle
        """
        job_graph = nx.DiGraph()
        run_name = model_run.name
        sector_models = model_run.sos_model.sector_models
        dependencies = model_run.sos_model.model_dependencies

        # Solve the model run: decision loop generates a series of bundles of independent
        # decision iterations, each with a number of timesteps to run
        for decision_iteration in bundle['decision_iterations']:
            self.logger.info('Running decision iteration %s', decision_iteration)

            for timestep_index, timestep in enumerate(bundle['timesteps']):
                self.logger.info('Running timestep %s', timestep)
                # one simulate job node per model
                job_graph.add_nodes_from(
                    self._make_simulate_job_nodes(
                        run_name,
                        sector_models,
                        decision_iteration,
                        timestep,
                        model_run.model_horizon
                    )
                )
                # edges to match within-timestep dependencies
                job_graph.add_edges_from(
                    self._make_current_simulate_job_edges(
                        run_name, dependencies, timestep, decision_iteration)
                )

                # connect any between-timestep dependencies
                if timestep_index > 0:
                    # subsequent timestep in a bundle - connect to previous timestep
                    previous_timestep = bundle['timesteps'][timestep_index - 1]
                    job_graph.add_edges_from(
                        self._make_within_bundle_previous_simulate_job_edges(
                            run_name,
                            dependencies,
                            timestep,
                            previous_timestep,
                            decision_iteration
                        )
                    )
                    continue

                # first timestep in bundle
                try:
                    previous_timestep = RelativeTimestep.PREVIOUS.resolve_relative_to(
                        timestep, model_run.model_horizon)
                except SmifTimestepResolutionError:
                    # no previous timestep, use scenarios to provide initial intertimestep
                    # dependencies
                    job_graph.add_edges_from(
                        self._make_initial_previous_simulate_job_edges(
                            run_name, dependencies, timestep, decision_iteration)
                    )
                else:
                    # connect to outputs from a previous bundle
                    previous_decision_iteration = \
                        bundle['decision_links'][decision_iteration]
                    job_graph.add_edges_from(
                        self._make_between_bundle_previous_simulate_job_edges(
                            run_name,
                            dependencies,
                            timestep,
                            previous_timestep,
                            decision_iteration,
                            previous_decision_iteration
                        )
                    )

        if not model_run.initialised:
            # one before_model_run job per model
            self.logger.info("Initialising each of the sector models")
            job_graph.add_nodes_from(
                self._make_before_model_run_job_nodes(
                    run_name,
                    sector_models,
                    model_run.model_horizon
                )
            )
            # must run before any simulate jobs
            for decision_iteration in bundle['decision_iterations']:
                for timestep in bundle['timesteps']:
                    job_graph.add_edges_from(
                        self._make_before_model_run_job_edges(
                            run_name,
                            sector_models,
                            timestep,
                            decision_iteration
                        )
                    )
            model_run.initialised = True

        if not nx.is_directed_acyclic_graph(job_graph):
            raise NotImplementedError(
                "SosModel dependency graphs must not contain within-timestep cycles")

        return job_graph

    @staticmethod
    def filter_job_graph(modelrun_name, job_graph, complete_jobs):
        """Return a copy of a job graph without the simulate jobs already completed

        Arguments
        ---------
        modelrun_name : str
        job_graph
            Graph providing `copy`, `nodes` and `remove_node`; it is not modified
        complete_jobs : iterable
            ``(timestep, decision_iteration, model_name)`` tuples

        Returns
        -------
        A copy of `job_graph` with the matching simulate job nodes removed
        """
        filtered = job_graph.copy()
        for timestep, decision_iteration, model_name in complete_jobs:
            job_id = ModelRunner._make_job_id(
                modelrun_name, model_name, ModelOperation.SIMULATE, timestep,
                decision_iteration)
            # completed jobs may belong to another bundle, so tolerate absent nodes
            if job_id in filtered.nodes:
                filtered.remove_node(job_id)
        return filtered

    @staticmethod
    def _make_before_model_run_job_nodes(modelrun_name, models, horizon):
        """Return one ``(job_id, attributes)`` before_model_run node per model"""
        return [
            (
                ModelRunner._make_job_id(
                    modelrun_name, model.name, ModelOperation.BEFORE_MODEL_RUN),
                {
                    'model': model,
                    'modelrun_name': modelrun_name,
                    'current_timestep': None,
                    'timesteps': horizon,
                    'decision_iteration': None,
                    'operation': ModelOperation.BEFORE_MODEL_RUN
                }
            )
            for model in models
        ]

    @staticmethod
    def _make_before_model_run_job_edges(modelrun_name, models, timestep, decision_iteration):
        """Return edges from each model's before_model_run job to its simulate job"""
        return [
            (
                ModelRunner._make_job_id(
                    modelrun_name, model.name, ModelOperation.BEFORE_MODEL_RUN),
                ModelRunner._make_job_id(
                    modelrun_name, model.name, ModelOperation.SIMULATE, timestep,
                    decision_iteration)
            )
            for model in models
        ]

    @staticmethod
    def _make_simulate_job_nodes(modelrun_name, models, decision_iteration, timestep, horizon):
        """Return one ``(job_id, attributes)`` simulate node per model"""
        return [
            (
                ModelRunner._make_job_id(
                    modelrun_name, model.name, ModelOperation.SIMULATE, timestep,
                    decision_iteration),
                {
                    'model': model,
                    'modelrun_name': modelrun_name,
                    'current_timestep': timestep,
                    'timesteps': horizon,
                    'decision_iteration': decision_iteration,
                    'operation': ModelOperation.SIMULATE
                }
            )
            for model in models
        ]

    @staticmethod
    def _link_simulate_jobs(modelrun_name, dependencies, source_point, sink_point):
        """Return one simulate-to-simulate edge per dependency

        `source_point` and `sink_point` are ``(timestep, decision_iteration)`` pairs
        locating the source model's job and the sink model's job respectively.
        """
        source_timestep, source_iteration = source_point
        sink_timestep, sink_iteration = sink_point
        return [
            (
                ModelRunner._make_job_id(
                    modelrun_name, dependency.source_model.name, ModelOperation.SIMULATE,
                    source_timestep, source_iteration),
                ModelRunner._make_job_id(
                    modelrun_name, dependency.sink_model.name, ModelOperation.SIMULATE,
                    sink_timestep, sink_iteration)
            )
            for dependency in dependencies
        ]

    @staticmethod
    def _make_current_simulate_job_edges(modelrun_name, dependencies, timestep,
                                         decision_iteration):
        """Return edges for dependencies that are not on the previous timestep"""
        current = [
            dependency for dependency in dependencies
            if dependency.timestep != RelativeTimestep.PREVIOUS
        ]
        here = (timestep, decision_iteration)
        return ModelRunner._link_simulate_jobs(modelrun_name, current, here, here)

    @staticmethod
    def _make_within_bundle_previous_simulate_job_edges(modelrun_name, dependencies, timestep,
                                                        previous_timestep, decision_iteration):
        """Return previous-timestep edges that stay within one decision iteration"""
        previous = [
            dependency for dependency in dependencies
            if dependency.timestep == RelativeTimestep.PREVIOUS
        ]
        return ModelRunner._link_simulate_jobs(
            modelrun_name, previous,
            (previous_timestep, decision_iteration),
            (timestep, decision_iteration))

    @staticmethod
    def _make_between_bundle_previous_simulate_job_edges(modelrun_name, dependencies, timestep,
                                                         previous_timestep, decision_iteration,
                                                         previous_decision_iteration):
        """Return previous-timestep edges whose source is a linked decision iteration"""
        previous = [
            dependency for dependency in dependencies
            if dependency.timestep == RelativeTimestep.PREVIOUS
        ]
        return ModelRunner._link_simulate_jobs(
            modelrun_name, previous,
            (previous_timestep, previous_decision_iteration),
            (timestep, decision_iteration))

    @staticmethod
    def _make_initial_previous_simulate_job_edges(modelrun_name, dependencies, timestep,
                                                  decision_iteration):
        """Return current-timestep edges for dependencies sourced from a ScenarioModel"""
        from_scenarios = [
            dependency for dependency in dependencies
            if isinstance(dependency.source_model, ScenarioModel)
        ]
        here = (timestep, decision_iteration)
        return ModelRunner._link_simulate_jobs(modelrun_name, from_scenarios, here, here)

    @staticmethod
    def _make_job_id(modelrun_name, model_name, operation, timestep=None,
                     decision_iteration=None):
        """Return the job graph node id for one operation of one model

        before_model_run ids omit timestep and decision iteration; all other ids
        include them.
        """
        if operation == ModelOperation.BEFORE_MODEL_RUN:
            return '%s_%s_%s' % (modelrun_name, operation.value, model_name)
        return '%s_%s_%s_%s_%s' % (
            modelrun_name, operation.value, timestep, decision_iteration, model_name)
Source code for smif.controller.modelrun

smif

Navigation

Related Topics