Source code for smif.cli

# -*- coding: utf-8 -*-
"""A command line interface to the system of systems framework

This command line interface implements a number of commands.

- `setup` creates an example project with the recommended folder structure
- `run` performs a simulation of an individual sector model, or the whole system
        of systems model
- `validate` performs a validation check of the configuration file
- `app` runs the graphical user interface, opening in a web browser

Folder structure
----------------

When configuring a project for the CLI, the folder structure below should be
used.  In this example, there is one system-of-systems model, combining a water
supply and an energy demand model::

    /config
        project.yaml
        /sector_models
            energy_demand.yml
            water_supply.yml
        /sos_models
            energy_water.yml
        /model_runs
            run_to_2050.yml
            short_test_run.yml
            ...
    /data
        /initial_conditions
            reservoirs.yml
        /interval_definitions
            annual_intervals.csv
        /interventions
            water_supply.yml
        /narratives
            high_tech_dsm.yml
        /region_definitions
            /oxfordshire
                regions.geojson
            /uk_nations_shp
                regions.shp
        /scenarios
            population.csv
            raininess.csv
        /water_supply
            /initial_system
    /models
        energy_demand.py
        water_supply.py
    /planning
        expected_to_2020.yaml
        national_infrastructure_pipeline.yml

The sector model implementations can be installed independently of the model run
configuration. The paths to the Python wrapper classes (implementing SectorModel)
should be specified in each ``sector_models/*.yml`` configuration file.

The project.yaml file specifies the metadata shared by all elements of the
project; ``sos_models`` specify the combinations of ``sector_models`` and
``scenarios`` while individual ``model_runs`` specify the scenario, strategy
and narrative combinations to be used in each run of the models.

"""
from __future__ import print_function

import glob
import logging
import os
import sys
from argparse import ArgumentParser

import pkg_resources

import pandas
import smif
import smif.cli.log
from smif.controller import (copy_project_folder, execute_decision_step,
                             execute_model_before_step, execute_model_run,
                             execute_model_step)
from smif.controller.run import DAFNIRunScheduler, SubProcessRunScheduler
from smif.data_layer import Store
from smif.data_layer.file import (CSVDataStore, FileMetadataStore,
                                  ParquetDataStore, YamlConfigStore)
from smif.http_api import create_app

try:
    import _thread
except ImportError:
    import thread as _thread

try:
    import win32api

    USE_WIN32 = True
except ImportError:
    USE_WIN32 = False

__author__ = "Will Usher, Tom Russell"
__copyright__ = "Will Usher, Tom Russell"
__license__ = "mit"


def list_model_runs(args):
    """List the model runs defined in the config, optionally indicating
    whether complete results exist.
    """
    store = _get_store(args)
    model_run_configs = store.read_model_runs()

    if args.complete:
        print('Model runs with an asterisk (*) have complete results available\n')

    for run in model_run_configs:
        run_name = run['name']

        if args.complete:
            expected_results = store.canonical_expected_results(run_name)
            available_results = store.canonical_available_results(run_name)

            complete = ' *' if expected_results == available_results else ''
            print('{}{}'.format(run_name, complete))
        else:
            print(run_name)


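# Illustrative usage, run from a project directory laid out as in the module
# docstring; 'run_to_2050' and 'short_test_run' are the example model run
# names from that folder structure:
#
#     $ smif list -c
#     Model runs with an asterisk (*) have complete results available
#
#     run_to_2050 *
#     short_test_run

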
def list_available_results(args):
    """List the available results for a specified model run.
    """
    store = _get_store(args)
    expected = store.canonical_expected_results(args.model_run)
    available = store.available_results(args.model_run)

    # Print run and sos model
    run = store.read_model_run(args.model_run)
    print('\nmodel run: {}'.format(args.model_run))
    print('{}- sos model: {}'.format(' ' * 2, run['sos_model']))

    # List of expected sector models
    sec_models = sorted({sec for _t, _d, sec, _out in expected})

    for sec_model in sec_models:
        print('{}- sector model: {}'.format(' ' * 4, sec_model))

        # List expected outputs for this sector model
        outputs = sorted({out for _t, _d, sec, out in expected if sec == sec_model})

        for output in outputs:
            print('{}- output: {}'.format(' ' * 6, output))

            # List available decisions for this sector model and output
            decs = sorted({d for _t, d, sec, out in available
                           if sec == sec_model and out == output})

            if len(decs) == 0:
                print('{}- no results'.format(' ' * 8))

            for dec in decs:
                base_str = '{}- decision {}:'.format(' ' * 8, dec)

                # List available time steps for this decision, sector model and output
                ts = sorted({t for t, d, sec, out in available
                             if d == dec and sec == sec_model and out == output})
                assert len(ts) > 0, "If a decision is available, so is at least one time step"

                res_str = ', '.join([str(t) for t in ts])
                print('{} {}'.format(base_str, res_str))


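# Illustrative call, using names from the example folder structure above; the
# indented tree mirrors the sector model > output > decision > timestep
# nesting printed by the code ('total_demand' and the timesteps are
# hypothetical):
#
#     $ smif available_results run_to_2050
#
#     model run: run_to_2050
#       - sos model: energy_water
#         - sector model: energy_demand
#           - output: total_demand
#             - decision 0: 2020, 2030

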
def list_missing_results(args):
    """List the missing results for a specified model run.
    """
    store = _get_store(args)
    expected = store.canonical_expected_results(args.model_run)
    missing = store.canonical_missing_results(args.model_run)

    # Print run and sos model
    run = store.read_model_run(args.model_run)
    print('\nmodel run: {}'.format(args.model_run))
    print('{}- sos model: {}'.format(' ' * 2, run['sos_model']))

    # List of expected sector models
    sec_models = sorted({sec for _t, _d, sec, _out in expected})

    for sec_model in sec_models:
        print('{}- sector model: {}'.format(' ' * 4, sec_model))

        # List expected outputs for this sector model
        outputs = sorted({out for _t, _d, sec, out in expected if sec == sec_model})

        for output in outputs:
            print('{}- output: {}'.format(' ' * 6, output))

            # List missing time steps for this sector model and output
            ts = sorted({t for t, d, sec, out in missing
                         if sec == sec_model and out == output})

            if len(ts) == 0:
                print('{}- no missing results'.format(' ' * 8))
            else:
                base_str = '{}- results missing for:'.format(' ' * 8)
                res_str = ', '.join([str(t) for t in ts])
                print('{} {}'.format(base_str, res_str))


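# Illustrative call, mirroring `available_results` but reporting gaps
# ('total_demand' and the timestep are hypothetical):
#
#     $ smif missing_results run_to_2050
#
#     model run: run_to_2050
#       - sos model: energy_water
#         - sector model: energy_demand
#           - output: total_demand
#             - results missing for: 2050

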
def prepare_convert(args):
    """Convert the data for a model run from its current data store format to
    the other (CSV to Parquet, or Parquet to CSV).
    """
    src_store = _get_store(args)
    if isinstance(src_store.data_store, CSVDataStore):
        tgt_store = Store(
            config_store=YamlConfigStore(args.directory),
            metadata_store=FileMetadataStore(args.directory),
            data_store=ParquetDataStore(args.directory),
            model_base_folder=args.directory
        )
    else:
        tgt_store = Store(
            config_store=YamlConfigStore(args.directory),
            metadata_store=FileMetadataStore(args.directory),
            data_store=CSVDataStore(args.directory),
            model_base_folder=args.directory
        )

    # Read model run
    model_run = src_store.read_model_run(args.model_run)
    # Read sos model for model run
    sos_model = src_store.read_sos_model(model_run['sos_model'])

    # Convert the data
    # Convert strategies interventions for model run
    src_store.convert_strategies_data(model_run['name'], tgt_store, args.noclobber)
    # Convert scenario data for model run
    src_store.convert_scenario_data(model_run['name'], tgt_store)
    # Convert narrative data for sos model
    src_store.convert_narrative_data(sos_model['name'], tgt_store, args.noclobber)
    # Convert initial conditions, default parameter and interventions data
    # for sector models in sos model
    for sector_model_name in sos_model['sector_models']:
        src_store.convert_model_parameter_default_data(
            sector_model_name, tgt_store, args.noclobber)
        src_store.convert_interventions_data(sector_model_name, tgt_store, args.noclobber)
        src_store.convert_initial_conditions_data(sector_model_name, tgt_store, args.noclobber)


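# Illustrative call: with the default `-i local_csv` interface the source
# store is CSV-backed, so the model run's data is converted to a Parquet
# store in the same project directory (and vice versa for `-i local_binary`);
# `-nc` skips data files which already exist in the target format:
#
#     $ smif prepare-convert run_to_2050 -i local_csv -nc

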
def csv2parquet(args):
    """Convert CSV to Parquet, assuming the CSV can be parsed as a dataframe
    """
    path = args.path
    if ".csv" in path:
        files = [path]
    else:
        files = glob.glob(os.path.join(path, '**', '*.csv'), recursive=True)

    for csv_path in files:
        parquet_path = csv_path.replace(".csv", ".parquet")
        if args.noclobber and os.path.exists(parquet_path):
            print("Skipping", csv_path)
        else:
            print("Converting", csv_path, flush=True)
            try:
                dataframe = pandas.read_csv(csv_path)
                dataframe.to_parquet(parquet_path, engine='pyarrow', compression='gzip')
            except UnicodeDecodeError:
                # guess that cp1252 is the next most common encoding we'll come across
                dataframe = pandas.read_csv(csv_path, encoding='cp1252')
                dataframe.to_parquet(parquet_path, engine='pyarrow', compression='gzip')
            except pandas.errors.ParserError as ex:
                # nothing we can do with a ParserError - usually a data problem
                print(ex)
                continue


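# Illustrative call: passing a directory converts every *.csv found
# recursively, writing a .parquet file alongside each source file (the
# scenario files are from the example folder structure above):
#
#     $ smif csv2parquet data/scenarios -nc
#     Converting data/scenarios/population.csv
#     Converting data/scenarios/raininess.csv

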
def prepare_scenario(args):
    """Update scenario configuration file to include multiple scenario variants.

    The initial scenario configuration file is overwritten.
    """
    # Read template scenario using the Store class
    store = _get_store(args)
    list_of_variants = range(args.variants_range[0], args.variants_range[1] + 1)
    store.prepare_scenario(args.scenario_name, list_of_variants)


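# Illustrative call, using the 'population' scenario from the example folder
# structure; the two integers are inclusive bounds, so this writes variants
# 1 through 10 into the scenario configuration file:
#
#     $ smif prepare-scenario population 1 10

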
def prepare_model_runs(args):
    """Generate multiple model runs according to a model run file referencing
    a scenario with multiple variants.
    """
    # Read model run and scenario using the Store class
    store = _get_store(args)
    nb_variants = len(store.read_scenario_variants(args.scenario_name))

    # Default lower and upper bounds of the variant range
    var_start = 0
    var_end = nb_variants

    # Check if optional cli arguments specify a range of variants
    # They are compared to None because they can be 0
    if args.start is not None:
        var_start = args.start
        if var_start < 0:
            raise ValueError('Lower bound of variant range must be >=0')
        if var_start > nb_variants:
            raise ValueError("Lower bound of variant range greater"
                             " than number of variants")
    if args.end is not None:
        var_end = args.end
        if var_end < 0:
            raise ValueError('Upper bound of variant range must be >=0')
        if var_end > nb_variants - 1:
            raise ValueError("Upper bound of variant range cannot be greater"
                             " than {:d}".format(nb_variants - 1))
    if var_end < var_start:
        raise ValueError("Upper bound of variant range must be >= lower"
                         " bound of variant range")

    store.prepare_model_runs(args.model_run_name, args.scenario_name,
                             var_start, var_end)


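# Illustrative call: generate model runs from the 'run_to_2050' template, one
# per variant of the 'population' scenario; `-s`/`-e` optionally restrict the
# variant range:
#
#     $ smif prepare-run population run_to_2050 -s 0 -e 4

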
def before_step(args):
    """Prepare a single model to run (call once before calling `smif step`)

    Parameters
    ----------
    args
    """
    store = _get_store(args)
    execute_model_before_step(args.modelrun, args.model, store)


def step(args):
    """Run a single model for a single timestep

    Parameters
    ----------
    args
    """
    store = _get_store(args)
    execute_model_step(args.modelrun, args.model, args.timestep, args.decision, store)


def decide(args):
    """Run a decision step for a model run

    Parameters
    ----------
    args
    """
    store = _get_store(args)
    execute_decision_step(args.modelrun, args.decision, store)


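# Illustrative sequence stepping through a model run by hand with the three
# commands above ('energy_demand' is from the example folder structure; the
# timestep 2020 is hypothetical):
#
#     $ smif before_step run_to_2050 --model energy_demand
#     $ smif decide run_to_2050 --decision 0
#     $ smif step run_to_2050 --model energy_demand --timestep 2020 --decision 0

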
def run(args):
    """Run the model runs as requested. Checks if results exist and asks the
    user for permission to overwrite.

    Parameters
    ----------
    args
    """
    logger = logging.getLogger(__name__)
    msg = '{:s}, {:s}, {:s}'.format(args.modelrun, args.interface, args.directory)
    try:
        logger.profiling_start('run_model_runs', msg)
    except AttributeError:
        logger.info('START run_model_runs %s', msg)

    if args.batchfile:
        with open(args.modelrun, 'r') as f:
            model_run_ids = f.read().splitlines()
    else:
        model_run_ids = [args.modelrun]

    store = _get_store(args)
    execute_model_run(model_run_ids, store, args.warm, args.dry_run)

    try:
        logger.profiling_stop('run_model_runs', msg)
        if not args.dry_run:
            logger.summary()
    except AttributeError:
        logger.info('STOP run_model_runs %s', msg)


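# Illustrative calls: run a single named model run, warm-start it from
# intermediate results, or pass a file listing one model run name per line
# ('batch_runs.txt' is a hypothetical file):
#
#     $ smif run run_to_2050
#     $ smif run -w run_to_2050
#     $ smif run -b batch_runs.txt
#     $ smif run -n run_to_2050       # dry run: print steps, execute nothing

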
def _get_store(args):
    """Construct store as configured by arguments
    """
    if args.interface == 'local_csv':
        store = Store(
            config_store=YamlConfigStore(args.directory),
            metadata_store=FileMetadataStore(args.directory),
            data_store=CSVDataStore(args.directory),
            model_base_folder=args.directory
        )
    elif args.interface == 'local_binary':
        store = Store(
            config_store=YamlConfigStore(args.directory),
            metadata_store=FileMetadataStore(args.directory),
            data_store=ParquetDataStore(args.directory),
            model_base_folder=args.directory
        )
    else:
        raise ValueError("Store interface type {} not recognised.".format(args.interface))
    return store


def _run_server(args):
    app_folder = pkg_resources.resource_filename('smif', 'app/dist')

    if args.scheduler == 'dafni' and args.interface != 'local_csv':
        msg = "Scheduler implementation {0} is not valid when combined with {1}."
        raise ValueError(msg.format(args.scheduler, args.interface))

    if args.scheduler == 'default':
        model_scheduler = SubProcessRunScheduler()
    elif args.scheduler == 'dafni':
        model_scheduler = DAFNIRunScheduler(args.username, args.password)
    else:
        raise ValueError("Scheduler implementation {} not recognised.".format(args.scheduler))

    app = create_app(
        static_folder=app_folder,
        template_folder=app_folder,
        data_interface=_get_store(args),
        scheduler=model_scheduler
    )

    print(" Opening smif app\n")
    print(" Copy/paste this URL into your web browser to connect:")
    print(" http://localhost:" + str(args.port) + "\n")
    # add flush to ensure that text is printed before server thread starts
    print(" Close your browser then type Control-C here to quit.", flush=True)
    app.run(host='0.0.0.0', port=args.port, threaded=True)


def run_app(args):
    """Run the client/server application

    Parameters
    ----------
    args
    """
    # avoid one of two error messages from 'forrtl error(200)' when running
    # on windows cmd - seems related to scipy's underlying Fortran
    os.environ['FOR_DISABLE_CONSOLE_CTRL_HANDLER'] = 'T'

    if USE_WIN32:
        # Set handler for CTRL-C. Necessary to avoid `forrtl: error (200):
        # program aborting...` crash on CTRL-C if we're running from Windows
        # cmd.exe
        def handler(dw_ctrl_type, hook_sigint=_thread.interrupt_main):
            """Handler for CTRL-C interrupt
            """
            if dw_ctrl_type == 0:  # CTRL-C
                hook_sigint()
                return 1  # don't chain to the next handler
            return 0  # chain to the next handler
        win32api.SetConsoleCtrlHandler(handler, 1)

    # Create backend server process
    _run_server(args)


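# Illustrative calls: serve the app on the default port, or with the DAFNI
# scheduler (which requires the local_csv interface and login credentials):
#
#     $ smif app -d path/to/project
#     $ smif app -s dafni -u username -pw password

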
def setup_project_folder(args):
    """Set up a sample project
    """
    copy_project_folder(args.directory)


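# Illustrative call: copy the sample project into the target directory:
#
#     $ smif setup -d path/to/project

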
def parse_arguments():
    """Parse command line arguments

    Returns
    =======
    :class:`argparse.ArgumentParser`
    """
    parser = ArgumentParser(description='Command line tools for smif')
    parser.add_argument('-V', '--version', action='version',
                        version="smif " + smif.__version__,
                        help='show the current version of smif')

    parent_parser = ArgumentParser(add_help=False)
    parent_parser.add_argument('-v', '--verbose', action='count',
                               help='show messages: -v to see messages reporting on '
                                    'progress, -vv to see debug messages.')
    parent_parser.add_argument('-i', '--interface', default='local_csv',
                               choices=['local_csv', 'local_binary'],
                               help="Select the data interface (default: %(default)s)")
    parent_parser.add_argument('-d', '--directory', default='.',
                               help="Path to the project directory")

    subparsers = parser.add_subparsers(help='available commands')

    # SETUP
    parser_setup = subparsers.add_parser(
        'setup', help='Setup the project folder', parents=[parent_parser])
    parser_setup.set_defaults(func=setup_project_folder)

    # LIST
    parser_list = subparsers.add_parser(
        'list', help='List available model runs', parents=[parent_parser])
    parser_list.set_defaults(func=list_model_runs)
    parser_list.add_argument('-c', '--complete',
                             help="Show which model runs have complete results",
                             action='store_true')

    # RESULTS
    parser_available_results = subparsers.add_parser(
        'available_results', help='List available results', parents=[parent_parser])
    parser_available_results.set_defaults(func=list_available_results)
    parser_available_results.add_argument(
        'model_run', help="Name of the model run to list available results")

    parser_missing_results = subparsers.add_parser(
        'missing_results', help='List missing results', parents=[parent_parser])
    parser_missing_results.set_defaults(func=list_missing_results)
    parser_missing_results.add_argument(
        'model_run', help="Name of the model run to list missing results")

    # PREPARE
    parser_convert = subparsers.add_parser(
        'prepare-convert', help='Convert data from one format to another',
        parents=[parent_parser])
    parser_convert.set_defaults(func=prepare_convert)
    parser_convert.add_argument(
        'model_run', help='Name of the model run')
    parser_convert.add_argument(
        '-nc', '--noclobber', help='Do not convert existing data files',
        action='store_true')

    parser_prepare_scenario = subparsers.add_parser(
        'prepare-scenario',
        help='Prepare scenario configuration file with multiple variants',
        parents=[parent_parser])
    parser_prepare_scenario.set_defaults(func=prepare_scenario)
    parser_prepare_scenario.add_argument(
        'scenario_name', help='Name of the scenario')
    parser_prepare_scenario.add_argument(
        'variants_range', nargs=2, type=int,
        help='Two integers delimiting the range of variants')

    parser_prepare_model_runs = subparsers.add_parser(
        'prepare-run', help='Prepare model runs based on scenario variants',
        parents=[parent_parser])
    parser_prepare_model_runs.set_defaults(func=prepare_model_runs)
    parser_prepare_model_runs.add_argument(
        'scenario_name', help='Name of the scenario')
    parser_prepare_model_runs.add_argument(
        'model_run_name', help='Name of the template model run')
    parser_prepare_model_runs.add_argument(
        '-s', '--start', type=int,
        help='Lower bound of the range of variants')
    parser_prepare_model_runs.add_argument(
        '-e', '--end', type=int,
        help='Upper bound of the range of variants')

    # CONVERT
    parser_convert_format = subparsers.add_parser(
        'csv2parquet',
        help='Convert CSV to Parquet. Pass a filename or a directory to '
             'search recursively',
        parents=[parent_parser])
    parser_convert_format.set_defaults(func=csv2parquet)
    parser_convert_format.add_argument(
        'path', help='Path to file')
    parser_convert_format.add_argument(
        '-nc', '--noclobber',
        help='Skip converting data files which already exist as parquet',
        action='store_true')

    # APP
    parser_app = subparsers.add_parser(
        'app', help='Open smif app', parents=[parent_parser])
    parser_app.set_defaults(func=run_app)
    parser_app.add_argument('-p', '--port', type=int, default=5000,
                            help="The port over which to serve the app")
    parser_app.add_argument('-s', '--scheduler', default='default',
                            choices=['default', 'dafni'],
                            help="The model scheduling implementation to use")
    parser_app.add_argument('-u', '--username',
                            help="The username for logging in to the dafni "
                                 "JobSubmissionAPI, only needed with the dafni job scheduler")
    parser_app.add_argument('-pw', '--password',
                            help="The password for logging in to the dafni "
                                 "JobSubmissionAPI, only needed with the dafni job scheduler")

    # RUN
    parser_run = subparsers.add_parser(
        'run', help='Run a modelrun', parents=[parent_parser])
    parser_run.set_defaults(func=run)
    parser_run.add_argument('-w', '--warm', action='store_true',
                            help="Use intermediate results from the last modelrun "
                                 "and continue from where it left off")
    parser_run.add_argument('-b', '--batchfile', action='store_true',
                            help="Use a batchfile instead of a modelrun name (a "
                                 "list of modelrun names)")
    parser_run.add_argument('modelrun', help="Name of the model run to run")
    parser_run.add_argument('-n', '--dry-run', action='store_true',
                            help="Do not execute individual models, print steps instead")

    # BEFORE STEP
    parser_before_step = subparsers.add_parser(
        'before_step', help='Initialise a model before stepping through',
        parents=[parent_parser])
    parser_before_step.set_defaults(func=before_step)
    parser_before_step.add_argument('modelrun', help="Name of the model run")
    parser_before_step.add_argument('-m', '--model', required=True,
                                    help="The individual model to run.")

    # DECIDE
    parser_decide = subparsers.add_parser(
        'decide', help='Run a decision step', parents=[parent_parser])
    parser_decide.set_defaults(func=decide)
    parser_decide.add_argument('modelrun', help="Name of the model run")
    parser_decide.add_argument('-dn', '--decision', type=int, default=0,
                               help="The decision step to run: either 0 to start a run, or "
                                    "n+1 where n is the maximum previous decision iteration "
                                    "for which all steps have been simulated")

    # STEP
    parser_step = subparsers.add_parser(
        'step', help='Run a model step', parents=[parent_parser])
    parser_step.set_defaults(func=step)
    parser_step.add_argument('modelrun', help="Name of the model run")
    parser_step.add_argument('-m', '--model', required=True,
                             help="The individual model to run.")
    parser_step.add_argument('-t', '--timestep', type=int, required=True,
                             help="The single timestep to run.")
    parser_step.add_argument('-dn', '--decision', type=int, required=True,
                             help="The decision step to run.")

    return parser


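# The parser can also be driven programmatically, which is what `main` below
# does; a minimal sketch:
#
#     parser = parse_arguments()
#     args = parser.parse_args(['list', '-d', 'path/to/project'])
#     args.func(args)  # dispatch to the handler bound via set_defaults

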
def confirm(prompt=None, response=False):
    """Prompts for a yes or no response from the user

    Arguments
    ---------
    prompt : str, default=None
    response : bool, default=False

    Returns
    -------
    bool
        True for yes and False for no.

    Notes
    -----
    `response` should be set to the default value assumed by the caller when
    user simply types ENTER.

    Examples
    --------
    >>> confirm(prompt='Create Directory?', response=True)
    Create Directory? [y]|n:
    True
    >>> confirm(prompt='Create Directory?', response=False)
    Create Directory? [n]|y:
    False
    >>> confirm(prompt='Create Directory?', response=False)
    Create Directory? [n]|y: y
    True

    """
    if prompt is None:
        prompt = 'Confirm'

    if response:
        prompt = '{} [{}]|{}: '.format(prompt, 'y', 'n')
    else:
        prompt = '{} [{}]|{}: '.format(prompt, 'n', 'y')

    while True:
        ans = input(prompt)
        if not ans:
            return response
        if ans not in ['y', 'Y', 'n', 'N']:
            print('please enter y or n.')
            continue
        if ans in ['y', 'Y']:
            return True
        if ans in ['n', 'N']:
            return False


def main(arguments=None):
    """Parse args and run
    """
    parser = parse_arguments()
    args = parser.parse_args(arguments)

    try:
        smif.cli.log.setup_logging(args.verbose)
    except AttributeError:
        # verbose is only set on subcommands - so `smif` or `smif -h` would error
        pass

    def exception_handler(exception_type, exception, traceback,
                          debug_hook=sys.excepthook):
        if args.verbose:
            debug_hook(exception_type, exception, traceback)
        else:
            print("{}: {}".format(exception_type.__name__, exception), file=sys.stderr)

    sys.excepthook = exception_handler

    if 'func' in args:
        args.func(args)
    else:
        parser.print_help()
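

# `main` accepts an explicit argument list (falling back to sys.argv when
# None), so the CLI can be invoked from Python as well as from the shell; a
# minimal sketch using the example model run name from the docstring:
#
#     main(['run', '-v', 'run_to_2050'])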