Source code for sierra.core.pipeline.stage4.intra_exp_graph_generator

# Copyright 2018 London Lowmanstone, John Harwell, All rights reserved.
#
#  SPDX-License-Identifier: MIT
#
"""
Classes for generating graphs within a single :term:`Experiment`.
"""

# Core packages
import os
import copy
import typing as tp
import logging
import pathlib

# 3rd party packages
import json

# Project packages
from sierra.core.graphs.stacked_line_graph import StackedLineGraph
from sierra.core.graphs.heatmap import Heatmap
from sierra.core.models.graphs import IntraExpModel2DGraphSet
import sierra.core.variables.batch_criteria as bc
import sierra.core.plugin_manager as pm
from sierra.core import types, config, utils


[docs]class BatchIntraExpGraphGenerator:
[docs]    def __init__(self, cmdopts: types.Cmdopts) -> None:
        # Copy because we are modifying it and don't want to mess up the
        # arguments for graphs that are generated after us
        self.cmdopts = copy.deepcopy(cmdopts)
        self.logger = logging.getLogger(__name__)

[docs]    def __call__(self,
                 main_config: types.YAMLDict,
                 controller_config: types.YAMLDict,
                 LN_config: types.YAMLDict,
                 HM_config: types.YAMLDict,
                 criteria: bc.IConcreteBatchCriteria) -> None:
        """Generate all intra-experiment graphs for a :term:`Batch Experiment`.

        Parameters:

            main_config: Parsed dictionary of main YAML configuration

            controller_config: Parsed dictionary of controller YAML
                               configuration.

            LN_config: Parsed dictionary of intra-experiment linegraph
                       configuration.

            HM_config: Parsed dictionary of intra-experiment heatmap
                       configuration.

            criteria:  The :term:`Batch Criteria` used for the batch
                       experiment.

        """
        exp_to_gen = utils.exp_range_calc(self.cmdopts,
                                          self.cmdopts['batch_output_root'],
                                          criteria)

        for exp in exp_to_gen:
            batch_output_root = pathlib.Path(self.cmdopts["batch_output_root"])
            batch_stat_root = pathlib.Path(self.cmdopts["batch_stat_root"])
            batch_input_root = pathlib.Path(self.cmdopts["batch_input_root"])
            batch_graph_root = pathlib.Path(self.cmdopts["batch_graph_root"])
            batch_model_root = pathlib.Path(self.cmdopts["batch_model_root"])

            cmdopts = copy.deepcopy(self.cmdopts)
            cmdopts["exp_input_root"] = str(batch_input_root / exp.name)
            cmdopts["exp_output_root"] = str(batch_output_root / exp.name)
            cmdopts["exp_graph_root"] = str(batch_graph_root / exp.name)
            cmdopts["exp_model_root"] = str(batch_model_root / exp.name)
            cmdopts["exp_stat_root"] = str(batch_stat_root / exp.name)

            if os.path.isdir(cmdopts["exp_stat_root"]):
                generator = pm.module_load_tiered(project=self.cmdopts['project'],
                                                  path='pipeline.stage4.intra_exp_graph_generator')
                generator.IntraExpGraphGenerator(main_config,
                                                 controller_config,
                                                 LN_config,
                                                 HM_config,
                                                 cmdopts)(criteria)
            else:
                self.logger.warning("Skipping experiment '%s': %s does not exist",
                                    exp,
                                    cmdopts['exp_stat_root'])


[docs]class IntraExpGraphGenerator:
    """Generates graphs from :term:`Averaged .csv` files for a single experiment.

    Which graphs are generated is controlled by YAML configuration files parsed
    in :class:`~sierra.core.pipeline.stage4.pipeline_stage4.PipelineStage4`.

    This class can be extended/overriden using a :term:`Project` hook. See
    :ref:`ln-sierra-tutorials-project-hooks` for details.

    Attributes:

        cmdopts: Dictionary of parsed cmdline attributes.

        main_config: Parsed dictionary of main YAML configuration

        controller_config: Parsed dictionary of controller YAML
                           configuration.

        LN_config: Parsed dictionary of intra-experiment linegraph
                   configuration.

        HM_config: Parsed dictionary of intra-experiment heatmap
                   configuration.

        criteria:  The :term:`Batch Criteria` used for the batch
                   experiment.

        logger: The handle to the logger for this class. If you extend this
               class, you should save/restore this variable in tandem with
               overriding it in order to get logging messages have unique logger
               names between this class and your derived class, in order to
               reduce confusion.

    """

[docs]    def __init__(self,
                 main_config: types.YAMLDict,
                 controller_config: types.YAMLDict,
                 LN_config: types.YAMLDict,
                 HM_config: types.YAMLDict,
                 cmdopts: types.Cmdopts) -> None:
        # Copy because we are modifying it and don't want to mess up the
        # arguments for graphs that are generated after us
        self.cmdopts = copy.deepcopy(cmdopts)
        self.main_config = main_config
        self.LN_config = LN_config
        self.HM_config = HM_config
        self.controller_config = controller_config
        self.logger = logging.getLogger(__name__)

        utils.dir_create_checked(self.cmdopts["exp_graph_root"], exist_ok=True)

[docs]    def __call__(self, criteria: bc.IConcreteBatchCriteria) -> None:
        """
        Generate graphs.

        Performs the following steps:

        # . :class:`~sierra.core.pipeline.stage4.intra_exp_graph_generator.LinegraphsGenerator`
            to generate linegraphs for each experiment in the batch.

        # . :class:`~sierra.core.pipeline.stage4.intra_exp_graph_generator.HeatmapsGenerator`
            to generate heatmaps for each experiment in the batch.
        """
        LN_targets, HM_targets = self.calc_targets()
        self.generate(LN_targets, HM_targets)

[docs]    def generate(self,
                 LN_targets: tp.List[types.YAMLDict],
                 HM_targets: tp.List[types.YAMLDict]):
        if not self.cmdopts['project_no_LN']:
            LinegraphsGenerator(self.cmdopts, LN_targets).generate()

        if not self.cmdopts['project_no_HM']:
            HeatmapsGenerator(self.cmdopts, HM_targets).generate()

[docs]    def calc_targets(self) -> tp.Tuple[tp.List[types.YAMLDict],
                                       tp.List[types.YAMLDict]]:
        """Calculate what intra-experiment graphs should be generated.

        Uses YAML configuration for controller and intra-experiment graphs.
        Returns a tuple of dictionaries: (intra-experiment linegraphs,
        intra-experiment heatmaps) defined what graphs to generate. The enabled
        graphs exist in their YAML respective YAML configuration `and` are
        enabled by the YAML configuration for the selected controller.

        """
        keys = []
        for category in list(self.controller_config.keys()):
            if category not in self.cmdopts['controller']:
                continue
            for controller in self.controller_config[category]['controllers']:
                if controller['name'] not in self.cmdopts['controller']:
                    continue

                # valid to specify no graphs, and only to inherit graphs
                keys = controller.get('graphs', [])
                if 'graphs_inherit' in controller:
                    for inherit in controller['graphs_inherit']:
                        keys.extend(inherit)   # optional

        # Get keys for enabled graphs
        LN_keys = [k for k in self.LN_config if k in keys]
        self.logger.debug("Enabled linegraph categories: %s", LN_keys)

        HM_keys = [k for k in self.HM_config if k in keys]
        self.logger.debug("Enabled heatmap categories: %s", HM_keys)

        # Strip out all configured graphs which are not enabled
        LN_targets = [self.LN_config[k] for k in LN_keys]
        HM_targets = [self.HM_config[k] for k in HM_keys]

        return LN_targets, HM_targets


[docs]class LinegraphsGenerator:
    """
    Generates linegraphs from :term:`Averaged .csv` files within an experiment.
    """

[docs]    def __init__(self,
                 cmdopts: types.Cmdopts,
                 targets: tp.List[types.YAMLDict]) -> None:
        self.cmdopts = cmdopts
        self.targets = targets
        self.logger = logging.getLogger(__name__)
        self.graph_root = pathlib.Path(self.cmdopts['exp_graph_root'])
        self.stats_root = pathlib.Path(self.cmdopts['exp_stat_root'])

[docs]    def generate(self) -> None:
        self.logger.info("Linegraphs from %s", self.cmdopts['exp_stat_root'])

        # For each category of linegraphs we are generating
        for category in self.targets:

            # For each graph in each category
            for graph in category['graphs']:
                output_fpath = self.graph_root / ('SLN-' + graph['dest_stem'] +
                                                  config.kImageExt)
                try:
                    self.logger.trace('\n' +  # type: ignore
                                      json.dumps(graph, indent=4))
                    StackedLineGraph(stats_root=self.stats_root,
                                     input_stem=graph['src_stem'],
                                     output_fpath=output_fpath,
                                     stats=self.cmdopts['dist_stats'],
                                     dashstyles=graph.get('dashes', None),
                                     linestyles=graph.get('styles', None),
                                     cols=graph.get('cols', None),
                                     title=graph.get('title', None),
                                     legend=graph.get('legend', None),
                                     xlabel=graph.get('xlabel', None),
                                     ylabel=graph.get('ylabel', None),
                                     logyscale=self.cmdopts['plot_log_yscale'],
                                     large_text=self.cmdopts['plot_large_text']).generate()
                except KeyError:
                    self.logger.fatal(("Could not generate linegraph. "
                                       "Possible reasons include: "))

                    self.logger.fatal(("1. The YAML configuration entry is "
                                       "missing required fields"))
                    missing_cols = graph.get('cols', "MISSING_KEY")
                    missing_stem = graph.get('src_stem', "MISSING_KEY")
                    self.logger.fatal(("2. 'cols' is present in YAML "
                                       "configuration but some of %s are "
                                       "missing from %s"),
                                      missing_cols,
                                      missing_stem)

                    raise


[docs]class HeatmapsGenerator:
    """
    Generates heatmaps from :term:`Averaged .csv` files for a single experiment.
    """

[docs]    def __init__(self,
                 cmdopts: types.Cmdopts,
                 targets: tp.List[types.YAMLDict]) -> None:

        self.exp_stat_root = pathlib.Path(cmdopts['exp_stat_root'])
        self.exp_graph_root = pathlib.Path(cmdopts["exp_graph_root"])
        self.exp_model_root = pathlib.Path(cmdopts["exp_model_root"])
        self.large_text = cmdopts['plot_large_text']

        self.targets = targets
        self.logger = logging.getLogger(__name__)

[docs]    def generate(self) -> None:
        self.logger.info("Heatmaps from %s", self.exp_stat_root)

        # For each category of heatmaps we are generating
        for category in self.targets:

            # For each graph in each category
            for graph in category['graphs']:
                self.logger.trace('\n' +  # type: ignore
                                  json.dumps(graph, indent=4))
                if IntraExpModel2DGraphSet.model_exists(self.exp_model_root,
                                                        graph['src_stem']):
                    IntraExpModel2DGraphSet(self.exp_stat_root,
                                            self.exp_model_root,
                                            self.exp_graph_root,
                                            graph['src_stem'],
                                            graph.get('title', None)).generate()
                else:
                    input_fpath = self.exp_stat_root / (graph['src_stem'] +
                                                        config.kStats['mean'].exts['mean'])
                    output_fpath = self.exp_graph_root / ('HM-' + graph['src_stem'] +
                                                          config.kImageExt)

                    Heatmap(input_fpath=input_fpath,
                            output_fpath=output_fpath,
                            title=graph.get('title', None),
                            xlabel='X',
                            ylabel='Y',
                            large_text=self.large_text).generate()


__api__ = [
    'BatchIntraExpGraphGenerator',
    'IntraExpGraphGenerator',
    'LinegraphsGenerator',
    'HeatmapsGenerator'
]