Source code for evaluator

import json
import shutil
import subprocess
import tempfile
from abc import ABC, abstractmethod
import os
import copy
from contextlib import contextmanager
from functools import lru_cache, wraps
from pathlib import Path
from typing import Callable, Tuple, List, Union
from warnings import warn

import pandas as pd
from pandas import DataFrame as DF
import numpy as np
import platypus

import config
from problem import Problem
from objectives import read_eso


def _list_cache(enabled=config.cache['enabled'], size=config.cache['size'],
                typed=config.cache['typed']):
    """Decorator that allows the lru_cache (last recently used cache)
    to work on functions that receive lists"""

    def _list_cache_decorator(f):
        if enabled:
            cache_f = lru_cache(size, typed)(f)

            @wraps(cache_f)
            def safe_f(individual, *args, **kwargs):
                return cache_f(tuple(individual), *args, **kwargs)

            safe_f.cache_clear = cache_f.cache_clear
            return safe_f
        # add a no-op as the cache clear operation so it does not error if disabled in the config
        f.cache_clear = lambda: None
        return f

    return _list_cache_decorator


@contextmanager
def working_directory(path=None):
    old_wd = os.getcwd()
    if path is None:
        tempdir = tempfile.TemporaryDirectory()
        path = tempdir.name
    else:
        tempdir = None
    os.chdir(path)
    try:
        yield path
    finally:
        os.chdir(old_wd)
        if tempdir is not None:
            tempdir.cleanup()


def run(building, schema=config.files['data dict'], epw=config.files['epw'],
        out_dir=config.out_dir, err_dir=config.err_dir):
    def resolve(path):
        if path is None:
            return None
        return Path(path).resolve()

    schema, epw, out_dir, err_dir = (resolve(p) for p in (schema, epw, out_dir, err_dir))
    with working_directory(out_dir) as out_dir:
        try:
            building_path = 'in.idf'
            building.saveas(building_path)
        except AttributeError:
            building_path = str(Path(out_dir, 'in.epJSON'))
            with open(building_path, 'w') as f:
                json.dump(building, f)
        try:
            # TODO: Include energyplus output in the error message
            subprocess.run(['energyplus', '--idd', str(schema),
                                   '--weather', str(epw), building_path], check=True)
            results = read_eso(out_dir)
            return results
        except subprocess.CalledProcessError as e:
            if err_dir is not None and Path(out_dir).resolve() != Path(err_dir).resolve():
                if os.path.exists(err_dir):
                    shutil.rmtree(err_dir)
                shutil.copytree(out_dir, err_dir)
            raise e


[docs]class AbstractEvaluator(ABC):
    """AbstractEvaluator(problem, error_mode = 'Failfast', error_value = None)
    Base class for Evaluators.

    This template requires that Evaluators are callable.
    It also gives them the df_apply method and result caching.

    :param Problem problem: description of the inputs and outputs the evaluator will use
    :param str error_mode: One of {'Failfast', 'Silent', 'Print'}.
        Failfast: Any error aborts the evaluation.
        Silent: Evaluation will return the `error_value` for any lists of values that raise an error.
        Print: Same as silent, but warnings are printed to stderr for any errors.
    :param tuple error_value: The value of the evaluation if an error occurs. Incompatible with error_mode='Failfast'.
        must have the form (objective_values, constraint_values).
    """

    error_mode_options = {'Failfast', 'Silent', 'Print'}

    def __init__(self, problem: Problem,
                 error_mode='Failfast', error_value: tuple = None):
        """
        """
        self.problem = problem
        self.error_mode = error_mode
        self.error_value = error_value
        self.validate_error_mode()
        # this makes the cache instance-specific instead of class-specific
        self._call = _list_cache()(self._call)

    # TODO: Accept more flexible input formats
    # Factoring out some of the code from _call related to handling different tuple formats might be of use
    def validate_error_mode(self):
        msg = f'Invalid error mode, only {self.error_mode_options} are allowed'
        assert self.error_mode in self.error_mode_options, msg
        if self.error_mode == 'Failfast':
            assert self.error_value is None, 'error value cannot be set when in Failfast mode'
            return
        # intuit error_value if needed
        if self.error_value is None:
            self.error_value = (None, None)
        err_out, err_constraint = self.error_value
        if err_out is None:
            err_out = tuple(float('inf') if minimize else float('-inf')
                            for minimize in self.problem.minimize_outputs)
        if err_constraint is None:
            # TODO: Intuit constraint error values as well
            err_constraint = ()
        msg = 'error value must match outputs length'
        assert len(err_out) == self.problem.num_outputs, msg
        msg = 'error value must match constraints length'
        assert len(err_constraint) == self.problem.num_constraints, msg
        self.error_value = (err_out, err_constraint)
        self.error_mode = self.error_mode

[docs]    @abstractmethod
    def eval_single(self, values: list, **kwargs) -> Tuple[Tuple, Tuple]:
        """eval_single(values, **kwargs) -> Tuple
        Returns the objective results for a single list of parameter values.

        :param list values: A list of values to set each parameter to,
            in the same order as this evaluator's inputs
        :param kwargs: Any keyword arguments
        :return: a tuple of the objectives and constraints
        """
        pass

    def _call(self, values: list, separate_constraints=None, **kwargs) -> tuple:
        # This method is a workaround to allow lru_cache to be instance-specific and work on __call__
        if separate_constraints is None:
            separate_constraints = self.problem.num_constraints > 0
        try:
            self.validate(values)
            outputs, constraints = self.eval_single(values, **kwargs)
        except Exception as e:
            if self.error_mode != 'Silent':
                msg = ''
                if self.problem.inputs is not None:
                    msg += f'for inputs: {self.problem.names("inputs")} '
                msg += f'problematic values were: {values}'
                warn(msg)
            if self.error_mode == 'Failfast':
                raise e
            else:
                outputs, constraints = self.error_value
        if separate_constraints:
            return outputs, constraints
        return outputs + constraints

    def __call__(self, values: list, separate_constraints=None, **kwargs) -> tuple:
        """Returns the objective results for a single list of parameter values.

        :param values: A list of values to set each parameter to,
            in the same order as this evaluator's inputs
        :param separate_constraints: which output format to use:
            objectives and constraints are both tuples of the measured values
            True: (objectives, constraints)
            False: objectives + constraints
            None: Same as True if there is at least one constraint, else the same as False
        :return: a tuple of the objectives' results
        """
        # Enables validation and caching in subclasses
        # Redirects calls to evaluate a list of values to the eval_single function.
        # Override eval_single, not this method.
        # Values can be empty to allow evaluating at the current state, but this is not the default behaviour
        # If this is not supported, the validate function of a subclass should reject an empty list
        return self._call(values, separate_constraints, **kwargs)

[docs]    def cache_clear(self):
        """Clears any cached vales of calls to this evaluator.
        This should be called whenever the evaluator's outputs could have changed."""
        self._call.cache_clear()

[docs]    def validate(self, values):
        """Takes a list of values and checks that they are a valid input for this evaluator.

        :param values: Values to be checked
        """

        if len(values) != self.problem.num_inputs:
            raise ValueError(f'Wrong number of input values.'
                             f'{len(values)} provided, {self.problem.num_inputs} expected')
        for p, value in zip(self.problem.inputs, values):
            if not p.validate(value):
                raise ValueError(f'Invalid value {value} for parameter {p}')

[docs]    def df_apply(self, df: DF, keep_input=False, **kwargs) -> pd.DataFrame:
        """df_apply(df, keep_input = False, **kwargs) -> DataFrame
        Applies this evaluator to an entire dataFrame, row by row.

        :param DF df: a DataFrame where each row represents valid input values for this Evaluator.
        :param boolean keep_input: whether to include the input data in the returned DataFrame
        :return: Returns a DataFrame with one column containing the results for each objective.
        """
        result = df.apply(self, axis=1, result_type='expand', separate_constraints=False, **kwargs)
        result = result.rename({i: name for i, name in enumerate(self.problem.names('outputs'))}, axis=1)
        if keep_input:
            result = pd.concat([df, result], axis=1)
        return result

[docs]    def to_platypus(self) -> platypus.Problem:
        """to_platypus()
        Converts this evaluator (and the underlying problem) to a platypus compatible format

        :return: A platypus Problem that can optimise over this evaluator
        """
        problem = self.problem.to_platypus()
        problem.function = self
        return problem


[docs]class EvaluatorSR(AbstractEvaluator):
    """EvaluatorSR(evaluation_func, problem, error_mode = 'Failfast', error_value = None)

    Surrogate Model Evaluator

    This evaluator is a wrapper around a surrogate model, as defined by a function.

    :param eval_func_format evaluation_func: a function that takes as input an list of values,
            and gives as output a tuple of the objective values for that point in the solution space
    :param Problem problem: description of the inputs and outputs the evaluator will use
    :param str error_mode: One of {'Failfast', 'Silent', 'Print'}.
        Failfast: Any error aborts the evaluation.
        Silent: Evaluation will return the `error_value` for any lists of values that raise an error.
        Print: Same as silent, but warnings are printed to stderr for any errors.
    :param tuple error_value: The value of the evaluation if an error occurs. Incompatible with error_mode='Failfast'.
        must have the form (objective_values, constraint_values).
    """
    eval_func_format = Callable[[List], Tuple[float, ...]]

    def __init__(self, evaluation_func: eval_func_format,
                 problem: Problem, error_mode='Failfast', error_value=None):
        """
        """

        super().__init__(problem=problem, error_mode=error_mode, error_value=error_value)
        self._evaluation_func = evaluation_func

[docs]    def eval_single(self, values: List) -> Tuple:
        return self._evaluation_func(values)


tabular = Union[DF, np.array]


# TODO: Add an option/subclass that automatically bundles several single variable models into a multiobjective model.
[docs]class AdaptiveSR(AbstractEvaluator, ABC):
    """AdaptiveSR(reference = None, error_mode = 'Failfast', error_value = None)
    A Template for making adaptive sampling based models compatible with the evaluator interface.

    :param AbstractEvaluator reference: A reference evaluator
    :param str error_mode: One of {'Failfast', 'Silent', 'Print'}.
        Failfast: Any error aborts the evaluation.
        Silent: Evaluation will return the `error_value` for any lists of values that raise an error.
        Print: Same as silent, but warnings are printed to stderr for any errors.
    :param tuple error_value: The value of the evaluation if an error occurs. Incompatible with error_mode='Failfast'.
        must have the form (objective_values, constraint_values).
    """

    # helper functions provided by AdaptiveSR (Generally avoid editing these, but use them as needed)
    # append_data(X, y)
    # do_infill
    # get_from_reference

    # functions with defaults (These can be removed from this template if you like the defaults)
    # They may depend on some of the optional functions in order to work if using the defaults
    # __init__
    # infill -> get_infill, _update_model
    # update_model

    # optional functions (These will not work unless you implement them)
    # get_infill

    # required functions
    # train
    # eval_single

    def __init__(self, reference: AbstractEvaluator = None,
                 error_mode='Failfast', error_value=None):
        self.reference: AbstractEvaluator = reference
        super().__init__(problem=reference.problem, error_mode=error_mode, error_value=error_value)

        self.model = None
        self.data: DF = pd.DataFrame(columns=self.problem.names(parts=['inputs', 'outputs', 'constraints']))

    @property
    def problem(self):
        return self.reference.problem

    @problem.setter
    def problem(self, value: Problem):
        self.reference.problem = value

[docs]    def append_data(self, data: tabular, deduplicate=True) -> None:
        """append_data(data, deduplicate = True)

        Adds the X and y data to input_data and output_data respectively

        :param tabular data: a table of training data to store
        :param boolean deduplicate: whether to remove duplicates from the combined DataFrame
        :return: None
        """
        self.cache_clear()  # TODO: decide on a consistent way of tracking this
        # can we assume users will only modify the data using this method or will call cache_clear themselves
        new_data = self.problem.to_df(data, ['inputs', 'outputs', 'constraints'])
        self.data = self.data.append(new_data, ignore_index=True)
        if deduplicate:
            self.data.drop_duplicates(inplace=True)

[docs]    def get_infill(self, num_datapoints: int) -> tabular:
        """get_infill(num_datapoints) -> tabular

        Generates data that is most likely to improve the model, and can be used for retraining.

        :param int num_datapoints: the number of datapoints to generate
        :return: the datapoints generated, in some tabular datastructure
        """
        raise NotImplementedError

[docs]    def do_infill(self, data: DF) -> None:
        """do_infill(data)

        Updates the model using the inputs X and outputs y, and stores the added data

        :param DF data: a table of training data
        :return: None
        """
        old_df = self.data
        df, parts = self.problem.partial_df(data, parts=['inputs', 'outputs', 'constraints'])
        if parts == ['inputs']:
            outputs: DF = self.get_from_reference(df)
            df = pd.concat([df, outputs], axis=1)
        self.append_data(df)
        if self.model is None:
            self.train()
        else:
            self.update_model(df, old_df)

[docs]    def update_model(self, new_data: tabular, old_data: DF = None) -> None:
        """update_model(new_data, old_data = None)

        Modifies self.model to incorporate the new data.

        This function should not edit the existing data

        :param tabular new_data: a table of inputs and outputs
        :param DF old_data: the table of inputs and outputs without the new data
        :return: None
        """
        self.train()

[docs]    def infill(self, num_datapoints: int) -> None:
        """infill(num_datapoints)

        Adds num_datapoints samples to the model and updates it.

        :param int num_datapoints: number of datapoints to add to the model's training set
        :return: None
        """
        inputs: DF = self.problem.to_df(self.get_infill(num_datapoints), 'inputs')
        outputs: DF = self.get_from_reference(inputs)
        self.do_infill(pd.concat([inputs, outputs], axis=1))

[docs]    @abstractmethod
    def train(self) -> None:
        """Generates a new model using the stored data, and stores it as self.model"""
        pass

[docs]    @abstractmethod
    def eval_single(self, values: List, **kwargs) -> Tuple:
        """eval_single(value, **kwargs) -> Tuple

        Evaluates a single input point

        :param List values: The datapoint to evaluate
        :param kwargs: Arbitrary keyword arguments.
        :return: A tuple of the predicted outputs for this datapoint
        """
        pass

[docs]    def get_from_reference(self, X: tabular) -> DF:
        """get_from_reference(X) -> DF

        Use the reference evaluator to get the real value of a dataframe of datapoints

        :param tabular X: a table containing the datapoints to evaluate
        :return: a DataFrame containing the results of the datapoints
        """
        df = self.problem.to_df(X, 'inputs')
        return self.reference.df_apply(df)


[docs]class EvaluatorEP(AbstractEvaluator, ABC):
    """EvaluatorEP(problem, building, epw, out_dir, err_dir, error_mode = 'Failfast', error_value = None)

    This evaluator uses a Problem to modify a building, and then simulate it.
    It keeps track of the building and the weather file.

    :param problem: a parametrization of the building and the desired outputs
    :param building: the building that is being simulated.
    :param epw: the epw file representing the weather
    :param out_dir: the directory used for files created by the EnergyPlus simulation.
    :param err_dir: the directory where files from a failed run are stored.
    :param error_mode: One of {'Failfast', 'Silent', 'Print'}.
        Failfast: Any error aborts the evaluation.
        Silent: Evaluation will return the `error_value` for any lists of values that raise an error.
        Print: Same as silent, but warnings are printed to stderr for any errors.
    :param error_value: The value of the evaluation if an error occurs. Incompatible with error_mode='Failfast'.
    """

    def __init__(self, problem: Problem,
                 building, epw=config.files['epw'], out_dir=config.out_dir,
                 err_dir=config.err_dir, error_mode='Failfast', error_value=None):
        super().__init__(problem=problem, error_mode=error_mode, error_value=error_value)
        self.out_dir = out_dir
        self.err_dir = err_dir
        for io in self.problem:
            io.setup(building)
        self.building = building
        self.epw = epw

[docs]    def eval_single(self, values: list):
        current_building = copy.deepcopy(self.building)
        for p, value in zip(self.problem.inputs, values):
            # apply the modification of each parameter to the building using the corresponding value
            p.transformation_function(current_building, value)
        results = run(current_building, out_dir=self.out_dir, err_dir=self.err_dir, epw=self.epw)
        outputs = tuple((objective(results) for objective in self.problem.outputs))
        constraints = tuple((constraint(results) for constraint in self.problem.constraints))
        return outputs, constraints

    @property
    def building(self):
        return self._building

    @building.setter
    def building(self, value):
        """Changes the building simulated.
        Changing this resets the cache.

        :param value: the building to use
        :return: None
        """
        self.cache_clear()
        self._building = value

    @property
    def epw(self):
        return self._epw

    @epw.setter
    def epw(self, value: str) -> None:
        """epw(value)

        Changes the epw file used with this building.
        Changing this resets the cache.

        :param str value: path to the new epw file to use.
        :return: None
        """
        self.cache_clear()
        self._epw = value