Codestin Search App

executable file
413 lines (378 loc) · 15 KB
# -*- coding: utf-8 -*-
Created on Tue Feb  6 09:49:36 2018
@author: tstopi
import yaml as y
from numpy import float64, interp, ones
import warnings
from collections import namedtuple
from pyropython.utils import read_data
from pyropython.objective_functions import get_objective_function
case = None
run_opts = namedtuple('run_opts',
                      ['num_jobs', 'max_iter', 'num_points',
                       'num_initial', 'initial_design',
                       'optimizer_opts','output_dir'])
run_opts.num_jobs = 1
run_opts.max_iter = 50
run_opts.num_points = 100
run_opts.num_initial = 100
run_opts.initial_design = "rand"
run_opts.optimizer_opts = {"base_estimator":       "ET",
                           "acq_func":             "gp_hedge",
                           "acq_optimizer":        "auto",
                           "n_initial_points":      100,
                           "acq_optimizer_kwargs":
                           {"n_points": 10000,
                            "n_restarts_optimizer": 5,
                            "n_jobs": 1},
                           "acq_func_kwargs":       {"xi": 0.01, "kappa": 1.96}
run_opts.output_dir = "Best/"
def _check_required_fields(dict, req_fields):
    Tries to find fields in a dict.
        dict - dictinionary to check
        req_fields - list of required keys
    Returns:
        not_found - list of fields not found.
    not_found = []
    for field in req_fields:
        if field not in dict:
            not_found.append(field)
        # check for keywords followed by no input.
        if dict[field] is None:
            not_found.append(field)
    return not_found
def _check_misspellings(dict, valid_keys):
    Checks keys in dict against valid keys. Suggest matches for misspellings
    from difflib import get_close_matches
    for key in dict:
        if key not in valid_keys:
            quess = get_close_matches(key, valid_keys, 1)
            msg = "Unknown keyword {key:s} did you mean {q:s}?"
            warnings.warn(msg.format(key=key, q=quess))
def _proc_optimizer_opts(args_dict):
    """Process optimizer kwargs. 
    This is meainly used to set different defaults
    for skopt.learn - Tree regressors. 
    from skopt.utils import cook_estimator
    if args_dict is None:
        return {}
    if "base_estimator" in args_dict:
        if args_dict["base_estimator"]=="ET":
            args = {"n_estimators": 100,
                    "min_samples_leaf":3,
                    "max_depth":None,
                    "bootstrap":False}
        elif args_dict["base_estimator"]=="ET2":
            args = {"n_estimators": 1000,
                    "min_samples_leaf":1,
                    "max_depth":None,
                    "bootstrap":False}
            args_dict["base_estimator"]="ET"
        elif args_dict["base_estimator"]=="RF":
            args = {"n_estimators": 100,
                    "min_samples_leaf": 1,
                    "max_depth": None,
                    "bootstrap": True}
        elif args_dict["base_estimator"]=="GBRT":
            args = None
        else:
            args = None
        if args: 
            args_dict["base_estimator"] = cook_estimator(
                                            args_dict["base_estimator"],
    return args_dict
def _set_data_line_defaults(line,
                            ind_col_name="Time",
                            normalize=False,
                            conversion_factor=1.0,
                            header=1,
                            filter_type="None",
                            filter_opts={},
                            gradient=False):
    This is a convenience function to set the default values for data line
    and check for missing values
        line - dictionary containing the data line description
    kwargs:
        optional arguments and their default values
    not_found = _check_required_fields(line, ["dep_col_name", "fname"])
    if not_found:
        raise KeyError("required field(s) %s not found." % str(not_found))
    line.setdefault("ind_col_name", ind_col_name)
    line.setdefault("normalize", normalize)
    line.setdefault("conversion_factor", conversion_factor)
    line.setdefault("header", header)
    line.setdefault("filter_type", filter_type)
    line.setdefault("filter_opts", filter_opts)
    line.setdefault("gradient", gradient)
    return line
def _check_templates(templates,params):
    """This function attempts to render the  given templates
    from jinja2 import Environment, FileSystemLoader
    from jinja2 import TemplateSyntaxError,TemplateNotFound, TemplateError
    cwd = os.getcwd()
    env = Environment(loader=FileSystemLoader(cwd))
    error = False
    for fname in templates:
        template = env.get_template(fname)
        variables = {name: 0.5*(minval + maxval)
                     for name, (minval, maxval) in params}
        try:
            output = template.render(**variables)
        except TemplateSyntaxError as err:
            print(err.message)
            print("Filename:",err.filename)
            print("Line number:",err.lineno)
            error = True
            pass
        except TemplateNotFound as err:
            print("Template %s not found",err.name)
            error = True
            pass
        except TemplateError as err:
            print("Error wihle processing tmeplate %s" % fname)
            error = True
            pass
    if error:
        sys.exit('Problems with templates. Exiting.')
def read_model(input):
    This function creates a initialized Model object based on the dictionary
    "cfg". The dictionary is assumed to be produced by reading a yaml file.
    if isinstance(input, str):
        lines = open(input, "r").read()
        cfg = y.load(lines)
    elif isinstance(input, dict):
        cfg = input
    Check for required fields
    not_found = _check_required_fields(cfg, ["simulation",
                                             "experiment",
                                             "variables",
                                             "templates"])
    if not_found:
        raise KeyError("Required field(s) %s not found in config." %
                       str(not_found))
    # handle empyty keywords and misspelled fields
    for key, value in cfg.items():
        if value is None:
            value = {}
            msg = "Empty keyword {field:s} in config."
            warnings.warn(msg.format(field=key))
    #keywords = ["objective"]
    #_check_misspellings(cfg,keywords)
     yaml is sometimes unable to correctly convert str to float.
     For example, scientific notation like "1e15" will  fail.
     Here we explicitly attempt to convert numeric input to floats
    variables = list(cfg['variables'].items())
    for n, (name, bounds) in enumerate(variables):
        try:
            variables[n] = (name, float64(bounds))
        except ValueError:
            raise TypeError("Bounds for %s need to benumeric (for now)." %
    simulation = cfg['simulation']
    experiment = cfg['experiment']
    for key in cfg['simulation']:
        if key not in cfg['experiment']:
            raise KeyError("No experimental data for variable %s" % key)
    for key in cfg['experiment']:
        if key not in cfg['simulation']:
            raise KeyError("No simulation data for variable %s" % key)
    if len(cfg['templates']) < 1:
        raise ValueError("Templates list cannot be empty.")
    templates =  cfg['templates']
    # set default values for data lines
    for key, line in simulation.items():
        line = _set_data_line_defaults(line)
    exp_data = {}
    for key, line in experiment.items():
        """
        For experimental data we expect only one header line unless indicates
        otherwise
        """
        line = _set_data_line_defaults(line,
        exp_data[key] = read_data(**line)
    Read and process the "objective" dictionary
    obj = cfg.get("objective", {})
    objective_name = obj.get("type", "mse")
    objective_function = get_objective_function(objective_name)
    objective_opts = obj.get("objective_opts", {})
    data_weights = obj.get("data_weights", {})
    var_weights = obj.get("var_weights", {})
     Process weights for each  variable.
     if weights are not given, set weight to 1.0 for all datasets
    if len(var_weights) > 0:
        if set(var_weights) != set(simulation):
            warnings.warn(
                "If weights are defined for one or more variables they " +
                "should  be defined for all variables in 'experiment'" +
                " and 'simulation'. Weights will be set to unity. " +
                " Missing: \n %s " %
                str(set(var_weights).symmetric_difference(set(simulation))))
            for key in experiment:
                var_weights[key] = 1.0
        for key in experiment:
            var_weights[key] = 1.0
    Weights can be read from a file as a list of tuples in the format
     [(x,w),(x,w),(x,w)] where x is the independent variable and
     w is the weight
     weights will be interpolated to coincide with the experimental data
    for key, (etime, edata) in exp_data.items():
        if key in data_weights:
            entry = data_weights[key]
            if isinstance(entry, dict):
                wtime, weights = read_data(**entry)
            elif isinstance(entry, list):
                wtime, weights = zip(*entry)
            else:
                warnings.warn(("Problem with weights for variable %s."
                               "Weigths set to one.") % key)
                wtime = etime
                weights = ones(len(etime))
        else:
            wtime = etime
            weights = ones(len(etime))
        weightsi = interp(etime, wtime, weights)
        data_weights[key] = weightsi
    if "fds_command" not in cfg:
        warnings.warn("fds_command not defined. Using 'fds'")
    fds_command = cfg.get("fds_command", "fds")
    # check if fds_command is found and executable
    if not os.path.isfile(fds_command) or not os.access(fds_command, os.X_OK):
        raise ValueError(("The executable %s can not found or not executable" %
                          fds_command))
    # Check ih the temnplates can be rendered
    _check_templates(templates, variables)
    tempdir = os.path.join(os.getcwd(), "Work/")
    from pyropython.model import Model
    return Model(exp_data=exp_data,
                 params=variables,
                 simulation=simulation,
                 var_weights=var_weights,
                 data_weights=data_weights,
                 templates=templates,
                 command=fds_command,
                 objective_function=objective_function,
                 tempdir=tempdir,
                 objective_opts=objective_opts)
def read_plots(input):
    This function reads a config file and gathers all data needed for 'plots'
    if isinstance(input, str):
        lines = open(input, "r").read()
        cfg = y.load(lines)
    elif isinstance(input, dict):
        cfg = input
    plot_data = namedtuple('plot_data',
                           ['raw_data',
                            'simulation',
                            'exp_data',
                            'plots',
                            'fig_dir',
                            'output_dir'
    simulation = cfg.get('simulation', {})
    experiment = cfg.get('experiment', {})
    for key, line in simulation.items():
        line = _set_data_line_defaults(line)
    # set default values for data lines
    plot_data.simulation = simulation
    plot_data.plots = cfg.get('plots', {})
    plot_data.exp_data = {}
    plot_data.raw_data = {}
    for key, line in experiment.items():
        """
        For experimental data we expect only one header line unless indicates
        otherwise
        """
        line = _set_data_line_defaults(line,
        plot_data.exp_data[key] = read_data(**line)
        tmp = dict(line)  # create copy
        tmp["filter_type"] = "None"
        plot_data.raw_data[key] = read_data(**tmp)
    run_opts = proc_general_options(input)
    plot_data.fig_dir = run_opts.fig_dir
    plot_data.output_dir = run_opts.output_dir
    return plot_data
def proc_general_options(input):
    if isinstance(input, str):
        lines = open(input, "r").read()
        cfg = y.load(lines)
    elif isinstance(input, dict):
        cfg = input
    run_opts = namedtuple('run_opts',
                          ['num_jobs', 'max_iter', 'num_points',
                           'num_initial', 'initial_design',
                           'initial_points_from_file',
                           'optimizer_opts', 'optimizer_name', 'output_dir',
                           'case_name','fig_dir'])
    run_opts.max_iter = cfg.get("max_iter", 1)
    run_opts.num_jobs = cfg.get("num_jobs", 1)
    run_opts.num_points = cfg.get("num_points", 1)
    run_opts.num_initial = cfg.get("num_initial", 1)
    run_opts.initial_design = cfg.get("initial_design", "rand")
    opt = cfg.get("optimizer", {})
    run_opts.optimizer_opts = _proc_optimizer_opts(opt) 
    run_opts.optimizer_name = cfg.get("optimizer_name", "skopt")
    run_opts.output_dir = cfg.get("output_dir", "Best/")
    run_opts.fig_dir = cfg.get("fig_dir", "Figs/")
    run_opts.casename = cfg.get("casename", "")
    run_opts.logfilename = cfg.get("logfilename", "log.csv")
    run_opts.initial_design_file = cfg.get("initial_design_file", 
    if "output_dir" not in cfg and "casename" in cfg:
        run_opts.output_dir = run_opts.casename + "/"
    if "logfilename" not in cfg and "casename" in cfg:
        run_opts.logfilename = run_opts.casename + ".csv"
    if "fig_dir" not in cfg and "casename" in cfg:
        run_opts.fig_dir = "Figs_" + run_opts.casename +"/"
    # Add trailing slash if it isn't there
    run_opts.output_dir = os.path.join(run_opts.output_dir, '')
    run_opts.fig_dir = os.path.join(run_opts.fig_dir, '')
    return run_opts
def read_config(fname):
    Reads and processes pyropython config file
    case = read_model(fname)
    # check for misspelled keys
    run_opts = proc_general_options(fname)
    return case, run_opts
def main():
    fname = sys.argv[1]
    read_config(fname)
    print(run_opts.num_jobs)
    print(len(case.exp_data))
if __name__ == "__main__":
Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

config.py

Latest commit

History

config.py

File metadata and controls