Source code for mpisppy.utils.sputils

# Copyright 2020 by B. Knueven, D. Mildebrath, C. Muir, J-P Watson, and D.L. Woodruff
# This software is distributed under the 3-clause BSD License.
# Base and utility functions for mpisppy
# Note to developers: things called spcomm are way more than just a comm; SPCommunicator

import pyomo.environ as pyo
import sys
import os
import re
import time
import numpy as np
import mpisppy.scenario_tree as scenario_tree
from pyomo.core import Objective

from mpisppy import MPI, haveMPI
global_rank = MPI.COMM_WORLD.Get_rank()
from pyomo.core.expr.numeric_expr import LinearExpression
from pyomo.opt import SolutionStatus, TerminationCondition

from mpisppy import tt_timer, global_toc

def not_good_enough_results(results):
    return (results is None) or (len(results.solution) == 0) or \
        (results.solution(0).status == SolutionStatus.infeasible) or \
        (results.solver.termination_condition == TerminationCondition.infeasible) or \
        (results.solver.termination_condition == TerminationCondition.infeasibleOrUnbounded) or \
        (results.solver.termination_condition == TerminationCondition.unbounded)


_spin_the_wheel_move_msg = \
        "spin_the_wheel should now be used as the class "\
        "mpisppy.spin_the_wheel.WheelSpinner using the method `spin()`. Output "\
        "writers are now methods of the class WheelSpinner."

def spin_the_wheel(hub_dict, list_of_spoke_dict, comm_world=None):
    raise RuntimeError(
            _spin_the_wheel_move_msg + \
            " See the example code below for a fix:\n"
    '''
    from mpisppy.spin_the_wheel import WheelSpinner
    ws = WheelSpinner(hub_dict, list_of_spoke_dict)
    ws.spin(comm_world=comm_world)
    '''
    )

def first_stage_nonant_npy_serializer(file_name, scenario, bundling):
    # write just the nonants for ROOT in an npy file (e.g. for Conf Int)
    root = scenario._mpisppy_node_list[0]
    assert root.name == "ROOT"
    root_nonants = np.fromiter((pyo.value(var) for var in root.nonant_vardata_list), float)
    np.save(file_name, root_nonants)

def first_stage_nonant_writer( file_name, scenario, bundling ):
    with open(file_name, 'w') as f:
        root = scenario._mpisppy_node_list[0]
        assert root.name == "ROOT"
        for var in root.nonant_vardata_list:
            var_name = var.name
            if bundling:
                dot_index = var_name.find('.')
                assert dot_index >= 0
                var_name = var_name[(dot_index+1):]
            f.write(f"{var_name},{pyo.value(var)}\n")

def scenario_tree_solution_writer( directory_name, scenario_name, scenario, bundling ):
    with open(os.path.join(directory_name, scenario_name+'.csv'), 'w') as f:
        for var in scenario.component_data_objects(
                ctype=(pyo.Var, pyo.Expression),
                descend_into=True,
                active=True,
                sort=True):
            var_name = var.name
            if bundling:
                dot_index = var_name.find('.')
                assert dot_index >= 0
                var_name = var_name[(dot_index+1):]
            f.write(f"{var_name},{pyo.value(var)}\n")
        
def write_spin_the_wheel_first_stage_solution(spcomm, opt_dict, solution_file_name,
        first_stage_solution_writer=first_stage_nonant_writer):
    raise RuntimeError(_spin_the_wheel_move_msg)

def write_spin_the_wheel_tree_solution(spcomm, opt_dict, solution_directory_name,
        scenario_tree_solution_writer=scenario_tree_solution_writer):
    raise RuntimeError(_spin_the_wheel_move_msg)

def local_nonant_cache(spcomm):
    raise RuntimeError(_spin_the_wheel_move_msg)

### a few Pyomo-related utilities ###


def get_objs(scenario_instance, allow_none=False):
    """ return the list of objective functions for scenario_instance"""
    scenario_objs = scenario_instance.component_data_objects(pyo.Objective,
                    active=True, descend_into=True)
    scenario_objs = list(scenario_objs)
    if (len(scenario_objs) == 0) and not allow_none:
        raise RuntimeError(f"Scenario {scenario_instance.name} has no active "
                           "objective functions.")
    if (len(scenario_objs) > 1):
        print("WARNING: Scenario", sname, "has multiple active "
              "objectives. Selecting the first objective.")
    return scenario_objs


def stash_ref_objs(scenario_instance):
    """Stash a reference to active objs so
        Reactivate_obj can use the reference to reactivate them/it later.
    """
    scenario_instance._mpisppy_data.obj_list = get_objs(scenario_instance)


def deact_objs(scenario_instance):
    """ Deactivate objs 
    Args:
        scenario_instance (Pyomo ConcreteModel): the scenario
    Returns:
        obj_list (list of Pyomo Objectives): the deactivated objs
    Note: If none are active, just do nothing
    """
    obj_list = get_objs(scenario_instance, allow_none=True)
    for obj in obj_list:
        obj.deactivate()
    return obj_list


def reactivate_objs(scenario_instance):
    """ Reactivate ojbs stashed by stash_ref_objs """
    if not hasattr(scenario_instance._mpisppy_data, "obj_list"):
        raise RuntimeError("reactivate_objs called with prior call to stash_ref_objs")
    for obj in scenario_instance._mpisppy_data.obj_list:
        obj.activate()

    

[docs]
def create_EF(scenario_names, scenario_creator, scenario_creator_kwargs=None,
              EF_name=None, suppress_warnings=False,
              nonant_for_fixed_vars=True):
    """ Create a ConcreteModel of the extensive form.

        Args:
            scenario_names (list of str):
                Names for each scenario to be passed to the scenario_creator
                function.
            scenario_creator (callable):
                Function which takes a scenario name as its first argument and
                returns a concrete model corresponding to that scenario.
            scenario_creator_kwargs (dict, optional):
                Options to pass to `scenario_creator`.
            EF_name (str, optional):
                Name of the ConcreteModel of the EF.
            suppress_warnings (boolean, optional):
                If true, do not display warnings. Default False.
            nonant_for_fixed_vars (bool--optional): If True, enforces
                non-anticipativity constraints for all variables, including
                those which have been fixed. Default is True.

        Returns:
            EF_instance (ConcreteModel):
                ConcreteModel of extensive form with explicit
                non-anticipativity constraints.

        Note:
            If any of the scenarios produced by scenario_creator do not have a
            ._mpisppy_probability attribute, this function displays a warning, and assumes
            that all scenarios are equally likely.
    """
    if scenario_creator_kwargs is None:
        scenario_creator_kwargs = dict()
    scen_dict = {
        name: scenario_creator(name, **scenario_creator_kwargs)
        for name in scenario_names
    }

    if (len(scen_dict) == 0):
        raise RuntimeError("create_EF() received empty scenario list")
    elif (len(scen_dict) == 1):
        scenario_instance = list(scen_dict.values())[0]
        scenario_instance._ef_scenario_names = list(scen_dict.keys())
        if not suppress_warnings:
            print("WARNING: passed single scenario to create_EF()")
        # special code to patch in ref_vars
        scenario_instance.ref_vars = dict()
        scenario_instance._nlens = {node.name: len(node.nonant_vardata_list) 
                                for node in scenario_instance._mpisppy_node_list}
        for node in scenario_instance._mpisppy_node_list:
            ndn = node.name

            for i in range(scenario_instance._nlens[ndn]):
                v = node.nonant_vardata_list[i]
                if (ndn, i) not in scenario_instance.ref_vars:
                    scenario_instance.ref_vars[(ndn, i)] = v
        # patch in EF_Obj        
        scenario_objs = deact_objs(scenario_instance)        
        obj = scenario_objs[0]            
        sense = pyo.minimize if obj.is_minimizing() else pyo.maximize
        scenario_instance.EF_Obj = pyo.Objective(expr=obj.expr, sense=sense)

        return scenario_instance  #### special return for single scenario

    # Check if every scenario has a specified probability
    probs_specified = \
        all(hasattr(scen, '_mpisppy_probability') for scen in scen_dict.values())
    uniform_specified = \
        probs_specified and all(scen._mpisppy_probability == "uniform" for scen in scen_dict.values())
    if not probs_specified or uniform_specified:
        for scen in scen_dict.values():
            scen._mpisppy_probability = 1 / len(scen_dict)
        if not suppress_warnings and not uniform_specified:
            print('WARNING: At least one scenario is missing _mpisppy_probability attribute.',
                  'Assuming equally-likely scenarios...')

    EF_instance = _create_EF_from_scen_dict(scen_dict,
                                            EF_name=EF_name,
                                            nonant_for_fixed_vars=nonant_for_fixed_vars)
    return EF_instance


def _create_EF_from_scen_dict(scen_dict, EF_name=None,
                                nonant_for_fixed_vars=True):
    """ Create a ConcreteModel of the extensive form from a scenario
        dictionary.

        Args:
            scen_dict (dict): Dictionary whose keys are scenario names and
                values are ConcreteModel objects corresponding to each
                scenario.
            EF_name (str--optional): Name of the resulting EF model.
            nonant_for_fixed_vars (bool--optional): If True, enforces
                non-anticipativity constraints for all variables, including
                those which have been fixed. Default is True.

        Returns:
            EF_instance (ConcreteModel): ConcreteModel of extensive form with
                explicity non-anticipativity constraints.

        Notes:
            The non-anticipativity constraints are enforced by creating
            "reference variables" at each node in the scenario tree (excluding
            leaves) and enforcing that all the variables for each scenario at
            that node are equal to the reference variables.

            This function is called directly when creating bundles for PH.
 
            Does NOT assume that each scenario is equally likely. Raises an
            AttributeError if a scenario object is encountered which does not
            have a ._mpisppy_probability attribute.

            Added the flag nonant_for_fixed_vars because original code only
            enforced non-anticipativity for non-fixed vars, which is not always
            desirable in the context of bundling. This allows for more
            fine-grained control.
    """
    is_min, clear = _models_have_same_sense(scen_dict)
    if (not clear):
        raise RuntimeError('Cannot build the extensive form out of models '
                           'with different objective senses')
    sense = pyo.minimize if is_min else pyo.maximize
    EF_instance = pyo.ConcreteModel(name=EF_name)
    EF_instance.EF_Obj = pyo.Objective(expr=0.0, sense=sense)

    # we don't strictly need these here, but it allows for eliding
    # of single scenarios and bundles when convenient
    EF_instance._mpisppy_data = pyo.Block(name="For non-Pyomo mpi-sppy data")
    EF_instance._mpisppy_model = pyo.Block(name="For mpi-sppy Pyomo additions to the scenario model")
    EF_instance._mpisppy_data.scenario_feasible = None

    EF_instance._ef_scenario_names = []
    EF_instance._mpisppy_probability = 0
    for (sname, scenario_instance) in scen_dict.items():
        EF_instance.add_component(sname, scenario_instance)
        EF_instance._ef_scenario_names.append(sname)
        # Now deactivate the scenario instance Objective
        scenario_objs = deact_objs(scenario_instance)
        obj_func = scenario_objs[0] # Select the first objective
        try:
            EF_instance.EF_Obj.expr += scenario_instance._mpisppy_probability * obj_func.expr
            EF_instance._mpisppy_probability   += scenario_instance._mpisppy_probability
        except AttributeError as e:
            raise AttributeError("Scenario " + sname + " has no specified "
                        "probability. Specify a value for the attribute "
                        " _mpisppy_probability and try again.") from e
    # Normalization does nothing when solving the full EF, but is required for
    # appropraite scaling of EFs used as bundles.
    EF_instance.EF_Obj.expr /= EF_instance._mpisppy_probability

    # For each node in the scenario tree, we need to collect the
    # nonanticipative vars and create the constraints for them,
    # which we do using a reference variable.
    ref_vars = dict() # keys are _nonant_indices (i.e. a node name and a
                      # variable number)

    ref_suppl_vars = dict()

    EF_instance._nlens = dict() 

    nonant_constr = pyo.Constraint(pyo.Any, name='_C_EF_')
    EF_instance.add_component('_C_EF_', nonant_constr)

    nonant_constr_suppl = pyo.Constraint(pyo.Any, name='_C_EF_suppl')
    EF_instance.add_component('_C_EF_suppl', nonant_constr_suppl)

    for (sname, s) in scen_dict.items():
        nlens = {node.name: len(node.nonant_vardata_list) 
                            for node in s._mpisppy_node_list}
        
        for (node_name, num_nonant_vars) in nlens.items(): # copy nlens to EF
            if (node_name in EF_instance._nlens.keys() and
                num_nonant_vars != EF_instance._nlens[node_name]):
                raise RuntimeError("Number of non-anticipative variables is "
                    "not consistent at node " + node_name + " in scenario " +
                    sname)
            EF_instance._nlens[node_name] = num_nonant_vars

        nlens_ef_suppl = {node.name: len(node.nonant_ef_suppl_vardata_list)
                                   for node in s._mpisppy_node_list}

        for node in s._mpisppy_node_list:
            ndn = node.name
            for i in range(nlens[ndn]):
                v = node.nonant_vardata_list[i]
                if (ndn, i) not in ref_vars:
                    # grab the reference variable
                    if (nonant_for_fixed_vars) or (not v.is_fixed()):
                        ref_vars[(ndn, i)] = v
                # Add a non-anticipativity constraint, except in the case when
                # the variable is fixed and nonant_for_fixed_vars=False.
                elif (nonant_for_fixed_vars) or (not v.is_fixed()):
                    expr = LinearExpression(linear_coefs=[1,-1],
                                            linear_vars=[v,ref_vars[(ndn,i)]],
                                            constant=0.)
                    nonant_constr[(ndn,i,sname)] = (expr, 0.0)

            for i in range(nlens_ef_suppl[ndn]):
                v = node.nonant_ef_suppl_vardata_list[i]
                if (ndn, i) not in ref_suppl_vars:
                    # create the reference variable as a singleton with long name
                    # xxxx maybe index by _nonant_index ???? rather than singleton VAR ???
                    ref_suppl_vars[(ndn, i)] = v
                # Add a non-anticipativity constraint, expect in the case when
                # the variable is fixed and nonant_for_fixed_vars=False.
                elif (nonant_for_fixed_vars) or (not v.is_fixed()):
                        expr = LinearExpression(linear_coefs=[1,-1],
                                                linear_vars=[v,ref_suppl_vars[(ndn,i)]],
                                                constant=0.)
                        nonant_constr_suppl[(ndn,i,sname)] = (expr, 0.0)

    EF_instance.ref_vars = ref_vars
    EF_instance.ref_suppl_vars = ref_suppl_vars
                        
    return EF_instance

def _models_have_same_sense(models):
    ''' Check if every model in the provided dict has the same objective sense.

        Input:
            models (dict) -- Keys are scenario names, values are Pyomo
                ConcreteModel objects.
        Returns:
            is_minimizing (bool) -- True if and only if minimizing. None if the
                check fails.
            check (bool) -- True only if all the models have the same sense (or
                no models were provided)
        Raises:
            ValueError -- If any of the models has either none or multiple
                active objectives.
    '''
    if (len(models) == 0):
        return True, True
    senses = [find_active_objective(scenario).is_minimizing()
                for scenario in models.values()]
    sense = senses[0]
    check = all(val == sense for val in senses)
    if (check):
        return (sense == pyo.minimize), check
    return None, check

def is_persistent(solver):
    return isinstance(solver,
        pyo.pyomo.solvers.plugins.solvers.persistent_solver.PersistentSolver)
    
def ef_scenarios(ef):
    """ An iterator to give the scenario sub-models in an ef
    Args:
        ef (ConcreteModel): the full extensive form model

    Yields:
        scenario name, scenario instance (str, ConcreteModel)
    """    
    for sname in ef._ef_scenario_names:
        yield (sname, getattr(ef, sname))

def ef_nonants(ef):
    """ An iterator to give representative Vars subject to non-anticipitivity
    Args:
        ef (ConcreteModel): the full extensive form model

    Yields:
        tree node name, full EF Var name, Var value

    Note:
        not on an EF object because not all ef's are part of an EF object
    """
    for (ndn,i), var in ef.ref_vars.items():
        yield (ndn, var, pyo.value(var))

        
def ef_nonants_csv(ef, filename):
    """ Dump the nonant vars from an ef to a csv file; truly a dump...
    Args:
        ef (ConcreteModel): the full extensive form model
        filename (str): the full name of the csv output file
    """
    with open(filename, "w") as outfile:
        outfile.write("Node, EF_VarName, Value\n")
        for (ndname, varname, varval) in ef_nonants(ef):
            outfile.write("{}, {}, {}\n".format(ndname, varname, varval))

            
def nonant_cache_from_ef(ef,verbose=False):
    """ Populate a nonant_cache from an ef. Also works with multi-stage
    Args:
        ef (mpi-sppy ef): a solved ef
    Returns:
        nonant_cache (dict of numpy arrays): a special structure for nonant values
    """     
    nonant_cache = dict()
    nodenames = set([ndn for (ndn,i) in ef.ref_vars])
    for ndn in sorted(nodenames):
        nonant_cache[ndn]=[]
        i = 0
        while ((ndn,i) in ef.ref_vars):
            xvar = pyo.value(ef.ref_vars[(ndn,i)])
            nonant_cache[ndn].append(xvar)
            if verbose:
                print("barfoo", i, xvar)
            i+=1
    return nonant_cache


def ef_ROOT_nonants_npy_serializer(ef, filename):
    """ write the root node nonants to be ready by a numpy load
    Args:
        ef (ConcreteModel): the full extensive form model
        filename (str): the full name of the .npy output file
    """
    root_nonants = np.fromiter((v for ndn,var,v in ef_nonants(ef) if ndn == "ROOT"), float)
    np.save(filename, root_nonants)

def write_ef_first_stage_solution(ef,
                                  solution_file_name,
                                  first_stage_solution_writer=first_stage_nonant_writer):
    """ 
    Write a solution file, if a solution is available, to the solution_file_name provided
    Args:
        ef : A Concrete Model of the Extensive Form (output of create_EF). 
             We assume it has already been solved.
        solution_file_name : filename to write the solution to
        first_stage_solution_writer (optional) : custom first stage solution writer function
    
    NOTE:
        This utility is replicating WheelSpinner.write_first_stage_solution for EF
    """
    if global_rank == 0:
        representative_scenario = getattr(ef,ef._ef_scenario_names[0])
        first_stage_solution_writer(solution_file_name, 
                                    representative_scenario,
                                    bundling=False)

def write_ef_tree_solution(ef, solution_directory_name,
        scenario_tree_solution_writer=scenario_tree_solution_writer):
    """ Write a tree solution directory, if available, to the solution_directory_name provided
    Args:
        ef : A Concrete Model of the Extensive Form (output of create_EF). 
             We assume it has already been solved.
        solution_file_name : filename to write the solution to
        scenario_tree_solution_writer (optional) : custom scenario solution writer function
        
    NOTE:
        This utility is replicating WheelSpinner.write_tree_solution for EF
    """
    if global_rank==0:
        os.makedirs(solution_directory_name, exist_ok=True)
        for scenario_name, scenario in ef_scenarios(ef):
            scenario_tree_solution_writer(solution_directory_name,
                                          scenario_name, 
                                          scenario,
                                          bundling=False)
    

def extract_num(string):
    ''' Given a string, extract the longest contiguous
        integer from the right-hand side of the string.

        Example:
            scenario324 -> 324

        TODO: Add Exception Handling
    '''
    return int(re.compile(r'(\d+)$').search(string).group(1))

def node_idx(node_path,branching_factors):
    '''
    Computes a unique id for a given node in a scenario tree.
    It follows the path to the node, computing the unique id for each ascendant.

    Parameters
    ----------
    node_path : list of int
        A list of integer, specifying the path of the node.
    branching_factors : list of int
        branching_factors of the scenario tree.

    Returns
    -------
    node_idx
        Node unique id.
        
    NOTE: Does not work with unbalanced trees.

    '''
    if node_path == []: #ROOT node
        return 0
    else:
        stage_id = 0 #node unique id among stage t+1 nodes.
        for t in range(len(node_path)):
            stage_id = node_path[t]+branching_factors[t]*stage_id
        node_idx = _nodenum_before_stage(len(node_path),branching_factors)+stage_id
        return node_idx

def _extract_node_idx(nodename,branching_factors):
    """
    

    Parameters
    ----------
    nodename : str
        The name of a node, e.g. 'ROOT_2_0_4'.
    branching_factors : list
        Branching factor of a scenario tree, e.g. [3,2,8,4,3].

    Returns
    -------
    node_idx : int
        A unique integer that can be used as a key to designate this scenario.

    """
    if nodename =='ROOT':
        return 0
    else:
        to_list = [int(x) for x in re.findall(r'\d+',nodename)]
        return node_idx(to_list,branching_factors)

def parent_ndn(nodename):
    if nodename == 'ROOT':
        return None
    else:
        return re.search('(.+)_(\d+)',nodename).group(1)

    
def option_string_to_dict(ostr):
    """ Convert a string to the standard dict for solver options.
    Intended for use in the calling program; not internal use here.

    Args:
        ostr (string): space seperated options with = for arguments

    Returns:
        solver_options (dict): solver options

    """
    def convert_value_string_to_number(s):
        try:
            return int(s)
        except ValueError:
            try:
                return float(s)
            except ValueError:
                return s

    solver_options = dict()
    if ostr is None or ostr == "":
        return None
    for this_option_string in ostr.split():
        this_option_pieces = this_option_string.strip().split("=")
        if len(this_option_pieces) == 2:
            option_key = this_option_pieces[0]
            option_value = convert_value_string_to_number(this_option_pieces[1])
            solver_options[option_key] = option_value
        elif len(this_option_pieces) == 1:
            option_key = this_option_pieces[0]
            solver_options[option_key] = None
        else:
            raise RuntimeError("Illegally formed subsolve directive"\
                               + " option=%s detected" % this_option)
    return solver_options


def option_dict_to_string(odict):
    """ Convert a standard dict for solver options to a string.

    Args:
        odict (dict): options dict for Pyomo

    Returns:
        ostring (str): options string as in mpi-sppy

    Note: None begets None, and empty begets empty

    """
    if odict is None:
        return None
    ostr = ""
    for i, v in odict.items():
        if v is None:
            ostr += "{i} "
        else:
            ostr += f"{i}={v} "
    return ostr


################################################################################
# Various utilities related to scenario rank maps (some may not be in use)


def scens_to_ranks(scen_count, n_proc, rank, branching_factors = None):
    """ Determine the rank assignments that are made in spbase.
    NOTE: Callers to this should call _scentree.scen_names_to_ranks
    Args:
        scen_count (int): number of scenarios
        n_proc (int): the number of intra ranks (within the cylinder)
        rank (int): my rank (i.e., intra; i.e., within the cylinder)
    Returns:
        slices (list of ranges): the indices into all all_scenario_names to assign to rank
                                 (the list entries are ranges that correspond to ranks)
        scenario_name_to_rank (dict of dict): only for multi-stage
                keys are comms (i.e., tree nodes); values are dicts with keys
                that are scenario names and values that are ranks

    """
    if not haveMPI:
        raise RuntimeError("scens_to_ranks called, but cannot import mpi4py")
    if scen_count < n_proc:
        raise RuntimeError(
            "More MPI ranks (%d) supplied than needed given the number of scenarios (%d) "
            % (n_proc, scen_count)
        )

    # for now, we are treating two-stage as a special case
    if (branching_factors is None):
        avg = scen_count / n_proc
        slices = [list(range(int(i * avg), int((i + 1) * avg))) for i in range(n_proc)]
        return slices, None
    else:
        # OCT 2020: this block is never triggered and would fail.
        # indecision as of May 2020 (delete this comment DLW)
        # just make sure things are consistent with what xhat will do...
        # TBD: streamline
        all_scenario_names = ["ID"+str(i) for i in range(scen_count)]
        tree = _ScenTree(branching_factors, all_scenario_names)
        scenario_names_to_ranks, slices, = tree.scen_name_to_rank(n_proc, rank)
        return slices, scenario_names_to_ranks

def _nodenum_before_stage(t,branching_factors):
    #How many nodes in a tree of stage 1,2,...,t ?
    #Only works with branching factors
    return int(sum(np.prod(branching_factors[0:i]) for i in range(t)))

def find_leaves(all_nodenames):
    #Take a list of all nodenames from a tree, and find the leaves of it.
    #WARNING: We do NOT check that the tree is well constructed
    
    if all_nodenames is None or all_nodenames == ['ROOT']:
        return {'ROOT':False} # 2 stage problem: no leaf nodes in all_nodenames
    #A leaf is simply a root with no child n°0
    is_leaf = dict()
    for ndn in all_nodenames:
        if ndn+"_0" in all_nodenames:
            is_leaf[ndn] = False
        else:
            is_leaf[ndn] = True
    return is_leaf
            
    
class _TreeNode():
    #Create the subtree generated by a node, with associated scenarios
    # stages are 1-based, everything else is 0-based
    # scenario lists are stored as (first, last) indices in all_scenarios
    #This is also checking that the nodes from all_nodenames are well-named.
    def __init__(self, Parent, scenfirst, scenlast, desc_leaf_dict, name):
        #desc_leaf_dict is the output of find_leaves
        self.scenfirst = scenfirst #id of the first scenario with this node
        self.scenlast = scenlast #id of the last scenario with this node
        self.name = name
        numscens = scenlast - scenfirst + 1 #number of scenarios with this node
        self.is_leaf = False
        if Parent is None:
            assert(self.name == "ROOT")
            self.stage = 1
        else:
            self.stage = Parent.stage + 1
        if len(desc_leaf_dict)==1 and list(desc_leaf_dict.keys()) == ['ROOT']: 
            #2-stage problem, we don't create leaf nodes
            self.kids = []
        elif not name+"_0" in desc_leaf_dict:
            self.is_leaf = True
            self.kids = []
        else:
            if len(desc_leaf_dict) < numscens:                
                raise RuntimeError(f"There are more scenarios ({numscens}) than remaining leaves, for the node {name}")
            # make children
            first = scenfirst
            self.kids = list()
            child_regex = re.compile(name+'_\d*\Z')
            child_list = [x for x in desc_leaf_dict if child_regex.match(x) ]
            for i in range(len(desc_leaf_dict)):
                childname = name+f"_{i}"
                if not childname in desc_leaf_dict:
                    if len(child_list) != i:
                        raise RuntimeError("The all_nodenames argument is giving an inconsistent tree."
                                           f"The node {name} has {len(child_list)} children, but {childname} is not one of them.")
                    break
                childdesc_regex = re.compile(childname+'(_\d*)*\Z')
                child_leaf_dict = {ndn:desc_leaf_dict[ndn] for ndn in desc_leaf_dict \
                                   if childdesc_regex.match(ndn)}
                #We determine the number of children of this node
                child_scens_num = sum(child_leaf_dict.values())
                last = first+child_scens_num - 1
                self.kids.append(_TreeNode(self, first, last, 
                                           child_leaf_dict, childname))
                first += child_scens_num
            if last != scenlast:
                print("numscens, last, scenlast", numscens, last, scenlast)
                raise RuntimeError(f"Tree node did not initialize correctly for node {name}")


    def stage_max(self):
        #Return the number of stages of a subtree.
        #Also check that all the subtrees have the same number of stages
        #i.e. that the leaves are always on the same stage. 
        if self.is_leaf:
            return 1
        else:
            l = [child.stage_max() for child in self.kids]
            if l.count(l[0]) != len(l):
                maxstage = max(l)+ self.stage
                minstage = min(l)+ self.stage
                raise RuntimeError("The all_nodenames argument is giving an inconsistent tree. "
                                   f"The node {self.name} has descendant leaves with stages going from {minstage} to {maxstage}")
            return 1+l[0]
            
                    

                
class _ScenTree():
    def __init__(self, all_nodenames, ScenNames):
        if all_nodenames is None:
            all_nodenames = ['ROOT'] #2 stage problem: no leaf nodes
        self.ScenNames = ScenNames
        self.NumScens = len(ScenNames)
        first = 0
        last = self.NumScens - 1
        desc_leaf_dict = find_leaves(all_nodenames)
        self.rootnode = _TreeNode(None, first, last, desc_leaf_dict, "ROOT")
        def _nonleaves(nd):
            if nd.is_leaf:
                return []
            else:
                retval = [nd]
                for child in nd.kids:
                    retval+=_nonleaves(child)
                return retval
        self.nonleaves = _nonleaves(self.rootnode)
        
        self.NumStages = \
            2 if all_nodenames == ['ROOT'] else self.rootnode.stage_max() 
        self.NonLeafTerminals = \
            [nd for nd in self.nonleaves if nd.stage == self.NumStages-1]
        
        self.NumLeaves = len(desc_leaf_dict) - len(self.nonleaves)
        if self.NumStages>2 and self.NumLeaves != self.NumScens:
            raise RuntimeError("The all_nodenames argument is giving an inconsistent tree."
                               f"There are {self.NumLeaves} leaves for this tree, but {self.NumScens} scenarios are given.")
    def scen_names_to_ranks(self, n_proc):
        """ 
        Args:
            n_proc: number of ranks in the cylinder (i.e., intra)

        Returns:
            scenario_names_to_rank (dict of dict):
                keys are comms (i.e., tree nodes); values are dicts with keys
                that are scenario names and values that are ranks within that comm
            slices (list of lists)
                indices correspond to ranks in self.mpicomm and the values are a list
                of scenario indices
                rank -> list of scenario indices for that rank
            list_of_ranks_per_scenario_idx (list)
                indices are scenario indices and values are the rank of that scenario
                within self.mpicomm
                scenario index -> rank

        NOTE:
            comm names are the same as the corresponding scenario tree node name

        """
        scenario_names_to_rank = dict()  # scenario_name_to_rank dict of dicts
        # one processor for the cylinder is a special case
        if n_proc == 1:
            for nd in self.nonleaves:
                scenario_names_to_rank[nd.name] = {s: 0 for s in self.ScenNames}
            return scenario_names_to_rank, [list(range(self.NumScens))], [0]*self.NumScens

        scen_count = len(self.ScenNames)
        avg = scen_count / n_proc

        # rank -> list of scenario indices for that rank
        slices = [list(range(int(i * avg), int((i + 1) * avg))) for i in range(n_proc)]

        # scenario index -> rank
        list_of_ranks_per_scenario_idx = [ rank for rank, scen_idxs in enumerate(slices) for _ in scen_idxs ]

        scenario_names_to_rank["ROOT"] = { s: rank for s,rank in zip(self.ScenNames, list_of_ranks_per_scenario_idx) }
         
        def _recurse_do_node(node):
            for child in node.kids:

                first_scen_idx = child.scenfirst
                last_scen_idx = child.scenlast

                ranks_in_node = list_of_ranks_per_scenario_idx[first_scen_idx:last_scen_idx+1]
                minimum_rank_in_node = ranks_in_node[0]

                # IMPORTANT:
                # this accords with the way SPBase.create_communicators assigns the "key" when
                # creating its comm for this node. E.g., the key is the existing rank, which
                # will then be offset by the minimum rank. As the ranks within each node are
                # contiguous, this is enough to infer the rank each scenario will have in this
                # node's comm
                within_comm_ranks_in_node = [(rank-minimum_rank_in_node) for rank in ranks_in_node]

                scenarios_in_nodes = self.ScenNames[first_scen_idx:last_scen_idx+1]

                scenario_names_to_rank[child.name] = { s : rank for s,rank in zip(scenarios_in_nodes, within_comm_ranks_in_node) }

                if child not in self.NonLeafTerminals:
                    _recurse_do_node(child)

        _recurse_do_node(self.rootnode)

        return scenario_names_to_rank, slices, list_of_ranks_per_scenario_idx
    
    
######## Utility to attach the one and only node to a two-stage scenario #######
def attach_root_node(model, firstobj, varlist, nonant_ef_suppl_list=None, do_uniform=True):
    """ Create a root node as a list to attach to a scenario model
    Args:
        model (ConcreteModel): model to which this will be attached
        firstobj (Pyomo Expression): First stage cost (e.g. model.FC)
        varlist (list): Pyomo Vars in first stage (e.g. [model.A, model.B])
        nonant_ef_suppl_list (list of pyo Var, Vardata or slices):
              vars for which nonanticipativity constraints tighten the EF
              (important for bundling)
        do_uniform (boolean): controls a side-effect to deal with missing probs

    Note: 
       attaches a list consisting of one scenario node to the model
    """
    model._mpisppy_node_list = [
        scenario_tree.ScenarioNode("ROOT", 1.0, 1, firstobj, varlist, model,
                                   nonant_ef_suppl_list = nonant_ef_suppl_list)
    ]
    if do_uniform:
        # Avoid a warning per scenario
        if not hasattr(model, "_mpisppy_probability"):
            model._mpisppy_probability = "uniform"
    

### utilities to check the slices and the map ###
def check4losses(numscens, branching_factors,
                 scenario_names_to_rank,slices,list_of_ranks_per_scenario_idx):
    """ Check the data structures; gag and die if it looks bad.
    Args:
        numscens (int): number of scenarios
        branching_factors (list of int): branching factors
        scenario_names_to_rank (dict of dict):
            keys are comms (i.e., tree nodes); values are dicts with keys
            that are scenario names and values that are ranks within that comm
        slices (list of lists)
            indices correspond to ranks in self.mpicomm and the values are a list
            of scenario indices
            rank -> list of scenario indices for that rank
        list_of_ranks_per_scenario_idx (list)
            indices are scenario indices and values are the rank of that scenario
            within self.mpicomm
            scenario index -> rank

    """

    present = [False for _ in range(numscens)]
    for rank, scenlist in enumerate(slices):
        for scen in scenlist:
            present[scen] = True
    missingsome = False
    for scen, there in enumerate(present):
        if not there:
            print(f"Scenario {scen} is not in slices")
            missingsome = True
    if missingsome:
        raise RuntimeError("Internal error: slices is not correct")

    # not stage presence...
    stagepresents = {stage: [False for _ in range(numscens)] for stage in range(len(branching_factors))}
    # loop over the entire structure, marking those found as present
    for nodename, scenlist in scenario_names_to_rank.items():
        stagenum = nodename.count('_')
        for s in scenlist:
            snum = int(s[8:])
            stagepresents[stagenum][snum] = True
    missingone = False
    for stage in stagepresents:
        for scen, there in enumerate(stagepresents[stage]):
            if not there:
                print(f"Scenario number {scen} missing from stage {stage}.")
                missingsome = True
    if missingsome:
        raise RuntimeError("Internal error: scenario_name_to_rank")
    print("check4losses: OK")

    
def disable_tictoc_output():
    f = open(os.devnull,"w")
    tt_timer._ostream = f

def reenable_tictoc_output():
    # Primarily to re-enable after a disable
    tt_timer._ostream.close()
    tt_timer._ostream = sys.stdout

    
def find_active_objective(pyomomodel):
    # return the only active objective or raise and error
    obj = list(pyomomodel.component_data_objects(
        Objective, active=True, descend_into=True))
    if len(obj) != 1:
        raise RuntimeError("Could not identify exactly one active "
                           "Objective for model '%s' (found %d objectives)"
                           % (pyomomodel.name, len(obj)))
    return obj[0]

def create_nodenames_from_branching_factors(BFS):
    """
    This function creates the node names of a tree without creating the whole tree.

    Parameters
    ----------
    BFS : list of integers
        Branching factors.

    Returns
    -------
    nodenames : list of str
        a list of the node names induced by branching_factors, including leaf nodes.

    """
    stage_nodes = ["ROOT"]
    nodenames = ['ROOT']
    if len(BFS)==1 : #2stage
        return(nodenames)
    for bf in BFS[:(len(BFS))]:
        old_stage_nodes = stage_nodes
        stage_nodes = []
        for k in range(len(old_stage_nodes)):
            stage_nodes += ['%s_%i'%(old_stage_nodes[k],b) for b in range(bf)]
        nodenames += stage_nodes
    return nodenames

def get_branching_factors_from_nodenames(all_nodenames):
    #WARNING: Do not work with unbalanced trees
    staget_node = "ROOT"
    branching_factors = []
    while staget_node+"_0" in all_nodenames:
        child_regex = re.compile(staget_node+'_\d*\Z')
        child_list = [x for x in all_nodenames if child_regex.match(x) ]
        
        branching_factors.append(len(child_list))
        staget_node += "_0"
    if len(branching_factors)==1:
        #2stage
        return None
    else:
        return branching_factors
    
def number_of_nodes(branching_factors):
    #How many nodes does a tree with a given branching_factors have ?
    last_node_stage_num = [i-1 for i in branching_factors]
    return node_idx(last_node_stage_num, branching_factors)
    

if __name__ == "__main__":
    branching_factors = [2,2,2,3]
    numscens = np.prod(branching_factors)
    scennames = ["Scenario"+str(i) for i in range(numscens)]
    testtree = _ScenTree(branching_factors, scennames)
    print("nonleaves:")
    for nd in testtree.nonleaves:
        print("   ", nd.name)
    print("NonLeafTerminals:")
    for nd in testtree.NonLeafTerminals:
        print("   ", nd.name)
    n_proc = 8
    sntr, slices, ranks_per_scenario = testtree.scen_names_to_ranks(n_proc)
    print("map:")
    for ndn,v in sntr.items():
        print(ndn, v)
    print(f"slices: {slices}")
    check4losses(numscens, branching_factors, sntr, slices, ranks_per_scenario)