Source code for bnelearn.experiment.combinatorial_experiment

"""
This module implements combinatorial experiments. Currently, this is only Local Global experiments as
considered by Bosshard et al. (2018).

Limitations and comments:
    - Currently implemented for only uniform valuations
    - Strictly speaking Split Award might belong here (however, implementation closer to multi-unit)
    
"""
import os
from abc import ABC
from functools import partial
from typing import Iterable, List
import math

from scipy import optimize
from tqdm import tqdm
import numpy as np
from torch.utils.tensorboard import SummaryWriter
import torch

from bnelearn.mechanism import (
    LLGAuction, LLGFullAuction, LLLLGGAuction, LLLLRRGAuction
)
from bnelearn.bidder import Bidder, CombinatorialBidder

from bnelearn.environment import AuctionEnvironment
from bnelearn.experiment.configurations import ExperimentConfig
from bnelearn.experiment.equilibria import truthful_bid
from bnelearn.experiment import Experiment
from bnelearn.strategy import ClosureStrategy

import bnelearn.util.logging as logging_utils
from bnelearn.sampler import LLGSampler, LLGFullSampler, LLLLGGSampler, LLLLRRGSampler

# maps config correlation_types to LocalGlobalSampler correlation_method arguments
CORRELATION_METHODS = {
        'Bernoulli_weights': 'Bernoulli',
        'constant_weights': 'constant',
        'independent': None
    }

[docs]class LocalGlobalExperiment(Experiment, ABC):
    """
    This class represents Local Global experiments in general as considered by Bosshard et al. (2018).
    It serves only to provide common logic and parameters for LLG and LLLLGG.
    """

    def __init__(self, config: ExperimentConfig,
                 n_players, n_local, valuation_size, observation_size, action_size):
        self.config = config

        # provided by subclass constructors
        self.n_players = n_players
        self.n_local = n_local
        self.valuation_size = valuation_size
        self.observation_size = observation_size
        self.action_size = action_size

        self.risk = float(config.setting.risk)

        self._set_valuation_bounds()

        self.positive_output_point = torch.tensor([min(self.u_hi)] * self.observation_size)

        self.model_sharing = self.config.learning.model_sharing
        if self.model_sharing:
            self.n_models = 2
            self._bidder2model: List[int] = \
                [0] * self.n_local + [1] * (self.n_players - self.n_local)
        else:
            self.n_models = self.n_players
            self._bidder2model: List[int] = list(range(self.n_players))

        super().__init__(config=config)

        self.plot_xmin = min(self.u_lo)
        self.plot_xmax = max(self.u_hi)
        self.plot_ymin = self.plot_xmin
        self.plot_ymax = self.plot_xmax * 1.05

    def _set_valuation_bounds(self):
        """Validates input for uniform valuation bounds and converts
        them to required type List[float] if necessary.
        """
        assert self.config.setting.u_lo is not None, """Missing prior information!"""
        assert self.config.setting.u_hi is not None, """Missing prior information!"""
        u_lo = self.config.setting.u_lo
        # Frontend could either provide single number u_lo that is shared or a list for each player.
        if isinstance(u_lo, Iterable): # pylint: disable=isinstance-second-argument-not-valid-type
            assert len(u_lo) == self.n_players
            u_lo = [float(l) for l in u_lo]
        else:
            u_lo = [float(u_lo)] * self.n_players
        self.u_lo = u_lo

        u_hi = self.config.setting.u_hi
        assert isinstance(u_hi, Iterable) # pylint: disable=isinstance-second-argument-not-valid-type
        assert len(u_hi) == self.n_players
        assert u_hi[1:self.n_local] == \
               u_hi[:self.n_local - 1], "local bidders should be identical"
        assert u_hi[0] < \
               u_hi[self.n_local], "local bidders must be weaker than global bidder"
        self.u_hi = [float(h) for h in u_hi]

    def _get_model_names(self):
        if self.model_sharing:
            global_name = 'global' if self.n_players - self.n_local == 1 else 'globals'
            return ['locals', global_name]
        else:
            return super()._get_model_names()

    def _strat_to_bidder(self, strategy, batch_size, player_position=0,
                         enable_action_caching=False):
        return Bidder(strategy, player_position=player_position, batch_size=batch_size,
                      valuation_size=self.valuation_size, observation_size=self.observation_size,
                      bid_size=self.action_size, risk=self.risk, enable_action_caching=False)


[docs]class LLGExperiment(LocalGlobalExperiment):
    """
    A combinatorial experiment with 2 local and 1 global bidder and 2 items; but each bidders bids on 1 bundle only.
    Local bidder 1 bids only on the first item, the second only on the second and global only on both.
    Ausubel and Baranov (2018) provide closed form solutions for the 3 core selecting rules.

    Supports arbitrary number of local bidders, not just two.
    """

    def __init__(self, config: ExperimentConfig):
        self.config = config

        assert config.setting.n_players == 3, "invalid n_players for LLG"

        self.gamma = self.correlation = float(config.setting.gamma)

        super().__init__(config=config,
                         n_players=3, n_local= 2,
                         valuation_size=1, observation_size=1, action_size=1)

    def _setup_sampler(self):

        default_batch_size = self.config.learning.batch_size
        default_device = self.config.hardware.device

        if not (self.config.setting.u_lo == [0,0,0] and
                self.config.setting.u_hi == [1,1,2]):
            raise NotImplementedError("LLG Sampler only implemented for default valuation bounds!")


        method = CORRELATION_METHODS[self.config.setting.correlation_types]

        self.sampler = LLGSampler(correlation = self.gamma,
                                  correlation_method=method,
                                  default_batch_size=default_batch_size,
                                  default_device=default_device)

    def _setup_mechanism(self):
        self.mechanism = LLGAuction(rule=self.payment_rule)

    def _optimal_bid(self, valuation, player_position): # pylint: disable=method-hidden
        """Core selecting and vcg equilibria for the Bernoulli weights model in Ausubel & Baranov (2019)

           Note: for gamma=0 or gamma=1, these are identical to the constant weights model.
        """
        if not isinstance(valuation, torch.Tensor):
            valuation = torch.tensor(valuation)

        ### Global bidder: all core-selecting rules are strategy proof for global player
        if self.payment_rule in ['vcg', 'proxy', 'nearest_zero', 'nearest_bid',
                                 'nearest_vcg'] and player_position == self.n_players - 1:
            return valuation

        ### Local bidders: vcg => truthfull bidding
        if self.payment_rule in ['vcg'] and player_position in list(range(self.n_players - 1)):
            return valuation

        assert self.risk == 1.0, 'BNE known for risk-neutral only (or in VCG)'

        ### Local bidders:
        if self.config.setting.correlation_types in ['Bernoulli_weights', 'independent'] or \
            (self.config.setting.correlation_types == 'constant_weights' and self.gamma in [0, 1]):
            ## perfect correlation
            if self.gamma == 1.0: # limit case, others not well defined
                sigma = 1.0 # TODO: implement for other valuation profiles!
                bid = valuation
                if self.payment_rule == 'nearest_vcg':
                    bid.mul_(sigma / (1 + sigma - 2**(-sigma)))
                elif self.payment_rule == 'nearest_bid':
                    bid.mul_(sigma / (1 + sigma))
                # truthful for vcg and proxy/nearest-zero
                return bid
            ## no or imperfect correlation
            if self.payment_rule in ['proxy', 'nearest_zero']:
                bid_if_positive = 1 + torch.log(valuation * (1.0 - self.gamma) + self.gamma) / (1.0 - self.gamma)
                return torch.max(torch.zeros_like(valuation), bid_if_positive)
            if self.payment_rule == 'nearest_bid':
                return (np.log(2) - torch.log(2.0 - (1. - self.gamma) * valuation)) / (1. - self.gamma)
            if self.payment_rule == 'nearest_vcg':
                bid_if_positive = 2. / (2. + self.gamma) * (
                    valuation - (3. - np.sqrt(9 - (1. - self.gamma) ** 2)) / (1. - self.gamma))
                return torch.max(torch.zeros_like(valuation), bid_if_positive)
            raise NotImplementedError('Optimal bid not implemented for this payment rule.')
        else:
            raise NotImplementedError('Optimal bid not implemented for this correlation type.')

        self.known_bne = False

    def _check_and_set_known_bne(self):
        # TODO: This is not exhaustive, other criteria must be fulfilled for the bne to be known!
        #  (i.e. uniformity, bounds, etc)

        if self.config.setting.payment_rule == 'vcg' \
            or (self.config.setting.payment_rule in ['nearest_bid', 'nearest_zero', 'proxy', 'nearest_vcg']
                and (self.config.setting.correlation_types in ['Bernoulli_weights', 'independent']
                    or (self.config.setting.correlation_types == 'constant_weights'
                        and self.gamma in [0, 1])) and self.risk == 1.0):
            return True

        known_bne = super()._check_and_set_known_bne()
        if not known_bne:
            self.logging.log_metrics['l2'] = False
            self.logging.log_metrics['opt'] = False

        return known_bne

    def _setup_eval_environment(self):

        assert self.known_bne
        assert hasattr(self, '_optimal_bid')

        bne_strategies = [
            ClosureStrategy(partial(self._optimal_bid, player_position=i))  # pylint: disable=no-member
            for i in range(self.n_players)]

        bne_env = AuctionEnvironment(
            mechanism=self.mechanism,
            agents=[self._strat_to_bidder(bne_strategies[i], player_position=i,
                                          batch_size=self.config.logging.eval_batch_size,
                                          enable_action_caching=self.config.logging.cache_eval_actions)
                    for i in range(self.n_players)],
            valuation_observation_sampler=self.sampler,
            n_players=self.n_players,
            batch_size=self.config.logging.eval_batch_size,
            strategy_to_player_closure=self._strat_to_bidder
        )

        self.bne_env = bne_env

        db_batch_size, db_bne_utility = logging_utils.read_bne_utility_database(self)

        # Found higher precision db entry
        if db_batch_size >= self.config.logging.eval_batch_size:
            print(f"BNE utility is estimated on larger batch of size {db_batch_size}.")
            self.bne_utilities = db_bne_utility
        else:
            self.bne_utilities = torch.tensor(
                [bne_env.get_reward(a, redraw_valuations=True) for a in bne_env.agents])
            logging_utils.write_bne_utility_database(self, self.bne_utilities)

        print(f'Setting up BNE env with batch size 2**{np.log2(self.config.logging.eval_batch_size)}.')
        print(('Utilities in BNE (sampled):' + '\t{:.5f}' * self.n_players + '.').format(*self.bne_utilities))
        print("No closed form solution for BNE utilities available in this setting. Using sampled value as baseline.")

    def _get_logdir_hierarchy(self):
        name = [self.n_local * 'L' + 'G', self.payment_rule]
        if self.gamma > 0:
            name += [self.config.setting.correlation_types, f"gamma_{self.gamma:.3}"]
        else:
            name += ['independent']
        if self.risk != 1.0:
            name += [f'risk_{self.risk}']
        return os.path.join(*name)


[docs]class LLGFullExperiment(LocalGlobalExperiment):
    """A combinatorial experiment with 2 local and 1 global bidder and 2 items.

    Essentially, this is a general CA with 3 bidders and 2 items.

    Each bidder bids on all bundles. Local bidder 1 has only a value for the
    first item, the second only for the second and global only on both. This
    experiment is therefore more general than the `LLGExperiment` and includes
    the specific payment rule from Beck & Ott, where the 2nd local bidder is
    favored (pays VCG prices).
    """
    def __init__(self, config: ExperimentConfig):
        self.config = config
        assert self.config.setting.n_players == 3, \
            "Incorrect number of players specified."

        self.gamma = self.correlation = float(config.setting.gamma)
        if config.setting.correlation_types not in ['independent', None] or \
            self.gamma > 0.0:
            # Should be similar to reduced LLG setting, but we have to consider
            # asymmetry of local bidders.
            raise NotImplementedError('Correlation not implemented.')

        super().__init__(config=config, n_players=3, n_local=2,
                         valuation_size=1, observation_size=1, action_size=3)

    def _setup_mechanism(self):
        self.mechanism = LLGFullAuction(
            rule=self.payment_rule,
            cuda=self.hardware.device
        )

    def _setup_sampler(self):

        default_batch_size = self.config.learning.batch_size
        default_device = self.config.hardware.device

        if not (self.config.setting.u_lo == [0, 0, 0] and
                self.config.setting.u_hi == [1, 1, 2]):
            raise NotImplementedError("LLG Sampler only implemented for default valuation bounds!")

        method = CORRELATION_METHODS[self.config.setting.correlation_types]

        self.sampler = LLGFullSampler(correlation=self.gamma,
                                      correlation_method=method,
                                      default_batch_size=default_batch_size,
                                      default_device=default_device)

    def _check_and_set_known_bne(self):
        if self.payment_rule == 'vcg':
            return True
        if self.payment_rule == 'mrcs_favored' \
            and self.config.setting.correlation_types in ['independent', None]:
            return True
        return super()._check_and_set_known_bne()

    def _optimal_bid(self, valuation, player_position):  # pylint: disable=method-hidden
        """Equilibrium bid functions.

        Payment rule `mrcs_favored` is from Beck & Ott (minimum revenue core
        selecting with one player favored).
        """
        if not isinstance(valuation, torch.Tensor):
            valuation = torch.as_tensor(valuation, device=self.config.hardware.device)

        assert self.risk == 1.0, 'BNE known for risk-neutral only (or in VCG)'

        if self.payment_rule in ['vcg', 'mrcs_favored']:
            if player_position == 1:
                return torch.cat([
                    torch.zeros_like(valuation),  # item A
                    valuation,                    # item B
                    valuation], axis=1)           # bundle {A, B}
            if player_position == 2:
                return torch.cat([
                    torch.zeros_like(valuation),
                    torch.zeros_like(valuation),
                    valuation], axis=1)

        ### Favored bidder 1:
        if self.config.setting.correlation_types in ['independent', None] and player_position == 0:
            if self.payment_rule == 'vcg':
                return torch.cat([
                    valuation,
                    torch.zeros_like(valuation),
                    valuation], axis=1)
            if self.payment_rule == 'mrcs_favored':
                # Beck & Ott provide incomplete/wrong solution
                print('Calculating high-precision BNE...')
                eps = 1e-16

                v = valuation.cpu().numpy().astype('float64')
                def root_func(z, v):
                    """We're looking for roots of this function"""
                    return 12*v - 15*z - 1 + (9*z - 1 - 3*v) * np.sqrt(1 - 6*z + 6*v)
                def solve_for_z(v):
                    """Brent-q for finding root"""
                    f = lambda z: root_func(z, v=v)
                    low = max((1 - np.sqrt(6*v - 2))/3., v - .5) + eps
                    up = (1 + 6*v) / 6. - eps
                    if np.sign(f(low)) == np.sign(f(up)):
                        return 0
                    z = optimize.brentq(f, a=low, b=up, xtol=1e-13, disp=False)
                    return z

                threshold = 2 - 2 * math.sqrt(6.) / 3.
                z = np.zeros_like(v)
                for i, vv in tqdm(enumerate(v), total=v.shape[0]):
                    if threshold < vv:
                        z[i] = solve_for_z(vv)
                z = torch.as_tensor(
                    z, device=valuation.device, dtype=valuation.dtype
                )

                v = torch.as_tensor(
                    valuation, device=valuation.device, dtype=valuation.dtype
                )
                b_A = torch.zeros_like(v)
                mask = threshold < v
                b_A[mask] = z[mask] \
                    - (2 - torch.sqrt(1 - 6 * z[mask] + 6 * v[mask])) \
                    / 3.
                b_AB = 0.5 * v.detach().clone()
                b_AB[mask] = z[mask]
                bids = torch.cat([b_A, torch.zeros_like(v), b_AB], axis=1)
                bids[bids < 0] = 0  # b_A is somewhat inprecise
                return bids

            raise NotImplementedError('Optimal bid not implemented for this payment rule.')
        else:
            raise NotImplementedError('Optimal bid not implemented for this correlation type.')

[docs]    def pretrain_transform(self, player_position: int) -> callable:
        """Transformation during pretraining: Bidders are single-minded in this
        setting.
        """
        return lambda x: torch.tensor(
            [[1, 0, 1], [0, 1, 1], [0, 0, 1]],
            device=self.config.hardware.device,
            dtype=torch.bool
        )[player_position] * x

    def _setup_eval_environment(self):
        assert self.known_bne
        assert hasattr(self, '_optimal_bid')

        bne_strategies = [
            ClosureStrategy(partial(self._optimal_bid, player_position=i))  # pylint: disable=no-member
            for i in range(self.n_players)]

        self.known_bne = True
        self.bne_env = AuctionEnvironment(
            mechanism=self.mechanism,
            agents=[self._strat_to_bidder(bne_strategies[i], player_position=i,
                                          batch_size=self.config.logging.eval_batch_size,
                                          enable_action_caching=self.config.logging.cache_eval_actions)
                    for i in range(self.n_players)],
            valuation_observation_sampler=self.sampler,
            n_players=self.n_players,
            batch_size=self.config.logging.eval_batch_size,
            strategy_to_player_closure=self._strat_to_bidder
        )
        self.bne_utilities = torch.tensor(
            [self.bne_env.get_reward(a, redraw_valuations=True) for a in self.bne_env.agents])

        # Compare estimated util to that of Beck & Ott table 2
        if self.payment_rule == 'mrcs_favored':
            max_diff_to_estimate = float(max(
                torch.abs(self.bne_utilities - torch.tensor([0.154, 0.093, 0.418]))
            ))
            print(f'Max difference to BNE estimate is {round(max_diff_to_estimate, 4)}.')

    def _get_logdir_hierarchy(self):
        name = ['LLGFull', self.payment_rule]
        if self.gamma > 0:
            name += [self.config.setting.correlation_types,
                     f"gamma_{self.gamma:.3}"]
        else:
            name += ['independent']
        if self.risk != 1.0:
            name += [f'risk_{self.risk}']
        return os.path.join(*name)

    def _get_model_names(self):
        return ['local 1', 'local 2', 'global']

    def _strat_to_bidder(self, strategy, batch_size, player_position=0,
                         enable_action_caching=False):
        return CombinatorialBidder(
            strategy=strategy,
            player_position=player_position,
            batch_size=batch_size,
            valuation_size=self.valuation_size,
            observation_size=self.observation_size,
            bid_size=3,
            risk=self.risk,
            enable_action_caching=enable_action_caching
        )

    def _plot(self, **kwargs):  # pylint: disable=arguments-differ
        kwargs['x_label'] = ['item A', 'item B', 'bundle']

        if 'labels' not in kwargs.keys():
            kwargs['labels'] = self._get_model_names()

        # handle dim-missmatch that agents only value 1 bundle but bid for 3
        plot_data = list(kwargs['plot_data'])
        if plot_data[0].shape != plot_data[1].shape:
            plot_data[0] = plot_data[0].repeat(1, 1, self.action_size)
            kwargs['plot_data'] = plot_data

        super()._plot(**kwargs)


[docs]class LLLLGGExperiment(LocalGlobalExperiment):
    """
    A combinatorial experiment with 4 local and 2 global bidder and 6 items; but each bidders bids on 2 bundles only.
        Local bidder 1 bids on the bundles {(item_1,item_2),(item_2,item_3)}
        Local bidder 2 bids on the bundles {(item_3,item_4),(item_4,item_5)}
        ...
        Gloabl bidder 1 bids on the bundles {(item_1,item_2,item_3,item_4), (item_5,item_6,item_7,item_8)}
        Gloabl bidder 1 bids on the bundles {(item_3,item_4,item_5,item_6), (item_1,item_2,item_7,item_8)}
    No BNE are known (but VCG).
    Bosshard et al. (2018) consider this setting with nearest-vcg and first-price payments.

    TODO:
        - Implement eval_env for VCG
    """

    def __init__(self, config: ExperimentConfig):
        self.config = config
        assert self.config.setting.n_players == 6, "not right number of players for setting"

        super().__init__(config=config,
                         n_players=6, n_local=4,
                         valuation_size=2, observation_size=2, action_size=2)

    def _setup_sampler(self):
        default_batch_size = self.config.learning.batch_size
        default_device = self.config.hardware.device

        if not (self.config.setting.u_lo == [0,0,0,0,0,0] and
                self.config.setting.u_hi == [1,1,1,1,2,2]):
            raise NotImplementedError("LLG Sampler only implemented for default valuation bounds!")

        gammas = self.config.setting.correlation_coefficients
        assert gammas is None or gammas[1] == 0.0, \
            "correlation between global players not implemented."
        local_gamma = 0.0
        local_corr_method = None
        if gammas:
            local_gamma = gammas[0]
            local_corr_method = CORRELATION_METHODS[self.config.setting.correlation_types[0]]

        self.sampler = LLLLGGSampler(
            correlation_locals=local_gamma,
            correlation_method_locals=local_corr_method,
            default_batch_size=default_batch_size,
            default_device=default_device)

    def _setup_mechanism(self):
        self.mechanism = LLLLGGAuction(rule=self.payment_rule, core_solver=self.setting.core_solver,
                                       parallel=self.hardware.max_cpu_threads, cuda=self.hardware.cuda)

    def _get_logdir_hierarchy(self):
        name = ['LLLLGG', self.payment_rule, str(self.n_players) + 'p']
        return os.path.join(*name)

    def _plot(self, plot_data, writer: SummaryWriter or None, fmts=['o'], **kwargs):
        super()._plot(plot_data=plot_data, writer=writer, fmts=fmts, **kwargs)
        super()._plot_3d(plot_data=plot_data, writer=writer,
                         figure_name=kwargs['figure_name'])


[docs]class LLLLRRGExperiment(Experiment):
    """Experiment in an extension of the Local-Global Model with three groups of bidders."""

    def __init__(self, config: ExperimentConfig):
        self.config = config

        # provided by subclass constructors
        self.n_players = 7
        assert self.config.setting.n_players == 7, "incorrect number of players supplied."

        self.n_local = 4
        self.n_regional = 2
        self.n_global = 1
        self.valuation_size = 2
        self.observation_size = 2
        self.action_size = 2

        self.risk = float(config.setting.risk)

        self._set_valuation_bounds()

        self.positive_output_point = torch.tensor([min(self.u_hi)] * self.observation_size)

        self.model_sharing = self.config.learning.model_sharing
        if self.model_sharing:
            self.n_models = 3
            self._bidder2model: List[int] = \
                [0] * self.n_local + [1] * self.n_regional + [2] * self.n_global
        else:
            self.n_models = self.n_players
            self._bidder2model: List[int] = list(range(self.n_players))

        super().__init__(config=config)

        self.plot_xmin = min(self.u_lo)
        self.plot_xmax = max(self.u_hi)
        self.plot_ymin = self.plot_xmin
        self.plot_ymax = self.plot_xmax * 1.05

    def _setup_sampler(self):
        default_batch_size = self.config.learning.batch_size
        default_device = self.config.hardware.device

        gammas = self.config.setting.correlation_coefficients
        assert gammas is None or gammas[2] == 0.0
        local_gamma, regional_gamma = 0.0, 0.0
        local_corr_method, regional_corr_method = None, None
        if gammas:
            local_gamma = gammas[0]
            regional_gamma = gammas[1]
            local_corr_method = CORRELATION_METHODS[self.config.setting.correlation_types[0]]
            regional_corr_method = CORRELATION_METHODS[self.config.setting.correlation_types[1]]

        self.sampler = LLLLRRGSampler(local_gamma, local_corr_method,
                                      regional_gamma, regional_corr_method,
                                      default_batch_size, default_device)

    def _setup_mechanism(self):
        self.mechanism = LLLLRRGAuction(rule = 'first_price', core_solver = self.setting.core_solver,
                                        parallel = self.hardware.max_cpu_threads, cuda = self.hardware.cuda)

    def _get_logdir_hierarchy(self):
        name = ['LLLLRRG', self.payment_rule, str(self.n_players) + 'p']
        return os.path.join(*name)

    def _plot(self, plot_data, writer: SummaryWriter or None, epoch = None, fmts=['o'], **kwargs):
        super()._plot(plot_data=plot_data, writer = writer, fmts=fmts, **kwargs)
        # TODO: 3d plot for LLLLRRG broken because 2nd dim of global player is singular (always 0.0).
        #super()._plot_3d(plot_data = plot_data, writer = writer, epoch=epoch,
        #                 figure_name=kwargs['figure_name'])

    def _set_valuation_bounds(self):
        """Validates input for uniform valuation bounds and converts
        them to required type List[float] if necessary.
        """
        assert self.config.setting.u_lo is not None, """Missing prior information!"""
        assert self.config.setting.u_hi is not None, """Missing prior information!"""
        u_lo = self.config.setting.u_lo
        # Frontend could either provide single number u_lo that is shared or a list for each player.
        if isinstance(u_lo, Iterable): # pylint: disable=isinstance-second-argument-not-valid-type
            assert len(u_lo) == self.n_players
            u_lo = [float(l) for l in u_lo]
        else:
            u_lo = [float(u_lo)] * self.n_players
        self.u_lo = u_lo

        u_hi = self.config.setting.u_hi
        assert isinstance(u_hi, Iterable) # pylint: disable=isinstance-second-argument-not-valid-type
        assert len(u_hi) == self.n_players
        assert u_hi[1:self.n_local] == \
               u_hi[:self.n_local - 1], "local bidders should be identical"
        assert u_hi[self.n_local : self.n_local + self.n_regional - 1] == \
               u_hi[self.n_local+1 : self.n_local + self.n_regional], "regional bidders should be identical"
        assert u_hi[0] < u_hi[self.n_local], "local bidders must be weaker than regional bidders"
        assert u_hi[self.n_local] < u_hi[self.n_local + self.n_regional], "regional bidders must be weaker than global bidders"
        self.u_hi = [float(h) for h in u_hi]

    def _get_model_names(self):
        if self.model_sharing:
            global_name = 'global' if self.n_players - self.n_local - self.n_regional == 1 else 'globals'
            return ['locals', 'regionals', global_name]
        else:
            return super()._get_model_names()

    def _strat_to_bidder(self, strategy, batch_size, player_position=0, enable_action_caching=False):
        return Bidder(strategy, player_position=player_position, batch_size=batch_size,
                      valuation_size=self.valuation_size, observation_size=self.observation_size,
                      bid_size=self.action_size,
                      risk=self.risk, enable_action_caching=enable_action_caching)