Source code for Environment.ResultMultiPlayers

# -*- coding: utf-8 -*-
""" ResultMultiPlayers.ResultMultiPlayers class to wrap the simulation results, for the multi-players case."""
from __future__ import division, print_function  # Python 2 compatibility

__author__ = "Lilian Besson"
__version__ = "0.9"

import numpy as np


[docs]class ResultMultiPlayers(object):
    """ ResultMultiPlayers accumulators, for the multi-players case. """

    # , delta_t_save=1
[docs]    def __init__(self, nbArms, horizon, nbPlayers, means=None):
        """ Create ResultMultiPlayers."""
        # self._means = means  # Keep the means for ChangingAtEachRepMAB cases
        self.choices = np.zeros((nbPlayers, horizon), dtype=int)  #: Store all the choices of all the players
        self.rewards = np.zeros((nbPlayers, horizon))  #: Store all the rewards of all the players, to compute the mean
        # self.rewardsSquared = np.zeros((nbPlayers, horizon))  #: Store all the rewards**2 of all the players, to compute the variance  # XXX uncomment if needed
        self.pulls = np.zeros((nbPlayers, nbArms), dtype=int)  #: Store the pulls of all the players
        self.allPulls = np.zeros((nbPlayers, nbArms, horizon), dtype=int)  #: Store all the pulls of all the players
        self.collisions = np.zeros((nbArms, horizon), dtype=int)  #: Store the collisions on all the arms
        self.running_time = -1  #: Store the running time of the experiment
        self.memory_consumption = -1  #: Store the memory consumption of the experiment

[docs]    def store(self, time, choices, rewards, pulls, collisions):
        """ Store results."""
        self.choices[:, time] = choices
        self.rewards[:, time] = rewards
        # self.rewardsSquared[:, time] = rewards ** 2  # XXX uncomment if needed
        self.pulls += pulls
        self.allPulls[:, :, time] = pulls
        self.collisions[:, time] = collisions