import numpy as np


HORIZON = 20000  # default time horizon of every generated problem
NB_SEGS = 5  # default number of stationary segments per problem
NUM_OF_INSTANCE = 100  # default number of random problem instances
REPETITIONS = 50  # default for the ``repetitions`` constructor argument
MAX_NB_ARMS = 10  # default number of arm means drawn for each segment


class Regret_versus_K(object):
    """Collection of randomly generated piece-wise stationary problems.

    After construction, ``self.ENVIRONMENTS`` is a list holding one
    configuration dict per instance, each of the form::

        {
            "env_type": "Others",
            "params": {
                "listOfMeans": [[mean_arm_0, ..., mean_arm_{A-1}], ...],
                "changePoints": [0, ...],
            },
        }

    ``listOfMeans`` has ``nb_segs`` rows of ``max_nb_arms`` floats, each
    drawn with ``np.random.rand()`` (uniform on [0, 1), NumPy's global
    random state).  ``changePoints`` holds ``int(m * horizon / nb_segs)``
    for ``m = 0 .. nb_segs - 1``, so its first entry is always 0.

    Args:
        horizon: Total number of time steps, split evenly into segments.
        nb_segs: Number of stationary segments per problem.
        nb_of_instances: Number of random problems to generate.
        repetitions: Accepted for interface compatibility; the
            constructor neither reads nor stores it.
        max_nb_arms: Number of means drawn for every segment.
    """

    def __init__(self, horizon=HORIZON, nb_segs=NB_SEGS,
                 nb_of_instances=NUM_OF_INSTANCE, repetitions=REPETITIONS,
                 max_nb_arms=MAX_NB_ARMS):
        # The change points depend only on (horizon, nb_segs), so they are
        # computed once instead of once per instance.
        change_points = [int(seg * horizon / nb_segs) for seg in range(nb_segs)]

        self.ENVIRONMENTS = []
        for _instance in range(nb_of_instances):
            # Draw order (segment-major, then arm) is kept so that a seeded
            # global NumPy state yields the same problems as before.
            list_of_means = [
                [np.random.rand() for _arm in range(max_nb_arms)]
                for _seg in range(nb_segs)
            ]
            self.ENVIRONMENTS.append({
                # "Type-I" = 2 arm switch,
                # "Type-II" = 1 arm switch 1 arm constant, "Others"
                "env_type": "Others",
                "params": {
                    "listOfMeans": list_of_means,
                    # Each environment gets its own list so that mutating
                    # one entry cannot leak into the others.
                    "changePoints": list(change_points),
                },
            })
