import numpy as np

class MultiArmedBandits:
    def __init__(self, mu, var=0.3):
        self.mu = mu # mean rewards of bandits
        self.num_A = len(self.mu)
        self.var = var # variance of rewards

    def transit(self,A):
        '''
        A: chosen action; should be an integer
        '''
        r = self.mu[A] + np.random.normal(0,self.var) # add Gaussian noise 
        return r
    
class LinearBandits:
    def __init__(self,theta,phi,var=0.3):
        self.theta, self.phi, self.var = theta, phi, var
        self.mu = np.dot(self.phi,self.theta)

    def transit(self,A):
        '''
        A: chosen action; should be an integer
        '''
        r = self.mu[A] +  np.random.normal(0,self.var) # add Gaussian noise 
        return r