import numpy as np
from .utils import generate_items

def get_best_reward(items, theta):
	return np.max(np.dot(items, theta))

def generate_subgaussian_noise(scale=0.05):
	return np.random.normal(loc=0, scale=scale)

class Environment:
	def __init__(self, L, d, m, num_users, p, theta):
		self.L = L
		self.d = d
		self.p = p
		self.items = generate_items(num_items = L, d = d)
		self.theta = theta

	def get_items(self):
		self.items = generate_items(num_items = self.L, d = self.d)
		return self.items

	def feedback(self, i, k):
		x = self.items[k, :]
		r = np.dot(self.theta[i], x)
		# y = np.random.binomial(1, r)  #0-1
		y = r + generate_subgaussian_noise()
		br = get_best_reward(self.items, self.theta[i])
		return y, r, br

	def test_feedback(self, i, k):
		x = self.items[k, :]
		r = np.dot(self.theta[i], x)
		# y = np.random.binomial(1, r)  #0-1
		y = r
		br = get_best_reward(self.items, self.theta[i])
		return y, r, br

	def generate_users(self):
		X = np.random.multinomial(1, self.p)
		I = np.nonzero(X)[0]
		return I
