import numpy as np
import tensorflow as tf

def get_vars(scope_name):
	vars = tf.get_collection(tf.GraphKeys.TRAINABLE_VARIABLES, scope=scope_name)
	assert len(vars) > 0
	return vars

def get_reg_loss(scope_name):
	return tf.reduce_mean(tf.get_collection(tf.GraphKeys.REGULARIZATION_LOSSES, scope=scope_name))

class RandomNormal:
	def __init__(self, mean, logstd):
		self.raw_logstd = logstd
		if len(mean.get_shape().as_list()) > len(logstd.get_shape().as_list()):
			logstd = mean*0.0 + logstd
		self.mean = mean
		self.logstd = logstd
		self.std = tf.maximum(tf.exp(logstd),1e-2)

	def log_p(self, x):
		return tf.reduce_sum(
			-0.5*np.log(2.0*np.pi)-self.logstd-0.5*tf.square((x-self.mean)/self.std),
			axis=-1, keepdims=True
		)

	def entropy(self):
		return tf.reduce_sum(self.logstd+0.5*np.log(2.0*np.pi*np.e), axis=-1, keepdims=True)

	def kl(self, other):
		return tf.reduce_sum(
			-0.5+other.logstd-self.logstd
			+0.5*tf.square(self.std/other.std)
			+0.5*tf.square((self.mean-other.mean)/other.std),
			axis=-1, keepdims=True
		)

class Normalizer:
	def __init__(self, shape, sess, eps_std=1e-2, norm_clip=5.0):
		self.shape = shape
		self.sess = sess
		self.eps_std = eps_std
		self.norm_clip = norm_clip

		with tf.variable_scope('normalizer_variables', initializer=tf.zeros_initializer()):
			self.sum = tf.get_variable(name='sum', shape=self.shape, dtype=np.float32, trainable=False)
			self.sum_sqr = tf.get_variable(name='sum_sqr', shape=self.shape, dtype=np.float32, trainable=False)
			self.cnt = tf.get_variable(name='cnt', shape=[1], dtype=np.float32, trainable=False)
			self.mean = tf.get_variable(name='mean', shape=self.shape, dtype=np.float32, trainable=False)
			self.std = tf.get_variable(name='std', shape=self.shape, dtype=np.float32, trainable=False)

		self.add_sum = tf.placeholder(tf.float32, self.shape)
		self.add_sum_sqr = tf.placeholder(tf.float32, self.shape)
		self.add_cnt = tf.placeholder(tf.float32, [1])

		self.update_array_op = tf.group(
			self.sum.assign_add(self.add_sum),
			self.sum_sqr.assign_add(self.add_sum_sqr),
			self.cnt.assign_add(self.add_cnt)
		)
		self.update_scalar_op = tf.group(
			self.mean.assign(self.sum/self.cnt),
			self.std.assign(tf.maximum(self.eps_std, tf.sqrt(self.sum_sqr/self.cnt-tf.square(self.sum/self.cnt))))
		)

	def get_mean(self): return self.sess.run(self.mean)
	def get_std(self): return self.sess.run(self.std)

	def normalize(self, inputs_ph):
		return tf.clip_by_value((inputs_ph-self.mean)/self.std, -self.norm_clip, self.norm_clip)

	def normalize_prefix(self, inputs_ph):
		dim = int(inputs_ph.get_shape()[-1])
		return tf.clip_by_value((inputs_ph-self.mean[:dim])/self.std[:dim], -self.norm_clip, self.norm_clip)

	def normalize_suffix(self, inputs_ph):
		dim = int(inputs_ph.get_shape()[-1])
		return tf.clip_by_value((inputs_ph-self.mean[-dim:])/self.std[-dim:], -self.norm_clip, self.norm_clip)

	def update(self, inputs):
		feed_dict = {
			self.add_sum: np.sum(inputs, axis=0),
			self.add_sum_sqr: np.sum(np.square(inputs), axis=0),
			self.add_cnt: [inputs.shape[0]]
		}
		self.sess.run(self.update_array_op, feed_dict)
		self.sess.run(self.update_scalar_op)

	def fetch_debug(self):
		mean, std = self.sess.run([self.mean, self.std])
		print('mean:', np.absolute(mean[:3]-mean[-3:]))
		print('std:', np.absolute(std[:3]-std[-3:]))
