import tensorflow as tf

from rllab.core.serializable import Serializable

from rllab.misc.overrides import overrides
from sandbox.rocky.tf.policies.base import Policy


class NNPolicy(Policy, Serializable):
    def __init__(self, env_spec, observation_ph, actions,
                 scope_name=None):
        Serializable.quick_init(self, locals())

        self._observations_ph = observation_ph
        self._actions = actions
        self._scope_name = (
            tf.get_variable_scope().name if not scope_name else scope_name
        )
        super(NNPolicy, self).__init__(env_spec)

    @overrides
    def get_action(self, observation):
        """Sample single action based on the observations."""
        return self.get_actions(observation[None])[0], {}

    @overrides
    def get_actions(self, observations, currentdropoutpi=1.0, isbnpitrainmode=False):
        """Sample actions based on the observations."""
        feed_dict = {self._observations_ph: observations}
        if 'todropoutpi' in self.__dict__.keys() and self.todropoutpi:
            feed_dict[self.dropoutpi_placeholder] = currentdropoutpi
        if 'batchnormpi' in self.__dict__.keys() and self.batchnormpi:
            feed_dict[self.isbnpitrainmode] = isbnpitrainmode
        actions = tf.get_default_session().run(self._actions, feed_dict)
        return actions

    @overrides
    def log_diagnostics(self, paths):
        pass

    @overrides
    def get_params_internal(self, **tags):
        if tags:
            raise NotImplementedError
        scope = self._scope_name
        # Add "/" to 'scope' unless it's empty (otherwise get_collection will
        # return all parameters that start with 'scope'.
        scope = scope if scope == '' else scope + '/'
        return tf.get_collection(tf.GraphKeys.TRAINABLE_VARIABLES, scope)
