#!/usr/bin/env python
# -*- coding: utf-8 -*-

"""
file  : LISTA_cp.py
author: Xiaohan Chen
email : chernxh@tamu.edu
last_modified : 2018-10-21

Implementation of Learned ISTA with weight coupling.
"""

import numpy as np
import tensorflow as tf

import utils.train
from models.LISTA_base import LISTA_base
from utils.tf import shrink_free, hard_shrink


class LISTA_cp(LISTA_base):
    """
    Implementation of learned ISTA with weight coupling constraint.
    """

    def __init__(self, A, T, lam, rho, beta, untied, coord, scope, train=True):
        """
        :prob:  : Instance of Problem class, describing problem settings.
        :T      : Number of layers (depth) of this LISTA model.
        :lam    : Initial value of thresholds of shrinkage functions.
        :untied : Whether weights are shared within layers.
        """
        self._A = A.astype(np.float32)
        self._T = T
        self._lam = lam
        self._M = self._A.shape[0]
        self._N = self._A.shape[1]
        self._rho = rho
        self._beta = beta
        self._train_sam = train
        self._scale = 1.001 * np.linalg.norm(A, ord=2) ** 2
        self._theta = (self._lam / self._scale).astype(np.float32)
        if coord:
            self._theta = np.ones((self._N, 1), dtype=np.float32) * self._theta

        self._untied = untied
        self._coord = coord
        self._scope = scope

        """ Set up layers."""
        self.setup_layers()

    def setup_layers(self):
        """
        Implementation of LISTA model proposed by LeCun in 2010.

        :prob: Problem setting.
        :T: Number of layers in LISTA.
        :returns:
            :layers: List of tuples ( name, xh_, var_list )
                :name: description of layers.
                :xh: estimation of sparse code at current layer.
                :var_list: list of variables to be trained seperately.

        """
        Ws_ = []
        thetas_ = []
        rhos_ = []

        W = (np.transpose(self._A) / self._scale).astype(np.float32)

        with tf.variable_scope(self._scope, reuse=False) as vs:
            # constant
            self._kA_ = tf.constant(value=self._A, dtype=tf.float32)

            if not self._untied:  # tied model
                Ws_.append(tf.get_variable(name="W", dtype=tf.float32, initializer=W))
                Ws_ = Ws_ * self._T

            for t in range(self._T):
                thetas_.append(
                    tf.get_variable(
                        name="theta_%d" % (t + 1),
                        dtype=tf.float32,
                        initializer=self._theta,
                    )
                )
                if self._untied:  # untied model
                    Ws_.append(
                        tf.get_variable(
                            name="W_%d" % (t + 1), dtype=tf.float32, initializer=W
                        )
                    )
                if self._train_sam:
                    rhos_.append(tf.get_variable(name="rho_%d"%(t+1),
                                                dtype=tf.float32,
                                                initializer=self._rho))
                

        # Collection of all trainable variables in the model layer by layer.
        # We name it as `vars_in_layer` because we will use it in the manner:
        # vars_in_layer [t]
        if self._train_sam:
            self.vars_in_layer = list(zip(Ws_, thetas_, rhos_))
        else:
            self.vars_in_layer = list(zip(Ws_, thetas_))

    def inference(self, y_, x0_=None):
        xhs_ = []  # collection of the regressed sparse codes

        if x0_ is None:
            batch_size = tf.shape(y_)[-1]
            xh_ = tf.zeros(shape=(self._N, batch_size), dtype=tf.float32)
        else:
            xh_ = x0_
        xhs_.append(xh_)
        g = None

        with tf.variable_scope(self._scope, reuse=True) as vs:
            for t in range(self._T):
                if self._train_sam:
                    W_, theta_, rho_ = self.vars_in_layer[t]
                else:
                    W_, theta_ = self.vars_in_layer[t]
                    rho_ = self._rho
                if g is None:
                    epsilon = rho_ * tf.zeros_like(xh_)
                else:
                    # mg = tf.where(tf.abs(xh_) > theta_, g, tf.zeros_like(g))
                    one_over_norm = 1. / tf.sqrt(tf.reduce_sum(xh_ * g, axis=0, keepdims=True) + 1e-20)
                    epsilon = rho_ * (xh_ * xh_ * g) * one_over_norm 
                zh_ = xh_ + epsilon

                res_ = y_ - tf.matmul(self._kA_, zh_)
                uh_ = xh_ + tf.matmul(W_, res_)
                xh_ = shrink_free(uh_ + epsilon, theta_) - epsilon
                g = uh_ - xh_
                xhs_.append(xh_)

        return xhs_
