from scipy.signal import hilbert, chirp
from tqdm import tqdm
import os
import h5py
import numpy as np
import pandas as pd
import scipy.stats
# import numpy.typing as npt

from typing import Optional, List, Tuple
from .trial_data import TrialData
from scipy import signal, stats
from .utils import compute_m5_hash

class H5DataReader:
    def __init__(self, trial_data,
                 selected_electrodes: List[str],
                 rereference=None,
                 normalization=None,
                 despike=False,
                 high_gamma=False) -> None:
        '''
            Input: trial_data=ecog and word data to perform processing on
        '''
        self.freqs_to_filter = [60, 120, 180, 240, 300, 360]
        self.trial_data = trial_data
        self.high_gamma= high_gamma
        self.rereference = rereference
        self.normalization = normalization
        self.despike = despike

        self.selected_electrodes = selected_electrodes

        if selected_electrodes==[]:
            self.selected_electrodes = trial_data.get_brain_region_localization()

        if self.rereference=="laplacian":
            self.adj_electrodes = self.get_all_adj_electrodes()

    def stem_electrode_name(self, name):
        #names look like 'O1aIb4', 'O1aIb5', 'O1aIb6', 'O1aIb7'
        #names look like 'T1b2
        reverse_name = reversed(name)
        found_stem_end = False
        stem, num = [], []
        for c in reversed(name):
            if c.isalpha():
                found_stem_end = True
            if found_stem_end:
                stem.append(c)
            else:
                num.append(c)
        return ''.join(reversed(stem)), int(''.join(reversed(num)))

    def get_adj_electrodes(self, name):
        labels = self.trial_data.get_brain_region_localization()
        all_electrode_stems = [self.stem_electrode_name(l) for l in labels]

        stem, num = self.stem_electrode_name(name)
        same_wire = [(s,n) for (s,n) in all_electrode_stems  if s==stem]
        nbrs = [(stem, num+1), (stem, num-1)]
        nbrs = [n for n in nbrs if n in all_electrode_stems]
        assert len(nbrs)==2
        return [e+str(s) for (e,s) in nbrs]

    def get_all_adj_electrodes(self):
        nbrs = [self.get_adj_electrodes(n) for n in self.selected_electrodes] #TODO debug
        flat_nbrs = [x for y in nbrs for x in y]
        return list(set(flat_nbrs))
        
    def notch_filter(self, data, freq, Q=30) -> np.ndarray:
        samp_frequency = self.trial_data.samp_frequency
        w0 = freq / (samp_frequency / 2)
        b, a = signal.iirnotch(w0, Q)
        y = signal.lfilter(b, a, data, axis = 1)
        return y

    def highpass_filter(self, data, freq, Q=30) -> np.ndarray:
        samp_frequency = self.trial_data.samp_frequency
        sos = signal.butter(Q, freq, 'highpass', fs=samp_frequency, output='sos')
        y = signal.sosfilt(sos, data, axis = 1)
        return y

    def band_filter(self, data, freqs, Q=30) -> np.ndarray:
        samp_frequency = self.trial_data.samp_frequency
        sos = signal.butter(Q, freqs, 'bandpass', analog=False, fs=samp_frequency, output='sos')
        y = signal.sosfilt(sos, data, axis = 1)
        return y

    def car_rereference(self, data_arr):
        all_ordered_labels = self.trial_data.get_brain_region_localization()
        selected = [(i,e) for i,e in enumerate(all_ordered_labels) if e in self.selected_electrodes]
        sel_idxs, sel_labels = zip(*selected)

        all_data = self.select_electrodes(all_ordered_labels)
        reref = data_arr - np.mean(all_data, axis=0)
        return reref

    def laplacian_rereference(self, data_arr):
        all_ordered_labels = self.trial_data.get_brain_region_localization()
        selected = [(i,e) for i,e in enumerate(all_ordered_labels) if e in self.selected_electrodes]
        sel_idxs, sel_labels = zip(*selected)

        ordered_nbrs = [e for e in all_ordered_labels if e in self.adj_electrodes]
        label2idx = {v:k for (k,v) in enumerate(ordered_nbrs)}

        adj_data_arr = self.select_electrodes(self.adj_electrodes)
        sel_nbrs = [self.get_adj_electrodes(n) for n in sel_labels]
        sel_nbrs_idxs = [[label2idx[l] for l in nbr_list] for nbr_list in sel_nbrs]
        sel_nbr_data = [[adj_data_arr[i] for i in idx_list] for idx_list in sel_nbrs_idxs]
        sel_nbr_data = np.array(sel_nbr_data)
        sel_nbr_data = self.filter_data(sel_nbr_data)

        #sel_nbr_data is [n_electrodes, 2, n_samples]
        laplacian = data_arr - np.mean(sel_nbr_data, axis=1)
        return laplacian
        
    def filter_data(self, data_arr):
        for f in self.freqs_to_filter:
            data_arr = self.notch_filter(data_arr, f)
        if self.high_gamma:
            band_data_arr = self.band_filter(data_arr, [70,250], Q=5)
            data_arr = band_data_arr
        return data_arr

    def de_spike(self, y):
        fuzz = 125 #number of samples around the spike to subtract out
        scaling_factor = 0.95 #how much of the spike to remove

        zscored = scipy.stats.zscore(y)
        mask = (np.abs(zscored)>4)
        fuzzed_mask = np.sign(np.convolve(mask, np.ones(fuzz), mode='same'))
        de_spiked = y - (fuzzed_mask*y*scaling_factor)
        return de_spiked

    def get_filtered_data(self) -> np.ndarray:
        '''
            filters out freqs from the trial data
        '''
        data_arr = self.select_electrodes(self.selected_electrodes)

        data_arr = self.filter_data(data_arr)
        if self.rereference == "CAR":
           data_arr = self.car_rereference(data_arr)
        if self.rereference=="laplacian":
           data_arr = self.laplacian_rereference(data_arr)
        if self.normalization=="zscore":
            data_arr = scipy.stats.zscore(data_arr, axis=1)
        if self.normalization=="standard":
            #This should be the same as above in principle
            mean = np.mean(data_arr, axis=1)
            std_dev = np.std(data_arr, axis=1)
            eps = 0.0001
            standardized = (data_arr - mean)/(std_dev + eps)
        if self.despike:
            for i in range(data_arr.shape[0]):
                data_arr[i] = self.de_spike(data_arr[i])
        return data_arr

    def select_electrodes(self, selected) -> np.ndarray:
        '''
            Input:
                word_window_arr = array of shape [n_electrodes, n_words, n_samples]
                electrode_labels = list of all the electrode labels for a sample
            Output:
                word_window_arr = array of shape [n_selected_electrodes, n_words, n_samples]
                                  where the order of electrodes is the same as in self.selected_electrodes

        '''
        labels = self.trial_data.get_brain_region_localization()
        indices = [i for i,e in enumerate(labels) if e in selected]

        assert len(indices) == len(selected)

        with open(self.trial_data.neural_data_hash, 'r') as f:
            lines = f.readlines()
            precomputed_hash = lines[0].split()[0]

        electrode_data = []
        with h5py.File(self.trial_data.neural_data_file, 'r') as hf:
            raw_data = hf['data']#TODO add hash check
            stored_hash = raw_data.attrs['orig_data_hash']
            assert stored_hash == precomputed_hash, "need to update transposed data"

            for i in indices:
                electrode_data.append(raw_data[f'electrode_{i}'][:])
        electrode_data_arr = np.stack(electrode_data)
            
        return electrode_data_arr