import numpy as np 
import random
from csl.graph.SHD import SHD
from csl.utils.DAG2CPDAG import dag2cpdag
from csl.utils.TXT2GeneralGraph import dagadjmat2generalgraph
from csl.search.ConstraintBased.PC import pc
from csl.search.ScoreBased.GES import ges
from csl.utils import cit
import math
from sklearn.neural_network import MLPRegressor

from itertools import combinations
import random
from causallearn.utils.cit import CIT
import matplotlib.pyplot as plt

############### linear gaussian ################
##########x-y ###########
# mu = 1
# mu1 = 2
# mus = 3
# sigma_x = random.uniform(1,2)
# sigma_y = random.uniform(1,3)
# sigma_l = random.uniform(1,3)
# sigma_s = random.uniform(3,6)
# num_sample = 100000
# a = random.uniform(2,4)
# print(a)
# l1 = random.uniform(1,3)
# l2 = random.uniform(1,2)
# s1 = random.uniform(1,3)
# s2 = random.uniform(2,5)

# Ex = np.random.normal(mu,sigma_x,num_sample)
# Ey = np.random.normal(mu1,sigma_y,num_sample)
# El = np.random.normal(mu,sigma_l,num_sample)
# Es = np.random.normal(mus,sigma_s,num_sample)
# Esy = np.random.normal(mu,sigma_s,num_sample)
#####################case 1 (cause)#####################
# x = Ex
# c = np.zeros(100000)
# y = a * x + Ey
# o_data =  np.stack((x,y,c), axis = 1)


# per_cx = np.ones(100000)
# do_x = np.zeros(100000)
# Ey_per = np.random.normal(mu1,sigma_y,num_sample)
# per_y = Ey_per
# pertub_data_x = np.stack((do_x,Ey_per, per_cx), axis=1)
# data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
# # print(data_per_x.shape)
# np.save('./simulation_data/case1_do(x).npy', data_per_x)
# # print(pertub_data_x)


# per_cy = np.ones(100000)
# do_y = np.zeros(100000)
# Ex_per = np.random.normal(mu,sigma_x,num_sample)
# per_x = Ex_per
# perturb_data_y = np.stack((per_x,do_y,per_cy), axis = 1)
# data_per_y = np.concatenate((o_data,perturb_data_y), axis = 0)
# np.save('./simulation_data/case1_do(y).npy', data_per_y)

#####################case 2 (latent)########################
# L = El
# c = np.zeros(100000)
# x = Ex + l1 * L
# y = Ey + l2 * L
# o_data = np.stack((x,y,c),axis=1)

# per_cx = np.ones(100000)
# do_x = np.zeros(100000)
# Ey_per = np.random.normal(mu1,sigma_y,num_sample)
# El_per_x = np.random.normal(mu,sigma_l,num_sample)
# per_y = Ey_per + l2 * El_per_x
# pertub_data_x = np.stack((do_x,per_y, per_cx), axis=1)
# data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
# np.save('./simulation_data/case2_do(x).npy', data_per_x)

# per_cy = np.ones(100000)
# do_y = np.zeros(100000)
# Ex_per = np.random.normal(mu,sigma_x,num_sample)
# El_per_y = np.random.normal(mu,sigma_l,num_sample)
# per_x = Ex_per + l1 * El_per_y
# perturb_data_y = np.stack((per_x,do_y,per_cy), axis = 1)
# data_per_y = np.concatenate((o_data,perturb_data_y), axis = 0)
# np.save('./simulation_data/case2_do(y).npy', data_per_y)

#####################case 3 (selection)########################
# c = np.zeros(100000)
# x = Ex
# y = Ey
# mask = (s1 * x + s2 * y + Es > 3) & (s1 * x + s2 * y + Es < 6)
# x = x[mask]
# y = y[mask]
# c = c[mask]
# o_data = np.stack((x,y,c),axis=1)

# per_cx = np.ones(100000)
# Es_per_x = np.random.normal(mu,sigma_s,num_sample)
# do_x = np.zeros(100000)
# Ey_per = np.random.normal(mu1,sigma_y,num_sample)
# per_y = Ey_per
# mask_per_x = (s1 * do_x + s2 * per_y + Es_per_x > 3) & (s1 * do_x + s2 * per_y + Es_per_x < 6)
# do_x = do_x[mask_per_x]
# per_y = per_y[mask_per_x]
# per_cx = per_cx[mask_per_x]
# pertub_data_x = np.stack((do_x,per_y, per_cx), axis=1)
# print(pertub_data_x.shape)
# data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
# np.save('./simulation_data/case3_do(x).npy', data_per_x)
# print(data_per_x.shape)

# per_cy = np.ones(100000)
# Es_per_y = np.random.normal(mu,sigma_s,num_sample)
# do_y = np.zeros(100000)
# Ex_per = np.random.normal(mu,sigma_x,num_sample)
# per_x = Ex_per
# mask_per_y = (s1 * per_x + s2 * do_y + Es_per_y > 3) & (s1 * per_x + s2 * do_y + Es_per_y < 6)
# per_x = per_x[mask_per_y]
# do_y = do_y[mask_per_y]
# per_cy = per_cy[mask_per_y]
# pertub_data_y = np.stack((per_x,do_y, per_cy), axis=1)
# print(pertub_data_y.shape)
# data_per_y = np.concatenate((o_data,pertub_data_y), axis = 0)
# np.save('./simulation_data/case3_do(y).npy', data_per_y)
# print(data_per_y.shape)

#####################case 4 (casue with selection)########################
# c = np.zeros(100000)
# x = Ex 
# y = Ey + a * Ex
# mask = (s1 * x + s2 * y + Es > 5) & (s1 * x + s2 * y + Es < 50)
# print(s1 * x + s2 * y + Es)
# x = x[mask]
# y = y[mask]
# c = c[mask]
# o_data = np.stack((x,y,c),axis=1)

# per_cx = np.ones(100000)
# Es_per_x = np.random.normal(mu,sigma_s,num_sample)
# do_x = np.zeros(100000)
# Ey_per = np.random.normal(mu1,sigma_y,num_sample)
# per_y = Ey_per + do_x * a
# mask_per_x = (s1 * do_x + s2 * per_y + Es_per_x > 5) & (s1 * do_x + s2 * per_y + Es_per_x < 50)
# do_x = do_x[mask_per_x]
# per_y = per_y[mask_per_x]
# per_cx = per_cx[mask_per_x]
# pertub_data_x = np.stack((do_x,per_y, per_cx), axis=1)
# data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
# np.save('./simulation_data/case4_do(x).npy', data_per_x)
# print(pertub_data_x.shape)
# print(data_per_x.shape)


# per_cy = np.ones(100000)
# Es_per_y = np.random.normal(mu,sigma_s,num_sample)
# do_y = np.zeros(100000)
# Ex_per = np.random.normal(mu,sigma_x,num_sample)
# per_x = Ex_per
# mask_per_y = (s1 * per_x + s2 * do_y + Es_per_y > 5) & (s1 * per_x + s2 * do_y + Es_per_y < 50)
# per_x = per_x[mask_per_y]
# do_y = do_y[mask_per_y]
# per_cy = per_cy[mask_per_y]
# pertub_data_y = np.stack((per_x,do_y, per_cy), axis=1)
# data_per_y = np.concatenate((o_data,pertub_data_y), axis = 0)
# np.save('./simulation_data/case4_do(y).npy', data_per_y)
# print(pertub_data_y.shape)
# print(data_per_y.shape)

# #####################case 5 (casue with latent)########################
# L = El
# c = np.zeros(100000)
# x = Ex + l1 * L
# y = a * Ex + Ey + l2 * L
# o_data = np.stack((x,y,c),axis=1)

# per_cx = np.ones(100000)
# do_x = np.zeros(100000)
# Ey_per = np.random.normal(mu1,sigma_y,num_sample)
# El_per_x = np.random.normal(mu,sigma_l,num_sample)
# per_y = Ey_per + l2 * El_per_x
# pertub_data_x = np.stack((do_x,per_y, per_cx), axis=1)
# data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
# np.save('./simulation_data/case5_do(x).npy', data_per_x)

# per_cy = np.ones(100000)
# do_y = np.zeros(100000)
# Ex_per = np.random.normal(mu,sigma_x,num_sample)
# El_per_y = np.random.normal(mu,sigma_l,num_sample)
# per_x = Ex_per + l1 * El_per_y
# perturb_data_y = np.stack((per_x,do_y,per_cy), axis = 1)
# data_per_y = np.concatenate((o_data,perturb_data_y), axis = 0)
# np.save('./simulation_data/case5_do(y).npy', data_per_y)

# #####################case 6 (selection with latent)########################

# L = El
# c = np.zeros(100000)
# x = Ex + l1 * L
# y = Ey + l2 * L
# mask = (s1 * x + s2 * y + Es > 5) & (s1 * x + s2 * y + Es < 50)
# x = x[mask]
# y = y[mask]
# c = c[mask]
# o_data = np.stack((x,y,c),axis=1)

# per_cx = np.ones(100000)
# El_per_x = np.random.normal(mu,sigma_l,num_sample)
# Es_per_x = np.random.normal(mu,sigma_s,num_sample)
# do_x = np.zeros(100000)
# Ey_per = np.random.normal(mu1,sigma_y,num_sample)
# per_y = Ey_per + l2 * El_per_x
# mask_per_x = (s1 * do_x + s2 * per_y + Es_per_x > 5) & (s1 * do_x + s2 * per_y + Es_per_x < 50)
# do_x = do_x[mask_per_x]
# per_y = per_y[mask_per_x]
# per_cx = per_cx[mask_per_x]
# pertub_data_x = np.stack((do_x,per_y, per_cx), axis=1)
# data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
# np.save('./simulation_data/case6_do(x).npy', data_per_x)

# per_cy = np.ones(100000)
# El_per_y = np.random.normal(mu,sigma_l,num_sample)
# Es_per_y = np.random.normal(mu,sigma_s,num_sample)
# do_y = np.zeros(100000)
# Ex_per = np.random.normal(mu,sigma_x,num_sample)
# per_x = Ex_per + l1 * El_per_y
# mask_per_y = (s1 * per_x + s2 * do_y + Es_per_y > 5) & (s1 * per_x + s2 * do_y + Es_per_y < 50)
# per_x = per_x[mask_per_y]
# do_y = do_y[mask_per_y]
# per_cy = per_cy[mask_per_y]
# pertub_data_y = np.stack((per_x,do_y, per_cy), axis=1)
# data_per_y = np.concatenate((o_data,pertub_data_y), axis = 0)
# np.save('./simulation_data/case6_do(y).npy', data_per_y)

# #####################case 7 (cause with selection and latent)########################

# L = El
# c = np.zeros(100000)
# x = Ex + l1 * L
# y = Ey + l2 * L + a * x
# mask = (s1 * x + s2 * y + Es > 10) & (s1 * x + s2 * y + Es < 40)
# print(s1 * x + s2 * y + Es)
# x = x[mask]
# y = y[mask]
# c = c[mask]
# o_data = np.stack((x,y,c),axis=1)
# # print(o_data)

# per_cx = np.ones(100000)
# El_per_x = np.random.normal(mu,sigma_l,num_sample)
# Es_per_x = np.random.normal(mus,sigma_s,num_sample)
# do_x = np.zeros(100000)
# Ey_per = np.random.normal(mu1,sigma_y,num_sample)
# per_y = Ey_per + l2 * El_per_x + a * do_x
# mask_per_x = (s1 * do_x + s2 * per_y + Es_per_x > 10) & (s1 * do_x + s2 * per_y + Es_per_x < 40)
# do_x = do_x[mask_per_x]
# per_y = per_y[mask_per_x]
# per_cx = per_cx[mask_per_x]
# pertub_data_x = np.stack((do_x,per_y, per_cx), axis=1)
# data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
# np.save('./simulation_data/case7_do(x).npy', data_per_x)
# print(pertub_data_x.shape)
# print(data_per_x.shape)

# per_cy = np.ones(100000)
# El_per_y = np.random.normal(mu,sigma_l,num_sample)
# Es_per_y = np.random.normal(mus,sigma_s,num_sample)
# do_y = np.zeros(100000)
# Ex_per = np.random.normal(mu,sigma_x,num_sample)
# per_x = Ex_per + l1 * El_per_y
# mask_per_y = (s1 * per_x + s2 * do_y + Es_per_y > 10) & (s1 * per_x + s2 * do_y + Es_per_y < 40)
# per_x = per_x[mask_per_y]
# do_y = do_y[mask_per_y]
# per_cy = per_cy[mask_per_y]
# pertub_data_y = np.stack((per_x,do_y, per_cy), axis=1)
# data_per_y = np.concatenate((o_data,pertub_data_y), axis = 0)
# np.save('./simulation_data/case7_do(y).npy', data_per_y)
# print(pertub_data_y.shape)
# print(data_per_y.shape)



############### linear non-gaussian ################

# startx = -1
# endx = 2
# starty = 3
# endy = 5
# startl = 7
# endl = 9
# starts = 2
# ends = 4
# num_sample = 4000
# a = random.uniform(5,15)
# print(a)
# l1 = random.uniform(4,6)
# l2 = random.uniform(4,6)
# s1 = random.uniform(-1,3)
# s2 = random.uniform(1,2)
# Ex = np.random.uniform(startx,endx,num_sample)
# Ey = np.random.uniform(starty,endy,num_sample)
# El = np.random.uniform(startl,endl,num_sample)
# Es = np.random.uniform(starts,ends,num_sample)













#####################linear non-gaussian #####################

#####################case 1 (cause)#####################

# startx = -1
# endx = 2
# starty = 3
# endy = 5
# startl = 7
# endl = 9
# starts = 2
# ends = 4
# num_sample = 4000
# a = random.uniform(5,15)
# print(a)
# l1 = random.uniform(4,6)
# l2 = random.uniform(4,6)
# s1 = random.uniform(-1,3)
# s2 = random.uniform(1,2)
# Ex = np.random.uniform(startx,endx,num_sample)
# Ey = np.random.uniform(starty,endy,num_sample)
# El = np.random.uniform(startl,endl,num_sample)
# Es = np.random.uniform(starts,ends,num_sample)

# x = Ex
# c = np.zeros(4000)
# y = a * x + Ey
# o_data =  np.stack((x,y,c), axis = 1)


# per_cx = np.ones(4000)
# do_x = np.zeros(4000)
# Ey_per = np.random.uniform(starty,endy,num_sample)
# per_y = Ey_per
# pertub_data_x = np.stack((do_x,Ey_per, per_cx), axis=1)
# data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
# print(data_per_x.shape)
# np.save('./linear_non-gaussian/case1_do(x).npy', data_per_x)
# # print(pertub_data_x)


# per_cy = np.ones(4000)
# do_y = np.zeros(4000)
# Ex_per = np.random.uniform(startx,endx,num_sample)
# per_x = Ex_per
# perturb_data_y = np.stack((per_x,do_y,per_cy), axis = 1)
# data_per_y = np.concatenate((o_data,perturb_data_y), axis = 0)
# np.save('./linear_non-gaussian/case1_do(y).npy', data_per_y)

#####################case 2 (latent)########################

# startx = -1
# endx = 2
# starty = 3
# endy = 5
# startl = 7
# endl = 9
# starts = 2
# ends = 4
# num_sample = 4000
# a = random.uniform(5,15)
# print(a)
# l1 = random.uniform(4,6)
# l2 = random.uniform(4,6)
# s1 = random.uniform(-1,3)
# s2 = random.uniform(1,2)
# Ex = np.random.uniform(startx,endx,num_sample)
# Ey = np.random.uniform(starty,endy,num_sample)
# El = np.random.uniform(startl,endl,num_sample)
# Es = np.random.uniform(starts,ends,num_sample)

# L = El
# c = np.zeros(4000)
# x = Ex + l1 * L
# y = Ey + l2 * L
# o_data = np.stack((x,y,c),axis=1)

# per_cx = np.ones(4000)
# do_x = np.zeros(4000)
# Ey_per = np.random.uniform(starty,endy,num_sample)
# El_per_x = np.random.uniform(startl, endl,num_sample)
# per_y = Ey_per + l2 * El_per_x
# pertub_data_x = np.stack((do_x,per_y, per_cx), axis=1)
# data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
# np.save('./linear_non-gaussian/case2_do(x).npy', data_per_x)

# per_cy = np.ones(4000)
# do_y = np.zeros(4000)
# Ex_per = np.random.uniform(startx, endx,num_sample)
# El_per_y = np.random.uniform(startl, endl,num_sample)
# per_x = Ex_per + l1 * El_per_y
# perturb_data_y = np.stack((per_x,do_y,per_cy), axis = 1)
# data_per_y = np.concatenate((o_data,perturb_data_y), axis = 0)
# np.save('./linear_non-gaussian/case2_do(y).npy', data_per_y)

#####################case 3 (selection)########################

# startx = -1
# endx = 2
# starty = 3
# endy = 5
# startl = 7
# endl = 9
# starts = 2
# ends = 4
# num_sample = 4000
# a = random.uniform(5,15)
# print(a)
# l1 = random.uniform(4,6)
# l2 = random.uniform(4,6)
# s1 = random.uniform(-1,3)
# s2 = random.uniform(1,2)
# Ex = np.random.uniform(startx,endx,num_sample)
# Ey = np.random.uniform(starty,endy,num_sample)
# El = np.random.uniform(startl,endl,num_sample)
# Es = np.random.uniform(starts,ends,num_sample)


# c = np.zeros(4000)
# x = Ex
# y = Ey
# mask = (s1 * x + s2 * y + Es > 0) & (s1 * x + s2 * y + Es < 10)
# print(s1 * x + s2 * y + Es)
# x = x[mask]
# y = y[mask]
# c = c[mask]
# o_data = np.stack((x,y,c),axis=1)

# per_cx = np.ones(4000)
# Es_per_x = np.random.uniform(starts, ends,num_sample)
# do_x = np.zeros(4000)
# Ey_per = np.random.uniform(starty,endy,num_sample)
# per_y = Ey_per
# mask_per_x = (s1 * do_x + s2 * per_y + Es_per_x > 0) & (s1 * do_x + s2 * per_y + Es_per_x < 10)
# do_x = do_x[mask_per_x]
# per_y = per_y[mask_per_x]
# per_cx = per_cx[mask_per_x]
# pertub_data_x = np.stack((do_x,per_y, per_cx), axis=1)
# print(pertub_data_x.shape)
# data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
# np.save('./linear_non-gaussian/case3_do(x).npy', data_per_x)
# print(data_per_x.shape)

# per_cy = np.ones(4000)
# Es_per_y = np.random.uniform(starts, ends,num_sample)
# do_y = np.zeros(4000)
# Ex_per = np.random.uniform(startx, endx,num_sample)
# per_x = Ex_per
# mask_per_y = (s1 * per_x + s2 * do_y + Es_per_y > 0) & (s1 * per_x + s2 * do_y + Es_per_y < 10)
# print(s1 * per_x + s2 * do_y + Es_per_y)
# per_x = per_x[mask_per_y]
# do_y = do_y[mask_per_y]
# per_cy = per_cy[mask_per_y]
# pertub_data_y = np.stack((per_x,do_y, per_cy), axis=1)
# print(pertub_data_y.shape)
# data_per_y = np.concatenate((o_data,pertub_data_y), axis = 0)
# np.save('./linear_non-gaussian/case3_do(y).npy', data_per_y)
# print(data_per_y.shape)

#####################case 4 (casue with selection)########################
# startx = -1
# endx = 2
# starty = 3
# endy = 5
# startl = 7
# endl = 9
# starts = 2
# ends = 4
# num_sample = 4000
# a = random.uniform(5,15)
# print(a)
# l1 = random.uniform(4,6)
# l2 = random.uniform(4,6)
# s1 = random.uniform(-1,3)
# s2 = random.uniform(1,2)
# Ex = np.random.uniform(startx,endx,num_sample)
# Ey = np.random.uniform(starty,endy,num_sample)
# El = np.random.uniform(startl,endl,num_sample)
# Es = np.random.uniform(starts,ends,num_sample)

# c = np.zeros(4000)
# x = Ex 
# y = Ey + a * Ex
# mask = (s1 * x + s2 * y + Es > 0) & (s1 * x + s2 * y + Es < 10)
# print(s1 * x + s2 * y + Es)
# x = x[mask]
# y = y[mask]
# c = c[mask]
# o_data = np.stack((x,y,c),axis=1)

# per_cx = np.ones(4000)
# Es_per_x = np.random.uniform(starts, ends,num_sample)
# do_x = np.zeros(4000)
# Ey_per = np.random.uniform(starty,endy,num_sample)
# per_y = Ey_per + do_x * a
# mask_per_x = (s1 * do_x + s2 * per_y + Es_per_x > 0) & (s1 * do_x + s2 * per_y + Es_per_x < 10)
# do_x = do_x[mask_per_x]
# per_y = per_y[mask_per_x]
# per_cx = per_cx[mask_per_x]
# pertub_data_x = np.stack((do_x,per_y, per_cx), axis=1)
# data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
# np.save('./linear_non-gaussian/case4_do(x).npy', data_per_x)
# print(pertub_data_x.shape)
# print(data_per_x.shape)


# per_cy = np.ones(4000)
# Es_per_y = np.random.uniform(starts, ends,num_sample)
# do_y = np.zeros(4000)
# Ex_per = np.random.uniform(startx, endx,num_sample)
# per_x = Ex_per
# mask_per_y = (s1 * per_x + s2 * do_y + Es_per_y > 0) & (s1 * per_x + s2 * do_y + Es_per_y < 10)
# per_x = per_x[mask_per_y]
# do_y = do_y[mask_per_y]
# per_cy = per_cy[mask_per_y]
# pertub_data_y = np.stack((per_x,do_y, per_cy), axis=1)
# data_per_y = np.concatenate((o_data,pertub_data_y), axis = 0)
# np.save('./linear_non-gaussian/case4_do(y).npy', data_per_y)
# print(pertub_data_y.shape)
# print(data_per_y.shape)

# #####################case 5 (casue with latent)########################
# L = El
# c = np.zeros(4000)
# x = Ex + l1 * L
# y = a * Ex + Ey + l2 * L
# o_data = np.stack((x,y,c),axis=1)

# per_cx = np.ones(4000)
# do_x = np.zeros(4000)
# Ey_per = np.random.uniform(starty,endy,num_sample)
# El_per_x = np.random.uniform(startl, endl,num_sample)
# per_y = Ey_per + l2 * El_per_x
# pertub_data_x = np.stack((do_x,per_y, per_cx), axis=1)
# data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
# np.save('./linear_non-gaussian/case5_do(x).npy', data_per_x)

# per_cy = np.ones(4000)
# do_y = np.zeros(4000)
# Ex_per = np.random.uniform(startx, endx,num_sample)
# El_per_y = np.random.uniform(startl, endl,num_sample)
# per_x = Ex_per + l1 * El_per_y
# perturb_data_y = np.stack((per_x,do_y,per_cy), axis = 1)
# data_per_y = np.concatenate((o_data,perturb_data_y), axis = 0)
# np.save('./linear_non-gaussian/case5_do(y).npy', data_per_y)

# #####################case 6 (selection with latent)########################

# L = El
# c = np.zeros(4000)
# x = Ex + l1 * L
# y = Ey + l2 * L
# mask = (s1 * x + s2 * y + Es > 60) & (s1 * x + s2 * y + Es < 130)
# print(s1 * x + s2 * y + Es)
# x = x[mask]
# y = y[mask]
# c = c[mask]
# o_data = np.stack((x,y,c),axis=1)

# per_cx = np.ones(4000)
# El_per_x = np.random.uniform(startl, endl,num_sample)
# Es_per_x = np.random.uniform(starts, ends,num_sample)
# do_x = np.zeros(4000)
# Ey_per = np.random.uniform(starty,endy,num_sample)
# per_y = Ey_per + l2 * El_per_x
# mask_per_x = (s1 * do_x + s2 * per_y + Es_per_x > 60) & (s1 * do_x + s2 * per_y + Es_per_x < 130)
# do_x = do_x[mask_per_x]
# per_y = per_y[mask_per_x]
# per_cx = per_cx[mask_per_x]
# pertub_data_x = np.stack((do_x,per_y, per_cx), axis=1)
# data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
# np.save('./linear_non-gaussian/case6_do(x).npy', data_per_x)
# print(pertub_data_x.shape)
# print(data_per_x.shape)

# per_cy = np.ones(4000)
# El_per_y = np.random.uniform(startl, endl,num_sample)
# Es_per_y = np.random.uniform(starts, ends,num_sample)
# do_y = np.zeros(4000)
# Ex_per = np.random.uniform(startx, endx,num_sample)
# per_x = Ex_per + l1 * El_per_y
# mask_per_y = (s1 * per_x + s2 * do_y + Es_per_y > 60) & (s1 * per_x + s2 * do_y + Es_per_y < 130)
# print(s1 * per_x + s2 * do_y + Es_per_y)
# per_x = per_x[mask_per_y]
# do_y = do_y[mask_per_y]
# per_cy = per_cy[mask_per_y]
# pertub_data_y = np.stack((per_x,do_y, per_cy), axis=1)
# data_per_y = np.concatenate((o_data,pertub_data_y), axis = 0)
# np.save('./linear_non-gaussian/case6_do(y).npy', data_per_y)
# print(pertub_data_y.shape)
# print(data_per_y.shape)
# #####################case 7 (cause with selection and latent)########################
# startx = -1
# endx = 2
# starty = 1
# endy = 3
# startl = 2
# endl = 3
# starts = 2
# ends = 4
# num_sample = 4000
# a = random.uniform(10,15)
# print(a)
# l1 = random.uniform(1,3)
# l2 = random.uniform(1,3)
# s1 = random.uniform(2,3)
# s2 = random.uniform(1,2)
# Ex = np.random.uniform(startx,endx,num_sample)
# Ey = np.random.uniform(starty,endy,num_sample)
# El = np.random.uniform(startl,endl,num_sample)
# Es = np.random.uniform(starts,ends,num_sample)

# L = El
# c = np.zeros(4000)
# x = Ex + l1 * L
# y = Ey + l2 * L + a * x
# mask = (s1 * x + s2 * y + Es > 5) & (s1 * x + s2 * y + Es < 100)
# print(s1 * x + s2 * y + Es)
# x = x[mask]
# y = y[mask]
# c = c[mask]
# print(y)
# o_data = np.stack((x,y,c),axis=1)
# # print(o_data)

# per_cx = np.ones(4000)
# El_per_x = np.random.uniform(startl, endl,num_sample)
# Es_per_x = np.random.uniform(starts,ends,num_sample)
# do_x = np.zeros(4000)
# Ey_per = np.random.uniform(starty,endy,num_sample)
# per_y = Ey_per + l2 * El_per_x + a * do_x
# mask_per_x = (s1 * do_x + s2 * per_y + Es_per_x > 5) & (s1 * do_x + s2 * per_y + Es_per_x < 100)
# print(s1 * do_x + s2 * per_y + Es_per_x )
# do_x = do_x[mask_per_x]
# per_y = per_y[mask_per_x]
# print(per_y)
# per_cx = per_cx[mask_per_x]
# pertub_data_x = np.stack((do_x,per_y, per_cx), axis=1)
# data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
# np.save('./linear_non-gaussian/case7_do(x).npy', data_per_x)
# print(pertub_data_x.shape)
# print(data_per_x.shape)

# per_cy = np.ones(4000)
# El_per_y = np.random.uniform(startl, endl,num_sample)
# Es_per_y = np.random.uniform(starts,ends,num_sample)
# do_y = np.zeros(4000)
# Ex_per = np.random.uniform(startx, endx,num_sample)
# per_x = Ex_per + l1 * El_per_y
# mask_per_y = (s1 * per_x + s2 * do_y + Es_per_y > 5) & (s1 * per_x + s2 * do_y + Es_per_y < 100)
# print(s1 * per_x + s2 * do_y + Es_per_y)
# per_x = per_x[mask_per_y]
# do_y = do_y[mask_per_y]
# per_cy = per_cy[mask_per_y]
# pertub_data_y = np.stack((per_x,do_y, per_cy), axis=1)
# data_per_y = np.concatenate((o_data,pertub_data_y), axis = 0)
# np.save('./linear_non-gaussian/case7_do(y).npy', data_per_y)
# print(pertub_data_y.shape)
# print(data_per_y.shape)









############## non-linear gaussian ################



#########x-y ###########
# mu = 4
# mu1 = 10
# mus = 3
# sigma_x = random.uniform(0,2)
# sigma_y = random.uniform(3,5)
# sigma_l = random.uniform(1,3)
# sigma_s = random.uniform(3,6)
# num_sample = 4000

# l1 = random.uniform(1,3)
# l2 = random.uniform(1,2)
# s1 = random.uniform(1,3)
# s2 = random.uniform(2,5)

# Ex = np.random.normal(mu,sigma_x,num_sample)
# Ey = np.random.normal(mu1,sigma_y,num_sample)
# El = np.random.normal(mu,sigma_l,num_sample)
# Es = np.random.normal(mus,sigma_s,num_sample)
# Esy = np.random.normal(mu,sigma_s,num_sample)

# def sigmoid(x):
#     return 1 / (1 + np.exp(-x))

# def initialize_parameters(input_size, hidden_size, output_size):
#     parameters = {}
#     parameters['W1'] = np.random.randn(hidden_size, input_size) 
#     parameters['b1'] = random.uniform(1, 10)
#     parameters['W2'] = np.random.randn(hidden_size, hidden_size)
#     parameters['b2'] = random.uniform(1, 10)
#     parameters['W3'] = np.random.randn(output_size, hidden_size)
#     parameters['b3'] = np.zeros((output_size, 1))
#     return parameters

# def forward_propagation(X, parameters):
#     W1, b1, W2, b2, W3, b3 = parameters.values()
#     Z1 = np.dot(X, W1) + b1
#     A1 = sigmoid(Z1)
#     Z2 = np.dot(A1, W2) + b2
#     A2 = sigmoid(Z2)
#     # Z3 = np.dot(A2, W3) + b3
#     # A3 = sigmoid(Z3)
#     return A2

# input_size = 1 
# hidden_size = 1 
# output_size = 1 

# import torch

# non_linear = torch.nn.Sequential(torch.nn.Linear(1, 4),
#                     torch.nn.LeakyReLU(),
#                     torch.nn.Linear(4, 4),            
#                     torch.nn.LeakyReLU(),
#                     torch.nn.Linear(4, 1),)

function = ['order2', 'order3', 'x_2', 'x_2_sinx', 'x_3', 'x_3_sinx', 'x_2_tanh', 'x_3_tanh']

def polynomial(cof,r,x):
    f = 0
    for i in range(r+1):
        f = f + cof[i] * x**i
    return f
def power_f(cof,r,x):
    return cof[0] * x**r
def combine1(cof, r,x):
    return cof[0] * x**r + np.sin(x)
def combine2(cof, r,x):
    return cof[0] * x**r + np.tanh(x)

def choose_function(low=0):
    a1 = random.uniform(low,2)
    a2 = random.uniform(low,2)
    a3 = random.uniform(low,2)
    b = random.uniform(low,2)
    cof = [b, a1 ,a2 ,a3]
    f_index = random.randint(0,7)
    f = function[f_index]
    print(f)

    if f == 'order2':
        non_linear = polynomial
        degree = 2
    elif f == 'order3':
        non_linear = polynomial
        degree = 3
    elif f =='x_2':
        non_linear = power_f
        degree =2
    elif f=='x_2_sinx':
        non_linear= combine1
        degree =2
    elif f == 'x_3':
        non_linear = power_f
        degree =3
    elif f=='x_3_sinx':
        non_linear = combine1
        degree = 3
    elif f == 'x_2_tanh':
        non_linear = combine2
        degree = 2
    elif f=='x_3_tanh':
        non_linear=combine2
        degree=3
    else:
        print('function not in the list')

    return non_linear, degree, cof


# for i in range(10):
    
#     mu = 3
#     mu1 = 6
#     mus = 3
#     sigma_x = random.uniform(0,2)
#     sigma_y = random.uniform(1,3)
#     sigma_l = random.uniform(1,3)
#     sigma_s = random.uniform(3,6)
#     num_sample = 2000

#     l1 = random.uniform(1,3)
#     l2 = random.uniform(1,2)
#     s1 = random.uniform(1,3)
#     s2 = random.uniform(2,5)

#     Ex = np.random.normal(mu,sigma_x,num_sample)
#     Ey = np.random.normal(mu1,sigma_y,num_sample)
#     El = np.random.normal(mu,sigma_l,num_sample)
#     Es = np.random.normal(mus,sigma_s,num_sample)
#     Esy = np.random.normal(mu,sigma_s,num_sample)

#     f_index = random.randint(0,7)
#     f = function[f_index]
#     print(f)

#     if f == 'order2':
#         non_linear = polynomial
#         degree = 2
#     elif f == 'order3':
#         non_linear = polynomial
#         degree = 3
#     elif f =='x_2':
#         non_linear = power_f
#         degree =2
#     elif f=='x_2_sinx':
#         non_linear= combine1
#         degree =2
#     elif f == 'x_3':
#         non_linear = power_f
#         degree =3
#     elif f=='x_3_sinx':
#         non_linear = combine1
#         degree = 3
#     elif f == 'x_2_tanh':
#         non_linear = combine2
#         degree = 2
#     elif f=='x_3_tanh':
#         non_linear=combine2
#         degree=3
#     else:
#         print('function not in the list')



#     x = Ex
#     c = np.zeros(2000)
#     # parameters = initialize_parameters(input_size, hidden_size, output_size)
#     # y = forward_propagation(x.reshape(-1,1), parameters).reshape(-1) + Ey
#     # mlp_c.fit(x.reshape(-1,1), np.random.rand(x.shape[0]))
#     # y = mlp_c.predict(x.reshape(-1,1)).reshape(-1) + Ey
#     y = Ey + non_linear(degree, x)
#     o_data = np.stack((x,y,c), axis = 1)

#     per_cx = np.ones(2000)
#     do_x = np.zeros(2000)
#     Ey_per = np.random.normal(mu1,sigma_y,num_sample)
#     per_y = Ey_per + non_linear(degree, do_x)
#     pertub_data_x = np.stack((do_x,Ey_per, per_cx), axis=1)
#     data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
#     # print(data_per_x.shape)
#     np.save('./non_linear_gaussian/test_do(x).npy', data_per_x)


#     kci_obj = CIT(data_per_x, "kci")
#     pValue = kci_obj(1,2,set([]))
#     print(1,2,())
#     print(pValue)
#     pValue = kci_obj(1,2,set([0]))
#     print(1,2,(0))
#     print(pValue)
#     if pValue < 0.05:
#         continue


#     per_cy = np.ones(2000)
#     Ey_per = np.random.normal(mu1,sigma_y,num_sample)
#     do_y = np.zeros(2000)
#     Ex_per = np.random.normal(mu,sigma_x,num_sample)
#     per_x = Ex_per
#     perturb_data_y = np.stack((per_x,do_y,per_cy), axis = 1)
#     data_per_y = np.concatenate((o_data,perturb_data_y), axis = 0)
#     np.save('./non_linear_gaussian/test_do(y).npy', data_per_y)
#     import pdb
#     # pdb.set_trace()

    
#     data = np.load('./non_linear_gaussian/test_do(y).npy')
#     indicator = 1

#     kci_obj = CIT(data, "kci") # construct a CIT instance with data and method name
#     if indicator == 0:
#         pValue = kci_obj(1,2,set([]))
#         print(1,2,())
#         print(pValue)
#         pValue = kci_obj(1,2,set([0]))
#         print(1,2,(0))
#         print(pValue)
#     else:
#         pValue = kci_obj(0,2,set([]))
#         print(0,2,())
#         print(pValue)
#         pValue = kci_obj(0,2,set([1]))
#         print(0,2,(1))
#         print(pValue)
#         if pValue < 0.05:
#             break



####################case 1 (cause)#####################
# for i in range(20):
#     mu = 2
#     mu1 = 6
#     mus = 3
#     sigma_x = random.uniform(0,2)
#     sigma_y = random.uniform(1,3)
#     sigma_l = random.uniform(1,3)
#     sigma_s = random.uniform(3,6)
#     num_sample = 4000

#     l1 = random.uniform(1,3)
#     l2 = random.uniform(1,2)
#     s1 = random.uniform(1,3)
#     s2 = random.uniform(2,5)
#     a = random.uniform(0,5)
#     b = random.uniform(0,10)
#     c = random.uniform(5,15)

#     Ex = np.random.normal(mu,sigma_x,num_sample)
#     Ey = np.random.normal(mu1,sigma_y,num_sample)
#     El = np.random.normal(mu,sigma_l,num_sample)
#     Es = np.random.normal(mus,sigma_s,num_sample)
#     Esy = np.random.normal(mu,sigma_s,num_sample)

#     # mlp_c = MLPRegressor(hidden_layer_sizes=(1, 1, 1), activation='relu', solver='adam')

#     x = Ex
#     c = np.zeros(4000)
#     # parameters = initialize_parameters(input_size, hidden_size, output_size)
#     # y = forward_propagation(x.reshape(-1,1), parameters).reshape(-1) + Ey
#     # mlp_c.fit(x.reshape(-1,1), np.random.rand(x.shape[0]))
#     # y = mlp_c.predict(x.reshape(-1,1)).reshape(-1) + Ey
#     y = Ey + non_linear(a,b,c,x)
#     # y = Ey + non_linear(torch.from_numpy(x.reshape(-1,1)).float()).detach().numpy().reshape(-1)
#     o_data =  np.stack((x,y,c), axis = 1)

#     per_cx = np.ones(4000)
#     do_x = np.zeros(4000)
#     Ey_per = np.random.normal(mu1,sigma_y,num_sample)
#     per_y = Ey_per
#     pertub_data_x = np.stack((do_x,Ey_per, per_cx), axis=1)
#     data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
#     # print(data_per_x.shape)
#     np.save('./non_linear_gaussian/case1_do(x).npy', data_per_x)
#     # print(pertub_data_x)


#     per_cy = np.ones(4000)
#     Ey_per = np.random.normal(mu1,sigma_y,num_sample)
#     do_y = np.zeros(4000)
#     Ex_per = np.random.normal(mu,sigma_x,num_sample)
#     per_x = Ex_per
#     perturb_data_y = np.stack((per_x,do_y,per_cy), axis = 1)
#     data_per_y = np.concatenate((o_data,perturb_data_y), axis = 0)
#     np.save('./non_linear_gaussian/case1_do(y).npy', data_per_y)


    
####################case 2 (latent)########################

# for i in range(10):
#     mu = 2
#     mu1 = 6
#     mus = 3
#     sigma_x = random.uniform(0,2)
#     sigma_y = random.uniform(1,3)
#     sigma_l = random.uniform(1,3)
#     sigma_s = random.uniform(3,6)
#     num_sample = 2000

#     l1 = random.uniform(1,3)
#     l2 = random.uniform(1,2)
#     s1 = random.uniform(1,3)
#     s2 = random.uniform(2,5)
#     a_lx = random.uniform(0,5)
#     b_lx = random.uniform(0,10)
#     c_lx = random.uniform(5,15)
#     a_ly = random.uniform(0,5)
#     b_ly = random.uniform(0,10)
#     c_ly = random.uniform(5,15)

#     Ex = np.random.normal(mu,sigma_x,num_sample)
#     Ey = np.random.normal(mu1,sigma_y,num_sample)
#     El = np.random.normal(mu,sigma_l,num_sample)
#     Es = np.random.normal(mus,sigma_s,num_sample)
#     Esy = np.random.normal(mu,sigma_s,num_sample)
#     L1, de1 = choose_function()
#     L2, de2 = choose_function()



#     L = El
#     c = np.zeros(2000)
#     x = Ex + L1(de1, L)
#     y = Ey + L2(de2, L)
#     o_data = np.stack((x,y,c),axis=1)

#     per_cx = np.ones(2000)
#     do_x = np.zeros(2000)
#     Ey_per = np.random.normal(mu1,sigma_y,num_sample)
#     El_per_x = np.random.normal(mu,sigma_l,num_sample)
#     per_y = Ey_per + L2(de2,El_per_x)
#     pertub_data_x = np.stack((do_x,per_y, per_cx), axis=1)
#     data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
#     # np.save('./non_linear_gaussian/case2_do(x).npy', data_per_x)

#     kci_obj = CIT(data_per_x, "kci")
#     pValue = kci_obj(1,2,set([]))
#     print(1,2,())
#     print(pValue)
#     if pValue < 0.05:
#         continue
#     pValue = kci_obj(1,2,set([0]))
#     print(1,2,(0))
#     print(pValue)
#     if pValue > 0.05:
#         continue


#     per_cy = np.ones(2000)
#     do_y = np.zeros(2000)
#     Ex_per = np.random.normal(mu,sigma_x,num_sample)
#     El_per_y = np.random.normal(mu,sigma_l,num_sample)
#     per_x = Ex_per + L1(de1,El_per_y)
#     perturb_data_y = np.stack((per_x,do_y,per_cy), axis = 1)
#     data_per_y = np.concatenate((o_data,perturb_data_y), axis = 0)
#     # np.save('./non_linear_gaussian/case2_do(y).npy', data_per_y)

#     kci_obj = CIT(data_per_y, "kci")
#     pValue = kci_obj(0,2,set([]))
#     print(0,2,())
#     print(pValue)
#     if pValue < 0.05:
#         continue
#     pValue = kci_obj(0,2,set([1]))
#     print(0,2,(1))
#     print(pValue)
#     if pValue < 0.05:
#         break


####################case 3 (selection)########################
# for i in range(10):
#     mu = 2
#     mu1 = 6
#     mus = 3
#     sigma_x = random.uniform(0,2)
#     sigma_y = random.uniform(1,3)
#     sigma_l = random.uniform(1,3)
#     sigma_s = random.uniform(3,6)
#     num_sample = 4000

#     l1 = random.uniform(1,3)
#     l2 = random.uniform(1,2)
#     s1 = random.uniform(1,3)
#     s2 = random.uniform(2,5)
#     a_sx = random.uniform(0,5)
#     b_sx = random.uniform(0,10)
#     c_sx = random.uniform(5,15)
#     a_sy = random.uniform(0,5)
#     b_sy = random.uniform(0,10)
#     c_sy = random.uniform(5,15)

#     Ex = np.random.normal(mu,sigma_x,num_sample)
#     Ey = np.random.normal(mu1,sigma_y,num_sample)
#     El = np.random.normal(mu,sigma_l,num_sample)
#     Es = np.random.normal(mus,sigma_s,num_sample)
#     Esy = np.random.normal(mu,sigma_s,num_sample)
#     S1, de1 = choose_function()
#     S2, de2 = choose_function()

#     c = np.zeros(4000)
#     x = Ex
#     y = Ey
#     mask = (S1(de1,x) + S2(de2,y) + Es > 60) & (S1(de1,x) + S2(de2,y) + Es < 100)
#     print(S1(de1,x) + S2(de2,y) + Es)
#     x = x[mask]
#     y = y[mask]
#     c = c[mask]
#     o_data = np.stack((x,y,c),axis=1)

#     per_cx = np.ones(4000)
#     Es_per_x = np.random.normal(mu,sigma_s,num_sample)
#     do_x = np.zeros(4000)
#     Ey_per = np.random.normal(mu1,sigma_y,num_sample)
#     per_y = Ey_per
#     mask_per_x = (S1(de1,do_x) + S2(de2,per_y) + Es_per_x > 60) & (S1(de1,do_x) + S2(de2,per_y) + Es_per_x < 100)
#     # print(do_x * do_x + per_y * per_y + Es_per_x)
#     do_x = do_x[mask_per_x]
#     per_y = per_y[mask_per_x]
#     per_cx = per_cx[mask_per_x]
#     pertub_data_x = np.stack((do_x,per_y, per_cx), axis=1)
#     print(pertub_data_x.shape)
#     data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
#     np.save('./non_linear_gaussian/case3_do(x).npy', data_per_x)
#     print(data_per_x.shape)

#     kci_obj = CIT(data_per_x, "kci")
#     pValue = kci_obj(1,2,set([]))
#     print(1,2,())
#     print(pValue)
#     if pValue > 0.05:
#         continue
#     pValue = kci_obj(1,2,set([0]))
#     print(1,2,(0))
#     print(pValue)
#     if pValue < 0.05:
#         continue

#     per_cy = np.ones(4000)
#     Es_per_y = np.random.normal(mu,sigma_s,num_sample)
#     do_y = np.zeros(4000)
#     Ex_per = np.random.normal(mu,sigma_x,num_sample)
#     per_x = Ex_per
#     mask_per_y = (S1(de1,per_x) + S2(de2,do_y) + Es_per_y > 60) & (S1(de1,per_x) + S2(de2,do_y) + Es_per_y < 100)
#     per_x = per_x[mask_per_y]
#     do_y = do_y[mask_per_y]
#     per_cy = per_cy[mask_per_y]
#     pertub_data_y = np.stack((per_x,do_y, per_cy), axis=1)
#     print(pertub_data_y.shape)
#     data_per_y = np.concatenate((o_data,pertub_data_y), axis = 0)
#     np.save('./non_linear_gaussian/case3_do(y).npy', data_per_y)
#     print(data_per_y.shape)

#     kci_obj = CIT(data_per_y, "kci")
#     pValue = kci_obj(0,2,set([]))
#     print(0,2,())
#     print(pValue)
#     if pValue > 0.05:
#         continue
#     pValue = kci_obj(0,2,set([1]))
#     print(0,2,(1))
#     print(pValue)
#     if pValue > 0.05:
#         break

####################case 4 (casue with selection)########################
# for i in range(10):
#     print("########")
#     mu = 1
#     mu1 = 2
#     mus = 3
#     sigma_x = random.uniform(0,1)
#     sigma_y = random.uniform(1,3)
#     sigma_l = random.uniform(1,3)
#     sigma_s = random.uniform(3,6)
#     num_sample = 4000

#     l1 = random.uniform(1,3)
#     l2 = random.uniform(1,2)
#     s1 = random.uniform(1,3)
#     s2 = random.uniform(2,5)
#     a_c = random.uniform(-3,3)
#     b_c = random.uniform(-5,5)
#     c_c = random.uniform(0,5)
#     a_sx = random.uniform(0,5)
#     b_sx = random.uniform(0,10)
#     c_sx = random.uniform(5,15)
#     a_sy = random.uniform(0,5)
#     b_sy = random.uniform(0,10)
#     c_sy = random.uniform(5,15)

#     Ex = np.random.normal(mu,sigma_x,num_sample)
#     Ey = np.random.normal(mu1,sigma_y,num_sample)
#     El = np.random.normal(mu,sigma_l,num_sample)
#     Es = np.random.normal(mus,sigma_s,num_sample)
#     Esy = np.random.normal(mu,sigma_s,num_sample)
#     S1, de1 = choose_function()
#     S2, de2 = choose_function()
#     non_linear,de = choose_function()

#     c = np.zeros(4000)
#     x = Ex 
#     y = Ey + non_linear(de,x)
#     mask = (S1(de1,x) + S2(de2,y) + Es > 0) & (S1(de1,x) + S2(de2,y) + Es < 100)
#     print(S1(de1,x) + S2(de2,y) + Es)
#     x = x[mask]
#     y = y[mask]
#     c = c[mask]
#     o_data = np.stack((x,y,c),axis=1)

#     per_cx = np.ones(4000)
#     Es_per_x = np.random.normal(mu,sigma_s,num_sample)
#     do_x = np.zeros(4000)
#     Ey_per = np.random.normal(mu1,sigma_y,num_sample)
#     per_y = Ey_per + non_linear(de, do_x)
#     mask_per_x = (S1(de1,do_x) + S2(de2,per_y) + Es_per_x > 0) & (S1(de1,do_x) + S2(de2,per_y) + Es_per_x < 100)
#     do_x = do_x[mask_per_x]
#     per_y = per_y[mask_per_x]
#     per_cx = per_cx[mask_per_x]
#     pertub_data_x = np.stack((do_x,per_y, per_cx), axis=1)
#     data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
#     np.save('./non_linear_gaussian/case4_do(x).npy', data_per_x)
#     print(pertub_data_x.shape)
#     print(data_per_x.shape)

#     kci_obj = CIT(data_per_x, "kci")
#     pValue = kci_obj(1,2,set([]))
#     print(1,2,())
#     print(pValue)
#     if pValue > 0.05:
#         continue
#     pValue = kci_obj(1,2,set([0]))
#     print(1,2,(0))
#     print(pValue)
#     if pValue < 0.05:
#         continue


#     per_cy = np.ones(4000)
#     Es_per_y = np.random.normal(mu,sigma_s,num_sample)
#     do_y = np.zeros(4000)
#     Ex_per = np.random.normal(mu,sigma_x,num_sample)
#     per_x = Ex_per
#     mask_per_y = (S1(de1,per_x) + S2(de2,do_y) + Es_per_y > 0) & (S1(de1,per_x) + S2(de2,do_y) + Es_per_y < 100)
#     per_x = per_x[mask_per_y]
#     do_y = do_y[mask_per_y]
#     per_cy = per_cy[mask_per_y]
#     pertub_data_y = np.stack((per_x,do_y, per_cy), axis=1)
#     data_per_y = np.concatenate((o_data,pertub_data_y), axis = 0)
#     np.save('./non_linear_gaussian/case4_do(y).npy', data_per_y)
#     print(pertub_data_y.shape)
#     print(data_per_y.shape)

#     kci_obj = CIT(data_per_y, "kci")
#     pValue = kci_obj(0,2,set([]))
#     print(0,2,())
#     print(pValue)
#     if pValue > 0.05:
#         continue
#     pValue = kci_obj(0,2,set([1]))
#     print(0,2,(1))
#     print(pValue)
#     if pValue < 0.05:
#         break


# #####################case 5 (casue with latent)########################
# for i in range(10):
#     mu = 2
#     mu1 = 6
#     mus = 3
#     sigma_x = random.uniform(0,2)
#     sigma_y = random.uniform(2,4)
#     sigma_l = random.uniform(1,3)
#     sigma_s = random.uniform(3,6)
#     num_sample = 2000

#     l1 = random.uniform(1,3)
#     l2 = random.uniform(1,2)
#     s1 = random.uniform(1,3)
#     s2 = random.uniform(2,5)
#     a_c = random.uniform(-3,3)
#     b_c = random.uniform(-5,5)
#     c_c = random.uniform(0,5)
#     a_lx = random.uniform(0,5)
#     b_lx = random.uniform(0,10)
#     c_lx = random.uniform(5,15)
#     a_ly = random.uniform(0,5)
#     b_ly = random.uniform(0,10)
#     c_ly = random.uniform(5,15)

#     Ex = np.random.normal(mu,sigma_x,num_sample)
#     Ey = np.random.normal(mu1,sigma_y,num_sample)
#     El = np.random.normal(mu,sigma_l,num_sample)
#     Es = np.random.normal(mus,sigma_s,num_sample)
#     L1, de1 = choose_function()
#     L2, de2 = choose_function()
#     non_linear,de = choose_function()

#     L = El
#     c = np.zeros(2000)
#     x = Ex + L1(0, de1, L)
#     y = L2(0, de2, L) + non_linear(0,de,x) + Ey
#     o_data = np.stack((x,y,c),axis=1)

#     per_cx = np.ones(2000)
#     do_x = np.zeros(2000)
#     Ey_per = np.random.normal(mu1,sigma_y,num_sample)
#     El_per_x = np.random.normal(mu,sigma_l,num_sample)
#     per_y = Ey_per + L2(0, de2, El_per_x) + non_linear(0, de, do_x)
#     pertub_data_x = np.stack((do_x, per_y, per_cx), axis=1)
#     data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
#     np.save('./non_linear_gaussian/case5_do(x).npy', data_per_x)
#     kci_obj = CIT(data_per_x, "kci")
#     pValue = kci_obj(1,2,set([]))
#     print(1,2,())
#     print(pValue)
#     if pValue > 0.05:
#         continue
#     pValue = kci_obj(1,2,set([0]))
#     print(1,2,(0))
#     print(pValue)
#     if pValue > 0.05:
#         continue

#     per_cy = np.ones(2000)
#     do_y = np.zeros(2000)
#     Ex_per = np.random.normal(mu,sigma_x,num_sample)
#     El_per_y = np.random.normal(mu,sigma_l,num_sample)
#     per_x = Ex_per + L1(0, de1, El_per_y)
#     perturb_data_y = np.stack((per_x,do_y,per_cy), axis = 1)
#     data_per_y = np.concatenate((o_data,perturb_data_y), axis = 0)
#     np.save('./non_linear_gaussian/case5_do(y).npy', data_per_y)

#     kci_obj = CIT(data_per_y, "kci")
#     pValue = kci_obj(0,2,set([]))
#     print(0,2,())
#     print(pValue)
#     if pValue < 0.05:
#         continue
#     pValue = kci_obj(0,2,set([1]))
#     print(0,2,(1))
#     print(pValue)
#     if pValue < 0.05:
#         break

    
        

#####################case 6 (selection with latent)########################

# for i in range(10):
#     mu = 2
#     mu1 = 6
#     mus = 3
#     sigma_x = random.uniform(0,2)
#     sigma_y = random.uniform(2,4)
#     sigma_l = random.uniform(1,3)
#     sigma_s = random.uniform(3,6)
#     num_sample = 4000

#     l1 = random.uniform(1,3)
#     l2 = random.uniform(1,2)
#     s1 = random.uniform(1,3)
#     s2 = random.uniform(2,5)
#     a_c = random.uniform(-3,3)
#     b_c = random.uniform(-5,5)
#     c_c = random.uniform(0,5)
#     a_lx = random.uniform(-2,2)
#     b_lx = random.uniform(-5,5)
#     c_lx = random.uniform(0,5)
#     a_ly = random.uniform(-2,2)
#     b_ly = random.uniform(-5,5)
#     c_ly = random.uniform(0,5)
#     a_sx = random.uniform(-3,3)
#     b_sx = random.uniform(0,5)
#     c_sx = random.uniform(0,5)
#     a_sy = random.uniform(-3,3)
#     b_sy = random.uniform(0,5)
#     c_sy = random.uniform(0,5)

#     Ex = np.random.normal(mu,sigma_x,num_sample)
#     Ey = np.random.normal(mu1,sigma_y,num_sample)
#     El = np.random.normal(mu,sigma_l,num_sample)
#     Es = np.random.normal(mus,sigma_s,num_sample)
#     L1, de1 = choose_function()
#     L2, de2 = choose_function()

#     S1, ds1 = choose_function()
#     S2, ds2 = choose_function()

#     L = El
#     c = np.zeros(4000)
#     x = Ex + L1(0, de1, L)
#     y = Ey + L2(0, de2, L)
#     mask = (S1(-2, ds1,x) + S2(-2, ds2,y) + Es > 0) & (S1(-2, ds1,x) + S2(-2, ds2,y)  + Es < 100)
#     print(S1(-2, ds1,x) + S2(-2, ds2,y) + Es)
#     x = x[mask]
#     y = y[mask]
#     c = c[mask]
#     o_data = np.stack((x,y,c),axis=1)

#     per_cx = np.ones(4000)
#     El_per_x = np.random.normal(mu,sigma_l,num_sample)
#     Es_per_x = np.random.normal(mu,sigma_s,num_sample)
#     do_x = np.zeros(4000)
#     Ey_per = np.random.normal(mu1,sigma_y,num_sample)
#     per_y = Ey_per + L2(0, de2, El_per_x)
#     mask_per_x = (S1(-2, ds1,do_x) + S2(-2, ds2,per_y) + Es_per_x > 0) & (S1(-2, ds1,do_x) + S2(-2, ds2,per_y) + Es_per_x < 100)
#     do_x = do_x[mask_per_x]
#     per_y = per_y[mask_per_x]
#     per_cx = per_cx[mask_per_x]
#     pertub_data_x = np.stack((do_x,per_y, per_cx), axis=1)
#     data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
#     print(o_data.shape)
#     print(data_per_x.shape)
#     np.save('./non_linear_gaussian/case6_do(x).npy', data_per_x)

#     kci_obj = CIT(data_per_x, "kci")
#     pValue = kci_obj(1,2,set([]))
#     print(1,2,())
#     print(pValue)
#     if pValue > 0.05:
#         continue
#     pValue = kci_obj(1,2,set([0]))
#     print(1,2,(0))
#     print(pValue)
#     if pValue > 0.05:
#         continue

#     per_cy = np.ones(4000)
#     El_per_y = np.random.normal(mu,sigma_l,num_sample)
#     Es_per_y = np.random.normal(mu,sigma_s,num_sample)
#     do_y = np.zeros(4000)
#     Ex_per = np.random.normal(mu,sigma_x,num_sample)
#     per_x = Ex_per + L1(0, de1, El_per_y)
#     mask_per_y = (S1(-2, ds1,per_x) + S2(-2, ds2, do_y) + Es_per_y > 0) & (S1(-2, ds1,per_x) + S2(-2, ds2, do_y) + Es_per_y < 100)
#     per_x = per_x[mask_per_y]
#     do_y = do_y[mask_per_y]
#     per_cy = per_cy[mask_per_y]
#     pertub_data_y = np.stack((per_x,do_y, per_cy), axis=1)
#     data_per_y = np.concatenate((o_data,pertub_data_y), axis = 0)
#     np.save('./non_linear_gaussian/case6_do(y).npy', data_per_y)
#     print(data_per_y.shape)

#     kci_obj = CIT(data_per_y, "kci")
#     pValue = kci_obj(0,2,set([]))
#     print(0,2,())
#     print(pValue)
#     if pValue > 0.05:
#         continue
#     pValue = kci_obj(0,2,set([1]))
#     print(0,2,(1))
#     print(pValue)
#     if pValue < 0.05:
#         break

   

#####################case 7 (cause with selection and latent)########################
# for i in range(10):
#     mu = 2
#     mu1 = 6
#     mus = 3
#     sigma_x = random.uniform(0,2)
#     sigma_y = random.uniform(2,4)
#     sigma_l = random.uniform(1,3)
#     sigma_s = random.uniform(3,6)
#     num_sample = 4000

#     l1 = random.uniform(1,3)
#     l2 = random.uniform(1,2)
#     s1 = random.uniform(1,3)
#     s2 = random.uniform(2,5)
#     a_c = random.uniform(-3,3)
#     b_c = random.uniform(-5,5)
#     c_c = random.uniform(0,5)
#     a_lx = random.uniform(-2,2)
#     b_lx = random.uniform(-5,5)
#     c_lx = random.uniform(0,5)
#     a_ly = random.uniform(-2,2)
#     b_ly = random.uniform(-5,5)
#     c_ly = random.uniform(0,5)
#     a_sx = random.uniform(-3,3)
#     b_sx = random.uniform(0,5)
#     c_sx = random.uniform(0,5)
#     a_sy = random.uniform(-3,3)
#     b_sy = random.uniform(0,5)
#     c_sy = random.uniform(0,5)

#     Ex = np.random.normal(mu,sigma_x,num_sample)
#     Ey = np.random.normal(mu1,sigma_y,num_sample)
#     El = np.random.normal(mu,sigma_l,num_sample)
#     Es = np.random.normal(mus,sigma_s,num_sample)
#     L1, de1 = choose_function()
#     L2, de2 = choose_function()

#     S1, ds1 = choose_function()
#     S2, ds2 = choose_function()
#     non_linear,de = choose_function()
#     L = El
#     c = np.zeros(4000)
#     x = Ex + L1(0, de1, L)
#     y = Ey + L2(0, de2, L) + non_linear(0, de, x)
#     mask = (S1(-2, ds1, x) + S2(-2, ds2, y)+ Es > 0) & (S1(-2, ds1, x) + S2(-2, ds2, y) + Es < 100)
#     print(S1(-2, ds1, x) + S2(-2, ds2, y)+ Es)
#     x = x[mask]
#     y = y[mask]
#     c = c[mask]
#     o_data = np.stack((x,y,c),axis=1)
#     # print(o_data)

#     per_cx = np.ones(4000)
#     El_per_x = np.random.normal(mu,sigma_l,num_sample)
#     Es_per_x = np.random.normal(mus,sigma_s,num_sample)
#     do_x = np.zeros(4000)
#     Ey_per = np.random.normal(mu1,sigma_y,num_sample)
#     per_y = Ey_per + L2(0, de2, El_per_x) + non_linear(0, de, do_x)
#     mask_per_x = (S1(-2, ds1,do_x) + S2(-2, ds2,per_y) + Es_per_x > 0) & (S1(-2, ds1,do_x) + S2(-2, ds2,per_y) + Es_per_x < 100)
#     do_x = do_x[mask_per_x]
#     per_y = per_y[mask_per_x]
#     per_cx = per_cx[mask_per_x]
#     pertub_data_x = np.stack((do_x,per_y, per_cx), axis=1)
#     data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
#     np.save('./non_linear_gaussian/case7_do(x).npy', data_per_x)
#     print(pertub_data_x.shape)
#     print(data_per_x.shape)
#     kci_obj = CIT(data_per_x, "kci")
#     pValue = kci_obj(1,2,set([]))
#     print(1,2,())
#     print(pValue)
#     if pValue > 0.05:
#         continue
#     pValue = kci_obj(1,2,set([0]))
#     print(1,2,(0))
#     print(pValue)
#     if pValue > 0.05:
#         continue

#     per_cy = np.ones(4000)
#     El_per_y = np.random.normal(mu,sigma_l,num_sample)
#     Es_per_y = np.random.normal(mus,sigma_s,num_sample)
#     do_y = np.zeros(4000)
#     Ex_per = np.random.normal(mu,sigma_x,num_sample)
#     per_x = Ex_per + L1(0, de1, El_per_y)
#     mask_per_y = (S1(-2, ds1,per_x) + S2(-2, ds2, do_y) + Es_per_y > 0) & (S1(-2, ds1,per_x) + S2(-2, ds2, do_y) + Es_per_y < 100)
#     print(S1(-2, ds1,per_x) + S2(-2, ds2, do_y) + Es_per_y)
#     per_x = per_x[mask_per_y]
#     do_y = do_y[mask_per_y]
#     per_cy = per_cy[mask_per_y]
#     pertub_data_y = np.stack((per_x,do_y, per_cy), axis=1)
#     data_per_y = np.concatenate((o_data,pertub_data_y), axis = 0)
#     np.save('./non_linear_gaussian/case7_do(y).npy', data_per_y)
#     print(pertub_data_y.shape)
#     print(data_per_y.shape)
#     kci_obj = CIT(data_per_y, "kci")
#     pValue = kci_obj(0,2,set([]))
#     print(0,2,())
#     print(pValue)
#     if pValue > 0.05:
#         continue
#     pValue = kci_obj(0,2,set([1]))
#     print(0,2,(1))
#     print(pValue)
#     if pValue < 0.05:
#         break


############## non-linear non-gaussian ################
#########x-y ###########
####################case 1 (cause)#####################
# for i in range(10):
#     startx = 1
#     endx = 3
#     starty = 3
#     endy = 6
#     startl = 7
#     endl = 9
#     starts = 2
#     ends = 4
#     num_sample = 4000

#     l1 = random.uniform(4,6)
#     l2 = random.uniform(4,6)
#     s1 = random.uniform(-1,3)
#     s2 = random.uniform(1,2)
#     Ex = np.random.uniform(startx,endx,num_sample)
#     Ey = np.random.uniform(starty,endy,num_sample)
#     El = np.random.uniform(startl,endl,num_sample)
#     Es = np.random.uniform(starts,ends,num_sample)

#     non_linear,de, cof = choose_function()

#     x = Ex
#     c = np.zeros(4000)
#     y = non_linear(cof, de, x) + Ey
#     # print(y)
#     o_data =  np.stack((x,y,c), axis = 1)

#     per_cx = np.ones(4000)
#     do_x = np.zeros(4000)
#     Ey_per = np.random.uniform(starty, endy,num_sample)
#     per_y = Ey_per + non_linear(cof, de, do_x)
#     print(per_y)
#     pertub_data_x = np.stack((do_x,Ey_per, per_cx), axis=1)
#     data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
#     # print(data_per_x.shape)
#     np.save('./non_linear_nongaussian/case1_do(x).npy', data_per_x)
#     kci_obj = CIT(data_per_x, "kci")
#     pValue = kci_obj(1,2,set([]))
#     print(1,2,())
#     print(pValue)
#     if pValue > 0.05:
#         continue
#     pValue = kci_obj(1,2,set([0]))
#     print(1,2,(0))
#     print(pValue)
#     if pValue < 0.05:
#         continue


#     per_cy = np.ones(4000)
#     do_y = np.zeros(4000)
#     Ex_per = np.random.uniform(startx,endx,num_sample)
#     per_x = Ex_per
#     perturb_data_y = np.stack((per_x,do_y,per_cy), axis = 1)
#     data_per_y = np.concatenate((o_data,perturb_data_y), axis = 0)
#     np.save('./non_linear_nongaussian/case1_do(y).npy', data_per_y)
#     kci_obj = CIT(data_per_y, "kci")
#     pValue = kci_obj(0,2,set([]))
#     print(0,2,())
#     print(pValue)
#     if pValue < 0.05:
#         continue
#     pValue = kci_obj(0,2,set([1]))
#     print(0,2,(1))
#     print(pValue)
#     if pValue < 0.05:
#         break

####################case 2 (latent)########################
# for i in range(10):
#     startx = 1
#     endx = 3
#     starty = 2
#     endy = 4
#     startl = 4
#     endl = 6
#     starts = 2
#     ends = 4
#     num_sample = 4000

#     Ex = np.random.uniform(startx,endx,num_sample)
#     Ey = np.random.uniform(starty,endy,num_sample)
#     # plt.hist(Ey, bins=30)
#     # plt.show

#     El = np.random.uniform(startl,endl,num_sample)
   

#     L1, de1, cof1 = choose_function()
#     L2, de2, cof2 = choose_function()

    
#     L = El
#     c = np.zeros(num_sample)
#     x = Ex + L1(cof1, de1, L)
#     y = Ey + L2(cof2, de2, L)
#     o_data = np.stack((x,y,c),axis=1)
#     # plt.hist(L2(cof2, de2, L))
#     # plt.show()
#     per_cx = np.ones(num_sample)
#     do_x = np.zeros(num_sample)
#     Ey_per = np.random.uniform(starty,endy,num_sample)
#     El_per_x = np.random.uniform(startl,endl,num_sample)
#     # plt.hist(L2(cof2, de2, El_per_x))
#     # plt.show()
#     per_y = Ey_per + L2(cof2, de2, El_per_x)
#     # import pdb
#     # pdb.set_trace()
#     pertub_data_x = np.stack((do_x,per_y, per_cx), axis=1)
#     data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
#     np.save('./non_linear_nongaussian/case2_do(x).npy', data_per_x)
#     # plt.scatter(data_per_x[:,2].reshape(-1), data_per_x[:,1].reshape(-1))
#     # print(data_per_x)
#     # plt.scatter(data_per_x[:,1].reshape(-1), data_per_x[:,2].reshape(-1))
#     # plt.show()
#     kci_obj = CIT(data_per_x, "kci")
#     pValue = kci_obj(1,2,set([]))
#     print(1,2,())
#     print(pValue)
#     if pValue < 0.05:
#         continue
#     pValue = kci_obj(1,2,set([0]))
#     print(1,2,(0))
#     print(pValue)
#     if pValue > 0.05:
#         continue

#     per_cy = np.ones(4000)
#     do_y = np.zeros(4000)
#     Ex_per = np.random.uniform(startx,endx,num_sample)
#     El_per_y = np.random.uniform(startl,endl,num_sample)
#     per_x = Ex_per + L1(cof1, de1, El_per_y)
#     perturb_data_y = np.stack((per_x,do_y,per_cy), axis = 1)
#     data_per_y = np.concatenate((o_data,perturb_data_y), axis = 0)
#     np.save('./non_linear_nongaussian/case2_do(y).npy', data_per_y)

#     kci_obj = CIT(data_per_y, "kci")
#     pValue = kci_obj(0,2,set([]))
#     print(0,2,())
#     print(pValue)
#     if pValue < 0.05:
#         continue
#     pValue = kci_obj(0,2,set([1]))
#     print(0,2,(1))
#     print(pValue)
#     if pValue < 0.05:
#         break

####################case 3 (selection)########################
# for i in range(10):
#     startx = 1
#     endx = 3
#     starty = 3
#     endy = 4
#     startl = 5
#     endl = 8
#     starts = 2
#     ends = 4
#     num_sample = 4000

#     Ex = np.random.uniform(startx,endx,num_sample)
#     Ey = np.random.uniform(starty,endy,num_sample)
#     El = np.random.uniform(startl,endl,num_sample)
#     Es = np.random.uniform(starts,ends,num_sample)
#     S1, de1, cof1 = choose_function(0)
#     S2, de2, cof2 = choose_function(-2)
#     c = np.zeros(4000)
#     x = Ex
#     y = Ey
#     mask = (S1(cof1, de1,x) + S2(cof2, de2,y) + Es > 0) & (S1(cof1, de1,x) + S2(cof2, de2,y) + Es < 50)
#     print(S1(cof1, de1,x) + S2(cof2, de2,y) + Es)
#     x = x[mask]
#     y = y[mask]
#     c = c[mask]
#     o_data = np.stack((x,y,c),axis=1)

#     per_cx = np.ones(4000)
#     Es_per_x = np.random.uniform(starts,ends,num_sample)
#     do_x = np.zeros(4000)
#     Ey_per = np.random.uniform(starty,endy,num_sample)
#     per_y = Ey_per
#     mask_per_x = (S1(cof1, de1,do_x) + S2(cof2, de2,per_y) + Es_per_x > 0) & (S1(cof1, de1,do_x) + S2(cof2, de2,per_y) + Es_per_x < 50)
#     print(S1(cof1, de1,do_x) + S2(cof2, de2,per_y) + Es_per_x)
#     do_x = do_x[mask_per_x]
#     per_y = per_y[mask_per_x]
#     per_cx = per_cx[mask_per_x]
#     pertub_data_x = np.stack((do_x,per_y, per_cx), axis=1)
#     print(pertub_data_x.shape)
#     data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
#     np.save('./non_linear_nongaussian/case3_do(x).npy', data_per_x)
#     print(data_per_x.shape)
#     kci_obj = CIT(data_per_x, "kci")
#     pValue = kci_obj(1,2,set([]))
#     print(1,2,())
#     print(pValue)
#     if pValue > 0.05:
#         continue
#     pValue = kci_obj(1,2,set([0]))
#     print(1,2,(0))
#     print(pValue)
#     if pValue < 0.05:
#         continue

#     per_cy = np.ones(4000)
#     Es_per_y = np.random.uniform(starts,ends,num_sample)
#     do_y = np.zeros(4000)
#     Ex_per = np.random.uniform(startx,endx,num_sample)
#     per_x = Ex_per
#     mask_per_y = (S1(cof1, de1, per_x) + S2(cof2, de2, do_y) + Es_per_y > 0) & (S1(cof1, de1,per_x) + S2(cof2, de2,do_y) + Es_per_y < 50)
#     per_x = per_x[mask_per_y]
#     do_y = do_y[mask_per_y]
#     per_cy = per_cy[mask_per_y]
#     pertub_data_y = np.stack((per_x,do_y, per_cy), axis=1)
#     print(pertub_data_y.shape)
#     data_per_y = np.concatenate((o_data,pertub_data_y), axis = 0)
#     np.save('./non_linear_nongaussian/case3_do(y).npy', data_per_y)
#     print(data_per_y.shape)

#     kci_obj = CIT(data_per_y, "kci")
#     pValue = kci_obj(0,2,set([]))
#     print(0,2,())
#     print(pValue)
#     if pValue > 0.05:
#         continue
#     pValue = kci_obj(0,2,set([1]))
#     print(0,2,(1))
#     print(pValue)
#     if pValue > 0.05:
#         break

####################case 4 (casue with selection)########################
# for i in range(10):
#     startx = 1
#     endx = 2
#     starty = 3
#     endy = 6
#     startl = 7
#     endl = 9
#     starts = 2
#     ends = 4
#     num_sample = 4000

#     l1 = random.uniform(4,6)
#     l2 = random.uniform(4,6)
#     s1 = random.uniform(-1,3)
#     s2 = random.uniform(1,2)
#     Ex = np.random.uniform(startx,endx,num_sample)
#     Ey = np.random.uniform(starty,endy,num_sample)
#     El = np.random.uniform(startl,endl,num_sample)
#     Es = np.random.uniform(starts,ends,num_sample)
#     S1, de1 = choose_function()
#     S2, de2 = choose_function()
#     non_linear,de = choose_function()

#     c = np.zeros(4000)
#     x = Ex 
#     y = Ey + non_linear(0, de, x)
#     mask = (S1(-2, de1,x) + S2(-2, de2,y) + Es > 5) & (S1(-2, de1,x) + S2(-2, de2,y) + Es < 70)
#     print(S1(-2, de1,x) + S2(-2, de2,y) + Es)
#     x = x[mask]
#     y = y[mask]
#     c = c[mask]
#     o_data = np.stack((x,y,c),axis=1)

#     per_cx = np.ones(4000)
#     Es_per_x = np.random.uniform(starts,ends,num_sample)
#     do_x = np.zeros(4000)
#     Ey_per = np.random.uniform(starty,endy,num_sample)
#     per_y = Ey_per + non_linear(0, de, do_x)
#     mask_per_x = (S1(-2, de1,do_x) + S2(-2, de2,per_y) + Es_per_x > 5) & (S1(-2, de1,do_x) + S2(-2, de2,per_y) + Es_per_x < 70)
#     print(S1(-2, de1,do_x) + S2(-2, de2,per_y) + Es_per_x)
#     do_x = do_x[mask_per_x]
#     per_y = per_y[mask_per_x]
#     per_cx = per_cx[mask_per_x]
#     pertub_data_x = np.stack((do_x,per_y, per_cx), axis=1)
#     data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
#     np.save('./non_linear_nongaussian/case4_do(x).npy', data_per_x)
#     print(pertub_data_x.shape)
#     print(data_per_x.shape)

#     kci_obj = CIT(data_per_x, "kci")
#     pValue = kci_obj(1,2,set([]))
#     print(1,2,())
#     print(pValue)
#     if pValue > 0.05:
#         continue
#     pValue = kci_obj(1,2,set([0]))
#     print(1,2,(0))
#     print(pValue)
#     if pValue < 0.05:
#         continue

#     per_cy = np.ones(4000)
#     Es_per_y = np.random.uniform(starts,ends,num_sample)
#     do_y = np.zeros(4000)
#     Ex_per = np.random.uniform(startx,endx,num_sample)
#     per_x = Ex_per
#     mask_per_y = (S1(-2, de1,per_x) + S2(-2, de2,do_y) + Es_per_y > 5) & (S1(-2, de1,per_x) + S2(-2, de2,do_y) + Es_per_y < 70)
#     per_x = per_x[mask_per_y]
#     do_y = do_y[mask_per_y]
#     per_cy = per_cy[mask_per_y]
#     pertub_data_y = np.stack((per_x,do_y, per_cy), axis=1)
#     data_per_y = np.concatenate((o_data,pertub_data_y), axis = 0)
#     np.save('./non_linear_nongaussian/case4_do(y).npy', data_per_y)
#     print(pertub_data_y.shape)
#     print(data_per_y.shape)
#     kci_obj = CIT(data_per_y, "kci")
#     pValue = kci_obj(0,2,set([]))
#     print(0,2,())
#     print(pValue)
#     if pValue > 0.05:
#         continue
#     pValue = kci_obj(0,2,set([1]))
#     print(0,2,(1))
#     print(pValue)
#     if pValue < 0.05:
#         break

# #####################case 5 (casue with latent)########################
# for i in range(10):
#     startx = 1
#     endx = 3
#     starty = 3
#     endy = 6
#     startl = 1
#     endl = 3
#     starts = 2
#     ends = 4
#     num_sample = 4000

#     l1 = random.uniform(4,6)
#     l2 = random.uniform(4,6)
#     s1 = random.uniform(-1,3)
#     s2 = random.uniform(1,2)
#     Ex = np.random.uniform(startx,endx,num_sample)
#     Ey = np.random.uniform(starty,endy,num_sample)
#     El = np.random.uniform(startl,endl,num_sample)
#     Es = np.random.uniform(starts,ends,num_sample)

#     L1, de1, cof1= choose_function()
#     L2, de2, cof2 = choose_function()
#     non_linear,de, cof_c = choose_function()

#     L = El
#     c = np.zeros(4000)
#     x = Ex + L1(cof1, de1, L)
#     y = L2(cof2, de2, L) + non_linear(cof_c,de,x) + Ey
#     o_data = np.stack((x,y,c),axis=1)

#     per_cx = np.ones(4000)
#     do_x = np.zeros(4000)
#     Ey_per = np.random.uniform(starty,endy,num_sample)
#     El_per_x = np.random.uniform(startl,endl,num_sample)
#     per_y = Ey_per + L2(cof2, de2, El_per_x) + non_linear(cof_c, de, do_x)
#     pertub_data_x = np.stack((do_x, per_y, per_cx), axis=1)
#     data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
#     np.save('./non_linear_nongaussian/case5_do(x).npy', data_per_x)

#     kci_obj = CIT(data_per_x, "kci")
#     pValue = kci_obj(1,2,set([]))
#     print(1,2,())
#     print(pValue)
#     if pValue > 0.05:
#         continue
#     pValue = kci_obj(1,2,set([0]))
#     print(1,2,(0))
#     print(pValue)
#     if pValue > 0.05:
#         continue

#     per_cy = np.ones(4000)
#     do_y = np.zeros(4000)
#     Ex_per = np.random.uniform(startx,endx,num_sample)
#     El_per_y = np.random.uniform(startl,endl,num_sample)
#     per_x = Ex_per + L1(cof1, de1, El_per_y)
#     perturb_data_y = np.stack((per_x,do_y,per_cy), axis = 1)
#     data_per_y = np.concatenate((o_data,perturb_data_y), axis = 0)
#     np.save('./non_linear_nongaussian/case5_do(y).npy', data_per_y)

#     kci_obj = CIT(data_per_y, "kci")
#     pValue = kci_obj(0,2,set([]))
#     print(0,2,())
#     print(pValue)
#     if pValue < 0.05:
#         continue
#     pValue = kci_obj(0,2,set([1]))
#     print(0,2,(1))
#     print(pValue)
#     if pValue < 0.05:
#         break

#####################case 6 (selection with latent)########################
# for i in range(10):
#     startx = 0
#     endx = 2
#     starty = 1
#     endy = 3
#     startl = 0
#     endl = 2
#     starts = 1
#     ends = 3
#     num_sample = 4000


#     Ex = np.random.uniform(startx,endx,num_sample)
#     Ey = np.random.uniform(starty,endy,num_sample)
#     El = np.random.uniform(startl,endl,num_sample)
#     Es = np.random.uniform(starts,ends,num_sample)

#     L1, de1, cof_l1 = choose_function()
#     L2, de2, cof_l2 = choose_function()

#     S1, ds1, cof_s1 = choose_function()
#     S2, ds2, cof_s2 = choose_function(-2)

#     L = El
#     c = np.zeros(4000)
#     x = Ex + L1(cof_l1, de1, L)
#     y = Ey + L2(cof_l2, de2, L)
#     mask = (S1(cof_s1, ds1,x) + S2(cof_s2, ds2,y) + Es  > 0) & (S1(cof_s1, ds1,x) + S2(cof_s2, ds2,y) + Es  < 200)
#     print(S1(cof_s1, ds1,x) + S2(cof_s2, ds2,y) + Es )
#     x = x[mask]
#     y = y[mask]
#     c = c[mask]
#     o_data = np.stack((x,y,c),axis=1)

#     per_cx = np.ones(4000)
#     El_per_x = np.random.uniform(startl,endl,num_sample)
#     Es_per_x = np.random.uniform(starts,ends,num_sample)
#     do_x = np.zeros(4000)
#     Ey_per = np.random.uniform(starty,endy,num_sample)
#     per_y = Ey_per + L2(cof_l2, de2, El_per_x)
#     mask_per_x = (S1(cof_s1, ds1,do_x) + S2(cof_s2, ds2,per_y) + Es_per_x > 0) & (S1(cof_s1, ds1,do_x) + S2(cof_s2, ds2,per_y) + Es_per_x < 200)
#     print(S1(cof_s1, ds1,do_x) + S2(cof_s2, ds2,per_y))
#     do_x = do_x[mask_per_x]
#     per_y = per_y[mask_per_x]
#     per_cx = per_cx[mask_per_x]
#     pertub_data_x = np.stack((do_x,per_y, per_cx), axis=1)
#     data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
#     np.save('./non_linear_nongaussian/case6_do(x).npy', data_per_x)
#     print(o_data.shape)
#     print(pertub_data_x.shape)
#     print(data_per_x.shape)

#     kci_obj = CIT(data_per_x, "kci", est_width='median')
#     pValue = kci_obj(1,2,set([]))
#     print(1,2,())
#     print(pValue)
#     if np.isnan(pValue):
#         continue
#     if pValue > 0.05:
#         continue
#     pValue = kci_obj(1,2,set([0]))
#     print(1,2,(0))
#     print(pValue)
#     if pValue > 0.05:
#         continue

#     per_cy = np.ones(4000)
#     El_per_y = np.random.uniform(startl,endl,num_sample)
#     Es_per_y = np.random.uniform(starts,ends,num_sample)
#     do_y = np.zeros(4000)
#     Ex_per = np.random.uniform(startx,endx,num_sample)
#     per_x = Ex_per + L1(cof_l1, de1, El_per_y)
#     mask_per_y = (S1(cof_s1, ds1,per_x) + S2(cof_s2, ds2, do_y) + Es_per_y > 0) & (S1(cof_s1, ds1,per_x) + S2(cof_s2, ds2, do_y) + Es_per_y < 200)
#     print(S1(cof_s1, ds1,per_x) + S2(cof_s2, ds2, do_y) + Es_per_y)
#     per_x = per_x[mask_per_y]
#     do_y = do_y[mask_per_y]
#     per_cy = per_cy[mask_per_y]
#     pertub_data_y = np.stack((per_x,do_y, per_cy), axis=1)
#     data_per_y = np.concatenate((o_data,pertub_data_y), axis = 0)
#     np.save('./non_linear_nongaussian/case6_do(y).npy', data_per_y)
#     print(pertub_data_y.shape)
#     print(data_per_y.shape)

#     kci_obj = CIT(data_per_y, "kci", est_width='median')
#     pValue = kci_obj(0,2,set([]))
#     print(0,2,())
#     print(pValue)
#     if np.isnan(pValue):
#         continue
#     if pValue > 0.05:
#         continue
#     pValue = kci_obj(0,2,set([1]))
#     print(0,2,(1))
#     print(pValue)
#     if pValue < 0.05:
#         break

#####################case 7 (cause with selection and latent)########################
# for i in range(10):
#     startx = 1
#     endx = 2
#     starty = 2
#     endy = 3
#     startl = 0
#     endl = 2
#     starts = 2
#     ends = 4
#     num_sample = 4000

#     Ex = np.random.uniform(startx,endx,num_sample)
#     Ey = np.random.uniform(starty,endy,num_sample)
#     El = np.random.uniform(startl,endl,num_sample)
#     Es = np.random.uniform(starts,ends,num_sample)
#     L1, de1, cof_l1 = choose_function()
#     L2, de2, cof_l2 = choose_function()

#     S1, ds1, cof_s1 = choose_function()
#     S2, ds2, cof_s2 = choose_function(-2)
#     non_linear,de, cof_c = choose_function()

#     L = El
#     c = np.zeros(4000)
#     x = Ex + L1(cof_l1, de1, L)
#     y = Ey + L2(cof_l2, de2, L) + non_linear(cof_c, de, x)
#     mask = (S1(cof_s1, ds1, x) + S2(cof_s2, ds2, y) + Es > 0) & (S1(cof_s1, ds1, x) + S2(cof_s2, ds2, y) + Es < 200)
#     print(S1(cof_s1, ds1, x) + S2(cof_s2, ds2, y) + Es)
#     x = x[mask]
#     y = y[mask]
#     c = c[mask]
#     o_data = np.stack((x,y,c),axis=1)
#     # print(o_data)

#     per_cx = np.ones(4000)
#     El_per_x = np.random.uniform(startl,endl,num_sample)
#     Es_per_x = np.random.uniform(starts,ends,num_sample)
#     do_x = np.zeros(4000)
#     Ey_per = np.random.uniform(starty,endy,num_sample)
#     per_y = Ey_per + L2(cof_l2, de2, El_per_x) + non_linear(cof_c, de, do_x)
#     mask_per_x = (S1(cof_s1, ds1,do_x) + S2(cof_s2, ds2,per_y) + Es_per_x > 0) & (S1(cof_s1, ds1,do_x) + S2(cof_s2, ds2,per_y) + Es_per_x < 200)
#     print(S1(cof_s1, ds1,do_x) + S2(cof_s2, ds2,per_y) + Es_per_x)
#     do_x = do_x[mask_per_x]
#     per_y = per_y[mask_per_x]
#     per_cx = per_cx[mask_per_x]
#     pertub_data_x = np.stack((do_x,per_y, per_cx), axis=1)
#     data_per_x = np.concatenate((o_data,pertub_data_x), axis = 0)
#     np.save('./non_linear_nongaussian/case7_do(x).npy', data_per_x)
#     print(pertub_data_x.shape)
#     print(data_per_x.shape)
#     if (data_per_x.shape[0] - pertub_data_x.shape[0] < 1000):
#         continue

#     kci_obj = CIT(data_per_x, "kci")
#     pValue = kci_obj(1,2,set([]))
#     print(1,2,())
#     if np.isnan(pValue):
#         continue
#     print(pValue)
#     if pValue > 0.05:
#         continue
#     pValue = kci_obj(1,2,set([0]))
#     print(1,2,(0))
#     print(pValue)
#     if pValue > 0.05:
#         continue

#     per_cy = np.ones(4000)
#     El_per_y = np.random.uniform(startl,endl,num_sample)
#     Es_per_y = np.random.uniform(starts,ends,num_sample)
#     do_y = np.zeros(4000)
#     Ex_per = np.random.uniform(startx,endx,num_sample)
#     per_x = Ex_per + L1(cof_l1, de1, El_per_y)
#     mask_per_y = (S1(cof_s1, ds1,per_x) + S2(cof_s2, ds2, do_y) + Es_per_y > 0) & (S1(cof_s1, ds1,per_x) + S2(cof_s2, ds2, do_y)+ Es_per_y < 200)
#     print(S1(cof_s1, ds1,per_x) + S2(cof_s2, ds2, do_y) + Es_per_y)
#     per_x = per_x[mask_per_y]
#     do_y = do_y[mask_per_y]
#     per_cy = per_cy[mask_per_y]
#     pertub_data_y = np.stack((per_x,do_y, per_cy), axis=1)
#     data_per_y = np.concatenate((o_data,pertub_data_y), axis = 0)
#     np.save('./non_linear_nongaussian/case7_do(y).npy', data_per_y)
#     print(pertub_data_y.shape)
#     print(data_per_y.shape)
#     if (data_per_y.shape[0] - pertub_data_y.shape[0] < 1000):
#         continue

#     kci_obj = CIT(data_per_y, "kci")
#     pValue = kci_obj(0,2,set([]))
#     if np.isnan(pValue):
#         continue
#     print(0,2,())
#     print(pValue)
#     if pValue > 0.05:
#         continue
#     pValue = kci_obj(0,2,set([1]))
#     print(0,2,(1))
#     print(pValue)
#     if pValue < 0.05:
#         break