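'''
De novo molecule generation driven by the logP objective.

Original note: "start from 'C'". In this script the search is seeded with the
molecules listed in `start_smiles_lst` (section 2) rather than a single atom.
'''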

### 1. import
import os
import numpy as np 
from time import time
from tqdm import tqdm 
from matplotlib import pyplot as plt
import pickle 
from random import shuffle 
import torch
import torch.nn as nn
import torch.nn.functional as F
from tdc import Oracle
torch.manual_seed(1)
np.random.seed(2)
from chemutils import * 
'''
chemutils 
	smiles2differentiable_graph
	differentiable_graph2smiles
	qed_logp_jnk_gsk_fusion
'''
from tdc import Evaluator




## 2. data and oracle
# Seed population handed to distribution_learning in the __main__ block.
start_smiles_lst = [
	'CCC(C1=CC=CC=C1)C1=CC=CC=C1',
	'CCC(C)C',
	'CCC(C)C1=CC=CC=C1',
	'CCCC',
	'CCCC1=CC=CC=C1',
]

# Raw logP scorer from tdc; `oracle` below rescales its output.
logp = Oracle(name='logp')



def logp_modifier2(logp_score):
    '''
    Rescale a raw logP value: add 5, multiply by 1/10, and floor the result at 0.0.
    '''
    rescaled = 1 / 10 * (logp_score + 5)
    if rescaled > 0.0:
        return rescaled
    return 0.0

def oracle(smiles):
	'''Score a SMILES string: the raw `logp` oracle value passed through `logp_modifier2`.'''
	raw_logp = logp(smiles)
	return logp_modifier2(raw_logp)



## 3. load model 
# device = 'cuda' if torch.cuda.is_available() else 'cpu'
device = 'cpu' ## cpu is better 
prop = 'logp'
model_ckpt = "save_model/LogP_epoch_0_iter_103800_validloss_0.5577.ckpt"
# The checkpoint holds a whole pickled model object (switch_device is called on
# it right below), so torch.load unpickles arbitrary code: only load checkpoints
# from a trusted source.
# map_location remaps the stored tensors onto `device`; without it a checkpoint
# saved from a CUDA device cannot be deserialized on a CPU-only machine.
# NOTE(review): recent PyTorch releases default to weights_only=True, which
# rejects whole pickled model objects -- pass weights_only=False there if this
# call fails; confirm against the installed torch version.
gnn = torch.load(model_ckpt, map_location = device)
gnn.switch_device(device)



## 4. inference function 
from inference_utils import * 

'''
def optimize_single_molecule_one_iterate(smiles, gnn):
	...
	return smiles_set


def gnn_screening(smiles_set, gnn):
	... 
	return smiles_lst

def oracle_screening(smiles_set, oracle):
	... 
	return smiles_score_lst 


def dpp(smiles_score_lst, num_return):

	return smiles_lst 

'''



def distribution_learning(start_smiles_lst, gnn, oracle, generations, population_size, lamb, topk, epsilon, result_pkl):
	'''
	Iteratively expand a population of molecules and keep the best-scoring ones.

	Each generation, every molecule of the current population is expanded with
	`optimize_single_molecule_one_iterate_nonleafexpand`, the union of all
	candidates is scored with `oracle_screening`, and the first
	`population_size` entries of that (sorted) list become the next population.

	Side effects, once per generation:
		* `(idx_2_smiles2f, trace_dict)` is pickled to `result_pkl`;
		* the score history is rewritten to "result/denovo_<prop>_f_t.txt"
		  (`prop` is a module-level global), one "best<TAB>average" row per
		  population, starting with the seed population.

	Args:
		start_smiles_lst: non-empty, re-iterable collection of seed SMILES strings.
		gnn: model forwarded to the expansion routine.
		oracle: callable mapping a SMILES string to a numeric score.
		generations: maximum number of generations to run.
		population_size: number of top-scoring molecules kept per generation.
		lamb: unused; kept for the DPP-based selection variant, which is disabled.
		topk: forwarded to the expansion routine.
		epsilon: forwarded to the expansion routine.
		result_pkl: path of the pickle file rewritten every generation.

	Returns:
		A tuple `(best_smiles_score_lst, existing_set, trace_dict)`:
		the (smiles, score) pairs of the final population, the set of every
		SMILES seen (seeds plus all generated candidates), and a dict mapping
		each generated SMILES to the molecule it was first derived from.

	Raises:
		ValueError: if `start_smiles_lst` is empty.
	'''
	current_set = set(start_smiles_lst)
	if not current_set:
		raise ValueError("start_smiles_lst must contain at least one SMILES string")

	# Make sure both output locations exist before any expensive work is done.
	f_log_path = "result/denovo_" + prop + "_f_t.txt"
	for out_path in (result_pkl, f_log_path):
		out_dir = os.path.dirname(out_path)
		if out_dir:
			os.makedirs(out_dir, exist_ok = True)

	trace_dict = dict()
	# Score every distinct seed exactly once (oracle calls can be expensive).
	smiles2f_new = {smiles: oracle(smiles) for smiles in dict.fromkeys(start_smiles_lst)}
	seed_scores = list(smiles2f_new.values())
	# Rows are (best, average) throughout, including this seed-population row.
	f_lst = [(max(seed_scores), np.mean(seed_scores))]
	idx_2_smiles2f = {-1: (smiles2f_new, current_set)}
	best_smiles_score_lst = sorted(smiles2f_new.items(), key = lambda pair: pair[1], reverse = True)[:population_size]

	for i_gen in tqdm(range(generations)):
		next_set = set()
		for smiles in current_set:
			smiles_set = optimize_single_molecule_one_iterate_nonleafexpand(smiles, gnn, topk = topk, epsilon = epsilon)
			for smi in smiles_set:
				# Remember only the first parent each candidate was derived from.
				trace_dict.setdefault(smi, smiles)
			next_set.update(smiles_set)

		if not next_set:
			# Nothing could be expanded: keep the last population and stop.
			print("generation", i_gen, "produced no candidates; stopping early")
			break

		smiles_score_lst = oracle_screening(next_set, oracle)  ###  sorted smiles_score_lst 
		print(smiles_score_lst[:12])

		# Selection: keep the top `population_size` molecules.
		# (Alternative, currently disabled: DPP-based selection using `lamb`.)
		top_lst = smiles_score_lst[:population_size]
		if not top_lst:
			# Empty screening result or population_size == 0: nothing to continue with.
			break
		best_smiles_score_lst = top_lst
		current_set = [pair[0] for pair in top_lst]

		# save 
		smiles2f_new = {smiles: score for smiles, score in smiles_score_lst}
		idx_2_smiles2f[i_gen] = smiles2f_new, current_set
		with open(result_pkl, 'wb') as fout:
			pickle.dump((idx_2_smiles2f, trace_dict), fout)

		#### compute f-score
		score_lst = [smiles2f_new[smiles] for smiles in current_set]
		f_lst.append((max(score_lst), np.mean(score_lst)))
		str_f_lst = [str(i[0])[:5]+'\t'+str(i[1])[:5] for i in f_lst]
		with open(f_log_path, 'w') as fout:
			fout.write('\n'.join(str_f_lst))

	# Every generated candidate is a key of trace_dict, so seeds + keys is
	# the full set of molecules seen during the run.
	existing_set = set(start_smiles_lst).union(trace_dict)
	return best_smiles_score_lst, existing_set, trace_dict





## 5. run 
if __name__ == "__main__":
	generations = 300
	population_size = 10
	result_pkl = "result/denovo_from_" + start_smiles_lst[0] + '_' + prop + ".pkl"
	# Both output files (this pickle and the text score log) live under
	# "result/"; create it up front so the first save cannot fail on a
	# missing directory.
	os.makedirs(os.path.dirname(result_pkl), exist_ok = True)
	# Every result is written to disk inside distribution_learning, so nothing
	# is unpacked from the call here; tuple-unpacking would raise TypeError
	# whenever the function returns None.
	distribution_learning(
		start_smiles_lst, gnn, oracle,
		generations = generations,
		population_size = population_size,
		lamb = 3,
		topk = 5,
		epsilon = 0.7,
		result_pkl = result_pkl,
	)










