import pickle
import os
from tqdm import tqdm
# ---- Experiment settings -------------------------------------------------
# Root directory under which the run folders live (empty -> relative to the
# current working directory).
base_model_path = ''

# These four values are embedded in the run folder name below.
# NOTE(review): presumably graph size and community-graph parameters --
# confirm against the code that produced the run folders.
nodes_num = 500
k_ratio = 0.05
p_in = 0.3
p_out = 0.01

# Not referenced anywhere in the visible part of this script.
method = 'path'
types = 'com'
train_num_ratio = 1
p = 0.025
data_type = 'soft'

# <root>/<nodes_num>_<k_ratio>_<p_in>_<p_out>/train_language
base_model_path = os.path.join(
    base_model_path,
    f"{nodes_num}_{k_ratio}_{p_in}_{p_out}",
    "train_language",
)
# Directory for the text output, located inside the run folder.
txt_data_path = os.path.join(base_model_path, 'data_txt')

# Start from an empty text-output directory: create it when it is missing,
# otherwise delete the regular files it already contains. Sub-directories
# inside it are left untouched.
if not os.path.exists(txt_data_path):
    os.makedirs(txt_data_path)
else:
    for fname in os.listdir(txt_data_path):
        fpath = os.path.join(txt_data_path, fname)
        if not os.path.isfile(fpath):
            continue
        os.remove(fpath)
    
# Discover which epochs have a pickled dump in base_model_path. A dump is any
# file named 'language_data_<...>_<epoch>.pkl'; the epoch is the integer
# between the last underscore and the first following dot.
epoch_list = []
for files in os.listdir(base_model_path):
    if not (files.startswith('language_data_') and files.endswith('.pkl')):
        continue
    try:
        epoch_num = int(files.split('_')[-1].split('.')[0])
    except ValueError:
        # The name matches the prefix/suffix but carries no epoch number
        # (e.g. 'language_data_final.pkl'); skip it instead of aborting.
        continue
    epoch_list.append(epoch_num)

if not epoch_list:
    # max() on an empty list would only say "max() arg is an empty sequence";
    # raise the same exception type with a message naming the directory.
    raise ValueError(
        f"No 'language_data_<epoch>.pkl' files found in {base_model_path!r}"
    )

max_epoch = max(epoch_list)
print(f'Loading language data from epoch: {max_epoch}')
# Load the per-epoch dumps 'language_data_<i>.pkl' for i = 1 .. max_epoch.
# NOTE(review): both loops end with an unconditional `break`, so only the
# first entry of the first epoch file is ever touched and `text` is never
# written anywhere. This looks like leftover debugging -- confirm the intent
# before relying on this script to process every epoch.
for i in tqdm(range(1, max_epoch+1), total=max_epoch):
    # SECURITY: pickle.load can execute arbitrary code embedded in the file;
    # only read dumps produced by a trusted run.
    with open(os.path.join(base_model_path, f'language_data_{i}.pkl'), 'rb') as f:
        data = pickle.load(f)
    for j in range(len(data)):
        # Index with the inner counter j. The epoch counter i is unrelated to
        # positions inside `data` and could read the wrong entry or fall
        # outside the container.
        text_data = data[j]
        text = text_data['answer'] + '\n'
        break
    break

# Quick inspection of the dump that was loaded last.
print(len(data))
print(data[0])