# %%
import pandas as pd
import sqlalchemy as sqla
import sys
import os
from tqdm.contrib.concurrent import process_map
import json

sys.path.append(os.path.abspath(os.path.join(os.path.dirname(__file__), "..")))
from track.track_MIMIC.patient import Patient

# %%
engine = sqla.create_engine(
    "<your-database-connection-string>",
    max_overflow=100,
    pool_size=100,
    pool_timeout=30,
    pool_recycle=180
)

subject_id_list = Patient.get_subject_id_list(engine)

# %%

def process_subject_id(subject_id):
    local_engine = sqla.create_engine(
        "<your-database-connection-string>",
        max_overflow=1,
        pool_size=48,
        pool_timeout=1,
        pool_recycle=10
    )
    with local_engine.connect() as conn:
        patient = Patient(subject_id)
        patient.add_patient_info(conn)
        
        if not patient.admission:
            return
        
        folder = os.path.join(
            os.path.dirname(__file__),
            "..", 
            "data", 
            "json", 
            str(subject_id%100).zfill(2),
        )
        
        file_path = os.path.join(folder, f"{subject_id}.json")
        if not os.path.exists(folder):
            os.makedirs(folder)
        with open(file_path, "w") as f:
            json.dump(patient.to_dict(), f, indent=4, default=str)
            
    local_engine.dispose()

process_map(
    process_subject_id, 
    subject_id_list, 
    max_workers=96, 
    chunksize=32
)