import subprocess
import os
import itertools

# Resolve local directories relative to this script for portability.
SCRIPT_DIR = os.path.dirname(os.path.abspath(__file__))

# Configuration
DATA_PATH = os.path.join(SCRIPT_DIR, "cache", "combined_dataset_210.jsonl")
OFFLINE_EMBEDDINGS = os.path.join(SCRIPT_DIR, "cache", "query_embeddings_combined.json")
OFFLINE_RESULTS = os.path.join(SCRIPT_DIR, "cache", "pruned_question_trials_combined.csv")
MAX_PROBLEMS = 210
WARM_UP = 50
ACTION_SPACE = "routing_full"

# Files
SEMANTIC_EMBEDDINGS = os.path.join(SCRIPT_DIR, "cache", "action_embeddings_semantic.json")
RANDOM_EMBEDDINGS = os.path.join(SCRIPT_DIR, "cache", "action_embeddings_random.json")

# Metrics
DA_METRIC = "Difficulty_Aware_Normalized_EFLOPS"
NORM_METRIC = "Normalized_EFLOPS"

# Parameters
ALPHAS = [0.5, 1.0, 2.0, 3.0, 5.0]

# Reward Weights
# Format: [w_acc, w_ver, w_cost, bias]
WEIGHTS_UNISCALE = [
    [0.1, 0.1, 0.8, 0.8],
    [0.2, 0.2, 0.6, 0.6],
    [0.3, 0.3, 0.4, 0.4],
    [0.4, 0.4, 0.2, 0.2]
]

WEIGHTS_WO_CF = [
    [0.2, 0.0, 0.8, 0.8],
    [0.4, 0.0, 0.6, 0.6],
    [0.6, 0.0, 0.4, 0.4],
    [0.8, 0.0, 0.2, 0.2]
]

def run_experiment(exp_name, alpha, weights, action_emb_file, cost_metric):
    """
    Run a single experiment configuration.
    """
    # Construct exp_label
    # Format: {exp_name}_alpha{alpha}_w{weights_str}
    w_str = f"{weights[0]}_{weights[1]}_{weights[2]}"
    exp_label = f"{exp_name}_alpha{alpha}_{w_str}"
    
    cmd = [
        "python", os.path.join(SCRIPT_DIR, "main.py"),
        "--algorithm", "lin_ucb",
        "--alpha", str(alpha),
        "--virtual_dataset",
        "--offline_embeddings", OFFLINE_EMBEDDINGS,
        "--offline_results", OFFLINE_RESULTS,
        "--max_problems", str(MAX_PROBLEMS),
        "--warm_up", str(WARM_UP),
        "--allowed_action_space", ACTION_SPACE,
        "--exp_label", exp_label,
        "--action_embedding_file", action_emb_file,
        "--cost_metric", cost_metric,
        "--reward_weights"
    ] + [str(w) for w in weights]
    
    print(f"\n[Experiment] Running: {exp_label}")
    # print(f"Command: {' '.join(cmd)}")
    
    try:
        subprocess.run(cmd, check=True)
    except subprocess.CalledProcessError as e:
        print(f"Error running experiment {exp_label}: {e}")

def main():
    tasks = []
    
    # 5. wo_DA_wo_CF (New Request)
    # wo_DA (NORM_METRIC) + wo_CF (Ver=0 Weights)
    # For Alpha=1.0
    
    # WEIGHTS_WO_CF are already defined:
    # [0.2, 0.0, 0.8, 0.8] corresponding to [0.1, 0.1, 0.8, 0.8]
    # [0.4, 0.0, 0.6, 0.6] corresponding to [0.2, 0.2, 0.6, 0.6]
    # [0.6, 0.0, 0.4, 0.4] corresponding to [0.3, 0.3, 0.4, 0.4]
    # [0.8, 0.0, 0.2, 0.2] corresponding to [0.4, 0.4, 0.2, 0.2]
    
    target_alpha = 1.0
    
    for weights in WEIGHTS_WO_CF:
        tasks.append({
            "exp_name": "wo_DA_wo_CF",
            "alpha": target_alpha,
            "weights": weights,
            "action_emb_file": SEMANTIC_EMBEDDINGS,
            "cost_metric": NORM_METRIC
        })
            
    print(f"Total experiments to run: {len(tasks)}")
    
    for i, task in enumerate(tasks):
        print(f"\n--- Progress: {i+1}/{len(tasks)} ---")
        run_experiment(
            task["exp_name"],
            task["alpha"],
            task["weights"],
            task["action_emb_file"],
            task["cost_metric"]
        )

if __name__ == "__main__":
    main()
