#!/bin/bash

# Define the root directory where all generated data will be stored
ROOT_DIRECTORY="/code/jiateng-sandbox/Inject_Complex_Policies/Data_Synthesizer/Sample_Data"

# Create the root directory if it doesn't exist
mkdir -p "$ROOT_DIRECTORY"

# Simplified data generation - generates both training and evaluation sets from the same policy
echo "=== GENERATING SIMPLIFIED TRAINING AND EVALUATION DATA ==="
echo "Total configurations: 6 (1 depth × 6 task/args/complexity combinations)"
echo "Root directory: $ROOT_DIRECTORY"
echo "Data per configuration: 2000 training + 300 evaluation = 100300 total"

# Structure complexity 1 configurations
echo "--- Structure Complexity 1 ---"

# Depth 3 configurations (fixed depth)
echo "Depth 3:"
python3 Synthesize.py --depth 3 --tasks 3 --structure_complexity 1 --args_num 3 --output_dir "$ROOT_DIRECTORY/Generated_data_layer_3_task_3_structure_1_args_3"
python3 Synthesize_QA.py --base_dir "$ROOT_DIRECTORY/Generated_data_layer_3_task_3_structure_1_args_3" --total_requests 100300 --eval_size 300

python3 Synthesize.py --depth 3 --tasks 5 --structure_complexity 1 --args_num 5 --output_dir "$ROOT_DIRECTORY/Generated_data_layer_3_task_5_structure_1_args_5"
python3 Synthesize_QA.py --base_dir "$ROOT_DIRECTORY/Generated_data_layer_3_task_5_structure_1_args_5" --total_requests 100300 --eval_size 300

python3 Synthesize.py --depth 3 --tasks 8 --structure_complexity 1 --args_num 8 --output_dir "$ROOT_DIRECTORY/Generated_data_layer_3_task_8_structure_1_args_8"
python3 Synthesize_QA.py --base_dir "$ROOT_DIRECTORY/Generated_data_layer_3_task_8_structure_1_args_8" --total_requests 100300 --eval_size 300

python3 Synthesize.py --depth 3 --tasks 12 --structure_complexity 1 --args_num 12 --output_dir "$ROOT_DIRECTORY/Generated_data_layer_3_task_12_structure_1_args_12"
python3 Synthesize_QA.py --base_dir "$ROOT_DIRECTORY/Generated_data_layer_3_task_12_structure_1_args_12" --total_requests 100300 --eval_size 300

# Structure complexity 2 configurations (only for task 5)
echo "--- Structure Complexity 2 ---"

echo "Depth 3:"
python3 Synthesize.py --depth 3 --tasks 5 --structure_complexity 2 --args_num 5 --output_dir "$ROOT_DIRECTORY/Generated_data_layer_3_task_5_structure_2_args_5"
python3 Synthesize_QA.py --base_dir "$ROOT_DIRECTORY/Generated_data_layer_3_task_5_structure_2_args_5" --total_requests 100300 --eval_size 300

# Structure complexity 3 configurations (only for task 5)
echo "--- Structure Complexity 3 ---"

echo "Depth 3:"
python3 Synthesize.py --depth 3 --tasks 5 --structure_complexity 3 --args_num 5 --output_dir "$ROOT_DIRECTORY/Generated_data_layer_3_task_5_structure_3_args_5"
python3 Synthesize_QA.py --base_dir "$ROOT_DIRECTORY/Generated_data_layer_3_task_5_structure_3_args_5" --total_requests 100300 --eval_size 300

echo "=== DATA GENERATION COMPLETE ==="
echo "Generated 6 configurations total:"
echo "  - 1 depth level: 3"
echo "  - Tasks 3, 8, 12: structure complexity 1 only"
echo "  - Task 5: all structure complexities (1, 2, 3)"
echo "Each configuration generates:"
echo "  - 2,000 training queries in qa_train.json"
echo "  - 300 evaluation queries in qa_eval.json"
echo "  - Both sets share the same underlying policy for consistent evaluation" 