#!/usr/bin/env python3
"""
ManifoldKV Single RULER Experiment Runner
ICML 2026 - Run individual RULER benchmark experiments

Examples:
    # Run ManifoldKV at 4K context
    python run_ruler_main.py --method adakv_manifold_kv --context 4096

    # Run KeyDiff baseline at 8K context
    python run_ruler_main.py --method adakv_keydiff --context 8192

    # Run with custom compression ratio
    python run_ruler_main.py --method adakv_manifold_kv --compression 0.30
"""

import argparse
import json
import os
import sys
from pathlib import Path

# Add parent directory to path
sys.path.insert(0, str(Path(__file__).parent.parent))

# Set up evaluation path
eval_path = Path(__file__).parent.parent / "evaluation"
sys.path.insert(0, str(eval_path))


def main():
    parser = argparse.ArgumentParser(description="Run single RULER experiment")
    parser.add_argument("--method", type=str, default="adakv_manifold_kv",
                       choices=[
                           "adakv_manifold_kv", "manifold_kv",
                           "adakv_keydiff", "keydiff",
                           "adakv_snapkv", "snapkv",
                           "windowed_manifold_4k", "windowed_manifold_8k",
                           "manifold_kv_l1", "manifold_kv_linf",
                       ])
    parser.add_argument("--model", type=str, default="meta-llama/Meta-Llama-3.1-8B-Instruct")
    parser.add_argument("--context", type=int, default=4096, 
                       choices=[4096, 8192, 16384, 32768, 65536])
    parser.add_argument("--compression", type=float, default=0.20)
    parser.add_argument("--max_context", type=int, default=None,
                       help="Max context length for evaluation (default: same as context)")
    parser.add_argument("--output_dir", type=str, default="../results/ruler")
    parser.add_argument("--gpu", type=int, default=0)
    parser.add_argument("--tasks", type=str, default=None,
                       help="Comma-separated list of tasks to run (default: all)")
    parser.add_argument("--fraction", type=float, default=1.0,
                       help="Fraction of dataset to use (for quick testing)")
    args = parser.parse_args()
    
    # Set GPU
    os.environ["CUDA_VISIBLE_DEVICES"] = str(args.gpu)
    
    # Import evaluation after setting GPU
    from evaluate import EvaluationConfig, EvaluationRunner
    
    # Determine max context
    max_context = args.max_context or args.context
    
    print("="*60)
    print("ManifoldKV RULER Benchmark")
    print("="*60)
    print(f"Method:      {args.method}")
    print(f"Model:       {args.model}")
    print(f"Context:     {args.context}")
    print(f"Max Context: {max_context}")
    print(f"Compression: {args.compression}")
    print(f"Output:      {args.output_dir}")
    print("="*60)
    
    # Create configuration
    config = EvaluationConfig(
        dataset="ruler",
        data_dir=str(args.context),
        model=args.model,
        press_name=args.method,
        compression_ratio=args.compression,
        max_context_length=max_context,
        output_dir=args.output_dir,
        fraction=args.fraction,
    )
    
    # Run evaluation
    runner = EvaluationRunner(config)
    runner.run_evaluation()
    
    print("\n" + "="*60)
    print("Experiment complete!")
    print("="*60)


if __name__ == "__main__":
    main()
