# core/agents/direct.py
"""
Direct inference agent.
Single-model inference without iteration/escalation.
"""

import time
from typing import Dict, Any, List

from .base import SingleModelAgent
from core.models import get_vlm_response_generic
from config.prompts import DIRECT_FINAL_PROMPT, build_question_text


class DirectAgent(SingleModelAgent):
    """
    Direct inference agent.
    Uses a single model for direct inference.
    """
    
    def __init__(self, model, processor, **kwargs):
        super().__init__(model, processor, **kwargs)
    
    def infer(self, task: Dict, video_path: str, frame_indices: List[int], 
              generation_kwargs: Dict, **kwargs) -> Dict[str, Any]:
        """
        Run single-model inference.

        Args:
            task: Task dict.
            video_path: Path to video.
            frame_indices: Frame indices to use.
            generation_kwargs: Generation parameters.

        Returns:
            Result dict.
        """
        # Build prompt
        question_text = build_question_text(task)
        prompt = DIRECT_FINAL_PROMPT.format(question_text=question_text)
        
        # Inference
        start_time = time.time()
        response = get_vlm_response_generic(
            self.model, self.processor, prompt, video_path, frame_indices, generation_kwargs
        )
        end_time = time.time()
        
        inference_time = end_time - start_time
        final_answer = response["text"]
        
        return {
            "final_answer": final_answer,
            "iterations": 1,
            "times": {
                "agent_inference_time": inference_time,
            },
            "tokens": response["tokens"],
            "debug": {
                "prompt": prompt,
                "raw_response": final_answer
            }
        }
    
    def get_metadata(self):
        """Return agent metadata."""
        metadata = super().get_metadata()
        metadata.update({
            "description": "Single model direct inference without iterations",
            "model_count": 1,
            "supports_iteration": False,
            "supports_escalation": False
        })
        return metadata
