# api_server.py
# FastAPI wrapper exposing /infer endpoint. Uses InferenceService (from earlier inference.py).
# If InferenceService is not available, a fallback dummy handler will be used.

from fastapi import FastAPI, HTTPException
from pydantic import BaseModel
from typing import Optional, Dict, Any
import uvicorn
import logging

logger = logging.getLogger("api_server")
logger.setLevel(logging.INFO)

# try import InferenceService from your project
try:
    from inference import InferenceService
except Exception as e:
    logger.warning("Could not import InferenceService: %s. Using fallback.", e)
    InferenceService = None

app = FastAPI(title="EDM Inference API", version="0.1")

class InferRequest(BaseModel):
    text: str
    meta: Optional[Dict[str, Any]] = None
    # audio could be base64; for prototype we skip audio in API
    audio_base64: Optional[str] = None

class InferResponse(BaseModel):
    response: str
    escalated: bool
    debug: Optional[Dict[str, Any]] = None

# instantiate once
svc = InferenceService() if InferenceService is not None else None

@app.post("/infer", response_model=InferResponse)
async def infer(req: InferRequest):
    if svc is None:
        # fallback: echo template
        return InferResponse(response="Service not initialized. This is a fallback response.", escalated=False, debug={"note": "fallback"})
    try:
        # if audio_base64 is provided, decode and convert to waveform externally (omitted here)
        response, escalated, debug = svc.handle_request(req.text, audio=None, meta=req.meta)
        return InferResponse(response=response, escalated=escalated, debug=debug)
    except Exception as e:
        logger.exception("Inference failed: %s", e)
        raise HTTPException(status_code=500, detail=str(e))

if __name__ == "__main__":
    # run with: python api_server.py
    uvicorn.run(app, host="0.0.0.0", port=8080)
