from typing import List, Tuple
from datetime import datetime, timedelta

from flex_attention_vllm.entities.request import Request
from flex_attention_vllm.scheduler.global_scheduler.base_global_scheduler import BaseGlobalScheduler
from flex_attention_vllm.scheduler.utils.double_hash_global_scheduler_utils import DoubleHashGlobalSchedulerUtils
from flex_attention_vllm.scheduler.utils.shared import SharedState
from flex_attention_vllm.logger import init_logger

logger = init_logger(__name__)


class MinTTFTGlobalScheduler(BaseGlobalScheduler):
    def __init__(self, num_replicas, shared_state: SharedState, args):
        super().__init__(num_replicas)
        self.shared_state = shared_state
        self.double_hash_util = DoubleHashGlobalSchedulerUtils(num_replicas, shared_state, args)

    async def schedule(self, request: Request) -> int:
        if request is None:
            return -1
        target_replica_id,_ = await self.shared_state.get_min_ttft_replica(request)

        if target_replica_id != -1: 
            return target_replica_id

    def finish_request(
        self, func_output=None, text: str = None, input_ids=None
    ):
        return