
import numpy as np
from agent import Agent
from collections import deque


class RoundRobinAgent(Agent):
    # Round Robin scheduling algorithm
    # scheduling complexity: O(num_jobs * num_nodes)
    def __init__(self, time_slice=1):
        Agent.__init__(self)
        self.job_queue = deque()  # Queue of jobs in round-robin order
        self.time_slice = time_slice  # Number of executors per job per round
        self.current_allocation = {}  # Track current allocation per job
        
    def get_action(self, obs):
        # parse observation
        job_dags, source_job, num_source_exec, \
        frontier_nodes, executor_limits, \
        exec_commit, moving_executors, action_map = obs
        
        # Update job queue with new jobs
        current_jobs = set(job_dags)
        self.job_queue = deque([j for j in self.job_queue if j in current_jobs])
        for job in job_dags:
            if job not in self.job_queue:
                self.job_queue.append(job)
        
        # Reset allocation tracking each round
        self.current_allocation = {job: 0 for job in job_dags}
        
        # First try to assign executor to the same job
        if source_job is not None:
            # immediately schedulable nodes
            for node in source_job.frontier_nodes:
                if node in frontier_nodes:
                    return node, num_source_exec
            # schedulable node in the job
            for node in frontier_nodes:
                if node.job_dag == source_job:
                    return node, num_source_exec
        
        # If we have jobs in the queue, try Round Robin allocation
        if self.job_queue:
            # Get the next job in round-robin order
            current_job = self.job_queue.popleft()
            self.job_queue.append(current_job)  # Put it back at the end
            
            # Find a schedulable node for this job
            next_node = None
            # immediately schedulable node first
            for node in current_job.frontier_nodes:
                if node in frontier_nodes:
                    next_node = node
                    break
            # then schedulable node in the job
            if next_node is None:
                for node in frontier_nodes:
                    if node in current_job.nodes:
                        next_node = node
                        break
                        
            # node is selected, compute limit (use time_slice as max)
            if next_node is not None:
                use_exec = min(
                    node.num_tasks - node.next_task_idx - 
                    exec_commit.node_commit[node] - 
                    moving_executors.count(node),
                    self.time_slice,
                    num_source_exec)
                return node, use_exec
        
        # If round robin allocation failed, try any job
        for job_dag in job_dags:
            for node in frontier_nodes:
                if node in job_dag.nodes:
                    use_exec = min(
                        node.num_tasks - node.next_task_idx - 
                        exec_commit.node_commit[node] - 
                        moving_executors.count(node),
                        num_source_exec)
                    return node, use_exec
        
        # there is more executors than tasks in the system
        return None, num_source_exec