import json
import heapq
from typing import Dict, Any, List, Optional
import numpy as np

from hrc_core.llm_planner import LLMPlanner
from hrc_core.optimizer_wrapper import solve_schedule
from hrc_core.human_simulator import generate_ground_truth, HumanActionRandomizer

class SimulationManager:
    def __init__(self, scene_file_path: str, llm_api_key: str):
        with open(scene_file_path, 'r') as f:
            self.scene_info = json.load(f)
        self.llm_planner = LLMPlanner(api_key=llm_api_key)
        
        # --- Core simulation state variables ---
        self.current_time = 0.0
        self.completed_tasks = []
        self.active_tasks = {}
        self.full_plan = {}
        self.replanning_count = 0
        self.log = []

        # --- Performance learning variables ---
        self.is_performance_calibrated = False
        self.learned_human_multiplier = None

        # --- Metrics tracking variables ---
        self.metrics_total_required_tasks = 0
        self.metrics_completed_task_count_per_agent = {'human': 0, 'robot': 0}




    def run_experiment(self, initial_goal: str):
        """
        Runs a full simulation experiment for a given high-level goal.
        This involves initial planning, simulation execution, and handling interrupts.
        """
        print("\n" + "="*50)
        print("           STARTING NEW EXPERIMENT")
        print(f"Goal: '{initial_goal}'")
        print("="*50)

        user_supplied_mode = 'pause' # default: None

        if user_supplied_mode in ("goal_change", "pause"):
            self.scenario_mode = user_supplied_mode
        else:
            self.scenario_mode = np.random.choice(["pause", "goal_change"])

        print(f"[SimManager] Scenario mode for this run: '{self.scenario_mode}'")

        # 1. Initialize human behavior model
        human_randomizer = HumanActionRandomizer()
        print(f"[SimManager] Human performance multiplier for this run is set to: {human_randomizer.performance_multiplier:.3f}")

        # 2. Generate the initial plan using LLM
        decomposed_plan = self.llm_planner.decompose_task(initial_goal, self.scene_info)

        tasks_to_estimate = decomposed_plan.get("tasks", [])
        if not tasks_to_estimate:
            return {"success": False, "reason": "Task decomposition failed"}
        
        task_locations = self._generate_task_locations(tasks_to_estimate, self.scene_info)
        decomposed_plan["task_locations"] = task_locations

        duration_data = self.llm_planner.estimate_eet(tasks_to_estimate)
        self.full_plan = {**decomposed_plan, **duration_data}


        self.required_tasks_for_success = set(self.full_plan.get("tasks", []))
        self.metrics_total_required_tasks = len(self.required_tasks_for_success)

        # 3. Solve for the optimal initial schedule
        schedule_result = solve_schedule(self.full_plan, self.scene_info)
        if not schedule_result:
            return {"success": False, "reason": "Initial scheduling failed"}

        # 4. Generate the ground truth for human actions based on the schedule
        human_schedule = {t: info for t, info in schedule_result["schedule"].items() if info["agent"] == "human"}

        human_gt_log = generate_ground_truth(
            human_schedule,
            randomizer=human_randomizer,
            is_calibrated=False,
            scenario_mode=self.scenario_mode
        )
        print("\n--- Initial Plan & Ground Truth ---")
        self._print_schedule(schedule_result)
        self._print_human_gt(human_gt_log)
        
        # 5. Execute the main simulation loop and calculate final metrics
        final_result = self._execute_simulation_loop(schedule_result, human_gt_log, human_randomizer)
        final_metrics = self._calculate_final_metrics()
        final_result.update(final_metrics)

        print("\n" + "="*50)
        print("           EXPERIMENT FINISHED")
        print("="*50)
        
        return final_result



    def _execute_simulation_loop(self, current_schedule: Dict, human_gt_log: List[Dict], randomizer: HumanActionRandomizer):
        """
        The main event-driven loop of the simulation.
        Processes events from a priority queue until the plan is complete or an interrupt occurs.
        """
        # --- Initialize simulation state for this loop ---
        self.current_time = 0.0
        self.completed_tasks = []
        self.active_tasks = {}
        self.is_performance_calibrated = False
        self.original_human_gt_log = list(human_gt_log)
        self.metrics_completed_task_count_per_agent = {'human': 0, 'robot': 0}

        robot_tasks = sorted([info for info in current_schedule["schedule"].values() if info["agent"] == "robot"], key=lambda x: x['start'])

        human_tasks_gt = sorted([event for event in human_gt_log if event["event_type"] == "human_task_actual_end"], key=lambda x: x['actual_start_time'])

        checkpoint_time = float('inf')
        if robot_tasks and human_tasks_gt:
            t_h1_actual_end = human_tasks_gt[0]['actual_end_time']


            t_r1_end = robot_tasks[0]['end']
            if t_h1_actual_end <= t_r1_end:
                checkpoint_time = t_r1_end
            

            elif len(robot_tasks) > 1:
                t_r2_end = robot_tasks[1]['end']
                if t_h1_actual_end <= t_r2_end:
                    checkpoint_time = t_r2_end
                

                elif len(robot_tasks) > 2:
                    t_r3_end = robot_tasks[2]['end']
                    if t_h1_actual_end <= t_r3_end:
                        checkpoint_time = t_r3_end
                    else:

                        checkpoint_time = t_r3_end
                else:

                    checkpoint_time = t_r2_end
            else:

                checkpoint_time = t_r1_end
        
        print(f"[SimManager] Performance check scheduled at t={checkpoint_time:.2f}s")
        
        gt_events_by_task = {}
        for event in human_gt_log:
            task_name = event.get("task_name") or event.get("task_in_progress")
            if task_name not in gt_events_by_task:
                gt_events_by_task[task_name] = []
            gt_events_by_task[task_name].append(event)
        
        # --- Build the event priority queue ---
        event_queue = []
        entry_counter = 0
        for task, info in current_schedule["schedule"].items():
            heapq.heappush(event_queue, (info['start'], entry_counter, "task_planned_start", {"task_name": task, "agent": info["agent"]}))
            entry_counter += 1
            heapq.heappush(event_queue, (info['end'], entry_counter, "task_planned_end", {"task_name": task, "agent": info["agent"]}))
            entry_counter += 1
        for event in human_gt_log:
            heapq.heappush(event_queue, (event['event_time'], entry_counter, event['event_type'], event))
            entry_counter += 1
        
        # --- Main Event Loop ---
        while event_queue:
            event_time, _, event_type, data = heapq.heappop(event_queue)
            
            task_name = data.get("task_name") or data.get("task_in_progress")
            if task_name in self.completed_tasks and event_type not in ["human_task_actual_start", "human_interrupt_pause", "human_interrupt_goal_change"]:
                continue

            self.current_time = event_time
            display_event_type = event_type


            if event_type in ["task_planned_start", "task_planned_end"]:
                agent = data.get("agent", "N/A")
                display_event_type = f"{event_type} ({agent})"

            print(f"\n[SimManager @ t={self.current_time:.2f}s] Event: '{display_event_type}' on Task: '{task_name}'")

            interrupt_occurred = False
            interrupt_reason = ""
            agent_constraints = {}
            
            # --- Event Handling Logic ---
            if event_type == "task_planned_start":
                self.active_tasks[data["task_name"]] = {"start_time": self.current_time, "agent": data["agent"]}
                continue

            elif event_type == "human_task_actual_start":
                if task_name in self.active_tasks:
                    self.active_tasks[task_name]['start_time'] = self.current_time
                pass
            
            elif event_type == "human_interrupt_pause":
                interrupt_occurred = True
                pause_duration = data['duration']
                task_paused = data['task_in_progress']
                interrupt_reason = f"Human paused for {pause_duration:.2f}s during task '{task_paused}'."
                agent_constraints = {"human": {"unavailable_until": self.current_time + pause_duration}, "robot": {"unavailable_until": self.current_time}}

            elif event_type == "human_interrupt_goal_change":
                interrupt_occurred = True
                details = data.get('details', 'No details provided.')
                interrupt_reason = f"Human requested a goal change: '{details}'"

                trigger_task_name = data.get("trigger_task")
                agent_constraints = {
                    "human": {
                        "unavailable_until": self.current_time,
                        "must_do_task": trigger_task_name
                    },
                    "robot": {
                        "unavailable_until": self.current_time
                    }
                }

            
            elif event_type == "human_task_actual_end":
                print(f"  - INFO: Human's Ground-Truth end for '{task_name}'. State updated.")
                if task_name not in self.completed_tasks:
                    self.completed_tasks.append(task_name)

                    self.metrics_completed_task_count_per_agent['human'] += 1

                if task_name in self.active_tasks:
                    del self.active_tasks[task_name]

            elif event_type == "task_planned_end":
                agent = data.get("agent")
                
                if agent == "robot":
                    if task_name not in self.completed_tasks:
                        self.completed_tasks.append(task_name)

                        self.metrics_completed_task_count_per_agent['robot'] += 1

                    if task_name in self.active_tasks:
                        del self.active_tasks[task_name]
                    
                    if not self.is_performance_calibrated and self.current_time >= checkpoint_time:
                        interrupt_occurred = True
                        self.is_performance_calibrated = True
                        self.learned_human_multiplier = randomizer.performance_multiplier
                        interrupt_reason = "Human performance deviation detected."
                        agent_constraints = {"human": {"unavailable_until": self.current_time}, "robot": {"unavailable_until": self.current_time}}
                
                elif agent == "human":
                    pass
            
            # --- Re-planning Logic ---
            if interrupt_occurred:
                self.replanning_count += 1
                print(f"  >>> INTERRUPT: {interrupt_reason}")
                print(f"  --- Triggering Dynamic Re-planning (Count: {self.replanning_count}) ---")



                future_goal_change_event = next((event for event in self.original_human_gt_log 
                                                 if event['event_type'] == 'human_interrupt_goal_change' and event['event_time'] > self.current_time), None)
                

                if future_goal_change_event:
                    trigger_task = future_goal_change_event.get("trigger_task")

                    if trigger_task:
                        print(f"  - INFO: Preserving future goal change trigger. Task '{trigger_task}' must be done by human.")

                        if "human" not in agent_constraints:
                            agent_constraints["human"] = {}
                        agent_constraints["human"]["must_do_task"] = trigger_task



                if "Human requested a goal change" in interrupt_reason:

                    print("  - Performing full re-planning from scratch due to goal change.")
                    

                    new_goal = "to make a salad with apple not tomato"
                    print(f"  - New high-level goal: '{new_goal}'")


                    new_decomposed_plan = self.llm_planner.decompose_task(new_goal, self.scene_info)
                    

                    new_tasks = new_decomposed_plan.get("tasks", [])
                    remaining_tasks_for_new_plan = [t for t in new_tasks if t not in self.completed_tasks]
                    print(f"  - Filtering completed tasks. Remaining for new plan: {remaining_tasks_for_new_plan}")

                    task_locations_for_new_plan = self._generate_task_locations(remaining_tasks_for_new_plan, self.scene_info)
                    

                    new_duration_data = self.llm_planner.estimate_eet(remaining_tasks_for_new_plan) 
                    base_durations = new_duration_data.get("mani_time", {})
                    

                    final_durations = {}
                    if self.is_performance_calibrated:
                        print(f"  - Applying learned multiplier ({self.learned_human_multiplier:.2f}) to the new plan.")
                        for task, base_eet in base_durations.items():
                            calibrated_eet = base_eet * self.learned_human_multiplier
                            final_durations[task] = {"robot": base_eet, "human": calibrated_eet}
                    else:
                        for task, base_eet in base_durations.items():
                            final_durations[task] = {"robot": base_eet, "human": base_eet}


                    self.full_plan = {
                        "tasks": remaining_tasks_for_new_plan,
                        "dependencies": [dep for dep in new_decomposed_plan.get("dependencies", []) if dep[0] in remaining_tasks_for_new_plan and dep[1] in remaining_tasks_for_new_plan],
                        "capability": new_duration_data.get("capability", {}),
                        "task_locations": task_locations_for_new_plan,
                        "mani_time": final_durations,
                        "nav_time": new_duration_data.get("nav_time", {})
                    }

                    self.required_tasks_for_success = set(new_decomposed_plan.get("tasks", []))
                    print(f"  - Success condition has been RESET. New required tasks: {self.required_tasks_for_success}")

                    new_tasks_set = set(self.full_plan.get("tasks", []))
                    self.active_tasks = {task: status for task, status in self.active_tasks.items() if task in new_tasks_set}
                    print(f"  - Active tasks pruned. Remaining: {list(self.active_tasks.keys())}")
                
                else:


                    print("  - Performing partial re-planning for remaining tasks.")
                    

                    current_active_tasks = {t: s for t, s in self.active_tasks.items() if s.get("start_time", 0.0) <= self.current_time}
                    self.active_tasks = current_active_tasks
                    
                    remaining_durations = {}
                    in_progress_task_locations = {}
                    for task, status in self.active_tasks.items():
                        agent = status["agent"]
                        time_spent = 0
                        remaining_duration = 0

                        if agent == "robot":
                            original_info = current_schedule["schedule"][task]
                            original_duration = original_info["end"] - original_info["start"]
                            time_spent = self.current_time - original_info["start"]
                            remaining_duration = max(0, original_duration - time_spent)
                        
                        elif agent == "human":

                            actual_start_time = status["start_time"]
                            

                            end_event_tuple = next((item for item in event_queue if item[2] == 'human_task_actual_end' and item[3].get('task_name') == task), None)

                            if end_event_tuple:

                                actual_end_time = end_event_tuple[0]
                                

                                actual_total_duration = actual_end_time - actual_start_time
                                time_spent = self.current_time - actual_start_time
                                remaining_duration = max(0, actual_total_duration - time_spent)
                            else:

                                print(f"  - WARNING: Could not find 'human_task_actual_end' in event_queue for task '{task}'. Remaining time set to 0.")
                                remaining_duration = 0

                        print(f"  - Handling in-progress task '{task}' ({agent}): spent {time_spent:.2f}s, remaining {remaining_duration:.2f}s")
                        remaining_durations[task] = remaining_duration
                        end_location = self.full_plan["task_locations"][task]["end"]
                        in_progress_task_locations[task] = {"start": end_location, "end": end_location}

                    interrupt_context = {
                        "reason": interrupt_reason,
                        "current_time": self.current_time,
                        "completed_tasks": list(self.completed_tasks),
                        "active_tasks": self.active_tasks,
                        "schedule_before_interrupt": current_schedule['schedule'] 
                    }
                    if self.learned_human_multiplier:
                        interrupt_context["learned_human_multiplier"] = self.learned_human_multiplier
                    
                    re_decomposed_plan = self.llm_planner.generate_replanning(interrupt_context, self.full_plan)
                    tasks_to_re_estimate = re_decomposed_plan.get("tasks", [])
                    if not tasks_to_re_estimate: break

                    task_locations_for_replan = self._generate_task_locations(tasks_to_re_estimate, self.scene_info)

                    duration_data = self.llm_planner.estimate_eet(tasks_to_re_estimate)
                    base_durations = duration_data.get("mani_time", {})

                    final_durations = {}
                    if self.is_performance_calibrated:
                        print(f"  - Calibrating all tasks with learned multiplier: {self.learned_human_multiplier:.2f}")
                        for task, base_eet in base_durations.items():

                            calibrated_eet = base_eet * self.learned_human_multiplier
                            final_durations[task] = {
                                "robot": base_eet,
                                "human": calibrated_eet
                            }
                            print(f"    - Task '{task}': robot_eet={base_eet:.2f}s, human_eet={calibrated_eet:.2f}s")
                    else:

                        for task, base_eet in base_durations.items():
                            final_durations[task] = {
                                "robot": base_eet,
                                "human": base_eet
                            }
                    
                    for task, rem_dur in remaining_durations.items():
                        final_durations[task] = {"robot": rem_dur, "human": rem_dur}


                    final_locations = task_locations_for_replan
                    final_locations.update(in_progress_task_locations)
                    
                    self.full_plan = {
                        "tasks": tasks_to_re_estimate, 
                        "dependencies": re_decomposed_plan.get("dependencies", []),
                        "capability": duration_data.get("capability", {}),
                        "task_locations": final_locations, 
                        "mani_time": final_durations,
                        "nav_time": duration_data.get("nav_time", {})}


                new_schedule = solve_schedule(self.full_plan, self.scene_info, agent_constraints=agent_constraints)
                if not new_schedule:
                    return {"success": False, "reason": "Re-scheduling failed"}
                current_schedule = new_schedule                
                self._print_schedule(current_schedule, from_time=self.current_time)

                # Rebuild the event queue with the new plan
                event_queue = []
                entry_counter = 0
                for task, info in current_schedule["schedule"].items():
                    if task not in self.completed_tasks:
                        heapq.heappush(event_queue, (info['start'], entry_counter, "task_planned_start", {"task_name": task, "agent": info["agent"]}))
                        entry_counter += 1
                        heapq.heappush(event_queue, (info['end'], entry_counter, "task_planned_end", {"task_name": task, "agent": info["agent"]}))
                        entry_counter += 1
                

                remaining_human_schedule = {
                    t: info for t, info in new_schedule["schedule"].items() 
                    if info["agent"] == "human" and t not in self.completed_tasks
                }
                
                if remaining_human_schedule:

                    is_gt_calibrated = self.is_performance_calibrated
                    
                    new_task_gt_log = generate_ground_truth(
                        remaining_human_schedule, 
                        randomizer=randomizer, 
                        is_calibrated=is_gt_calibrated, 
                        scenario_mode=self.scenario_mode,
                        schedule_start_time=self.current_time,
                        generate_async_events=False
                    )
                    self._print_human_gt(new_task_gt_log)
                    
                    for event in new_task_gt_log:

                        if event["event_type"] in ["human_task_actual_start", "human_task_actual_end"]:
                            heapq.heappush(event_queue, (event['event_time'], entry_counter, event['event_type'], event))
                            entry_counter += 1
                

                print("  - Restoring future asynchronous ground truth events...")
                for event in self.original_human_gt_log:

                    if event["event_type"] == "human_interrupt_pause" and event["event_time"] > self.current_time:
                        print(f"    - Restoring '{event['event_type']}' scheduled at t={event['event_time']:.2f}s")
                        heapq.heappush(event_queue, (event['event_time'], entry_counter, event['event_type'], event))
                        entry_counter += 1
                    

                    elif event["event_type"] == "human_interrupt_goal_change":
                        trigger_task = event.get("trigger_task")
                        

                        if trigger_task and trigger_task not in self.completed_tasks:

                            new_end_event = next((e for e in new_task_gt_log if e['event_type'] == 'human_task_actual_end' and e['task_name'] == trigger_task), None)
                            
                            if new_end_event:
                                new_trigger_time = new_end_event['actual_end_time']

                                event['event_time'] = new_trigger_time 
                                print(f"    - Relinking '{event['event_type']}' to task '{trigger_task}' end at new time t={new_trigger_time:.2f}s")
                                heapq.heappush(event_queue, (new_trigger_time, entry_counter, event['event_type'], event))
                                entry_counter += 1
                            else:
                                print(f"    - WARNING: Could not find new end time for trigger task '{trigger_task}'. Goal change event might be lost.")
                
                continue    # Restart the loop with the new event queue


        final_makespan = self.current_time
        completed_tasks_set = set(self.completed_tasks)
        print("\nDEBUG for completed_tasks_set: ", completed_tasks_set)
        print("DEBUG for required_tasks: ", self.required_tasks_for_success)
        success = self.required_tasks_for_success.issubset(completed_tasks_set)
        return { "success": success, "final_makespan": final_makespan, "replanning_count": self.replanning_count }


    def _print_schedule(self, schedule_result, from_time=0.0):
        """Helper function to print the schedule in a readable format."""
        header = f"--- Optimal Schedule (from t={from_time:.2f}s, Makespan: {schedule_result['makespan']:.2f}s) ---"
        print(header)
        sorted_schedule = sorted(schedule_result["schedule"].items(), key=lambda i: i[1]['start'])
        for task, info in sorted_schedule:
            if task not in self.completed_tasks:
                print(f"    - {task:<22} | {info['agent']:<7} | {info['start']:>6.2f} -> {info['end']:>6.2f}")
    

    def _print_human_gt(self, human_gt_log):
        """Helper function to print the human's ground truth behavior."""
        print("--- Human's Ground Truth Behavior ---")
        for event in human_gt_log:
            event_type = event.get('event_type', 'unknown')


            if event_type == 'human_task_actual_end':
                task_name = event['task_name']
                

                p_start = event.get('planned_start_time', 0)
                a_start = event.get('actual_start_time', p_start)
                p_end = event.get('planned_end_time', 0)
                a_end = event.get('actual_end_time', 0)
                

                planned_duration = p_end - p_start
                actual_duration = a_end - a_start
                

                print(f"    - Task: {task_name:<22} | Planned: {planned_duration:>5.2f}s | Actual (GT): {actual_duration:>5.2f}s | Actual End: {a_end:>5.2f}s")

            elif event_type == 'human_interrupt_pause':
                task_name = event['task_in_progress']
                duration = event['duration']
                print(f"    - PAUSE EVENT @ t={event['event_time']:.2f}s: Paused for {duration:.2f}s during '{task_name}'")

            elif event_type == 'human_interrupt_goal_change':
                 print(f"    - GOAL CHANGE @ t={event['event_time']:.2f}s: {event.get('details', 'No details')}")
    

    def _parse_task_string(self, task: str) -> Dict[str, Any]:
        """Parses a task string (e.g., 'pickup_Bowl') into an action and its parameters."""


        if task.startswith("toggle_on_"):
            return {"action": "toggle_on", "params": [task.replace("toggle_on_", "")]}
        if task.startswith("toggle_off_"):
            return {"action": "toggle_off", "params": [task.replace("toggle_off_", "")]}
        

        if task.startswith("put_"):
            if "_on_" in task:
                parts = task.split("_on_")
                object_name = parts[0].replace("put_", "")
                receptacle_name = parts[1]
                return {"action": "put", "params": [object_name, receptacle_name]}
            elif "_in_" in task:
                parts = task.split("_in_")
                object_name = parts[0].replace("put_", "")
                receptacle_name = parts[1]
                return {"action": "put", "params": [object_name, receptacle_name]}
        

        if "_by_" in task:
            action, remaining = task.split("_", 1)
            if "_by_" in remaining:
                param1, param2 = remaining.split("_by_")
                return {"action": action, "params": [param1, param2]}


        parts = task.split("_", 1)
        if len(parts) == 2:
            action, param = parts
            return {"action": action, "params": [param]}
            
        return {"action": task, "params": []}
    
    
    def _get_base_object_name(self, object_name_with_suffix: str) -> str:
        """Removes numeric suffixes from object names."""


        parts = object_name_with_suffix.split('_')

        if len(parts) > 1 and parts[-1].isdigit():
            return '_'.join(parts[:-1])

        return object_name_with_suffix

    
    def _generate_task_locations(self, tasks: List[str], scene_info: Dict[str, Any]) -> Dict[str, Any]:
        """Generates start and end locations for each task based on the scene information."""


        print("  - Generating task locations from scene info using new parser...")
        task_locations = {}
        

        object_location_map = {}
        for obj_id, obj_data in scene_info.get("pickable_objects", {}).items():

            object_location_map[obj_data.get("objectType")] = obj_data.get("parentReceptacles", [None])[0]

        for receptacle_id, recep_data in scene_info.get("receptacles", {}).items():
             object_location_map[recep_data.get("objectType")] = receptacle_id


        for task in tasks:
            try:
                parsed = self._parse_task_string(task)
                action = parsed["action"]
                params = parsed["params"]
                
                if action in ["pickup", "slice", "open", "close", "toggle_on", "toggle_off"]:
                    base_target_obj = self._get_base_object_name(params[0])
                    location = object_location_map.get(base_target_obj)
                    if location:
                        task_locations[task] = {"start": location, "end": location}
                
                elif action == "put":
                    base_obj_to_put = self._get_base_object_name(params[0])
                    base_target_receptacle = self._get_base_object_name(params[1])
                    start_loc = object_location_map.get(base_obj_to_put)
                    end_loc = object_location_map.get(base_target_receptacle)
                    if start_loc and end_loc:
                        task_locations[task] = {"start": start_loc, "end": end_loc}
                
                elif action in ["Heat", "Boil"]:
                    base_appliance = self._get_base_object_name(params[1]) 
                    location = object_location_map.get(base_appliance)
                    if location:
                        task_locations[task] = {"start": location, "end": location}

            except Exception as e:
                print(f"    - WARNING: Could not parse or find location for task '{task}'. Error: {e}")
                
        return task_locations
    

    def _calculate_final_metrics(self) -> Dict[str, Any]:
        """Calculates final performance metrics for the experiment."""


        # TR (Transport Rate)
        num_completed_in_goal = len(self.required_tasks_for_success.intersection(set(self.completed_tasks)))
        num_required_for_goal = len(self.required_tasks_for_success)
        transport_rate = num_completed_in_goal / num_required_for_goal if num_required_for_goal > 0 else 0

        # B (Balance)
        counts = list(self.metrics_completed_task_count_per_agent.values())
        min_tasks = min(counts)
        max_tasks = max(counts)
        balance = min_tasks / (max_tasks + 1e-6) if max_tasks > 0 else 1.0

        # L (Average Steps)
        total_steps = len(self.completed_tasks)

        return {
            "transport_rate": round(transport_rate, 3),
            "balance": round(balance, 3),
            "total_steps": total_steps
        }


if __name__ == "__main__":
    # --- Experiment Configuration ---
    SCENE_FILE = "scene_data/FloorPlan1_physics.json"
    LLM_API_KEY = "DUMMY_KEY_FOR_MANUAL_INPUT"
    
    # --- Run Simulation ---
    manager = SimulationManager(scene_file_path=SCENE_FILE, llm_api_key=LLM_API_KEY)
    results = manager.run_experiment(initial_goal="to make a salad")
    
    print("\n--- FINAL RESULTS ---")
    print(json.dumps(results, indent=4))