# multicore/migration_penalty.py
"""
Migration penalty utilities.

Purpose:
  - Track which tasks were running on which cores in previous timestep(s)
  - Compute migration count (number of tasks that changed core assignment)
  - Provide a function to adjust rewards by subtracting lambda * migration_count

Usage:
  prev_assignments: list of length n_cores giving previous task per core (or -1)
  new_assignments: current list length n_cores
  migration_count = count_migrations(prev_assignments, new_assignments)
  adjusted_reward = apply_migration_penalty(base_reward, migration_count, lambda_)
"""
from typing import List

IDLE_TASK = -1

def count_migrations(prev_assignments: List[int], new_assignments: List[int]) -> int:
    """
    Count migrations as the number of tasks that appear on a different core than before.
    If task was idle and becomes assigned -> counts as 'migration' only if it previously ran on other core.
    Implementation notes:
      - Build mapping task->core for prev and new; count tasks that exist in both mappings but with different cores.
    """
    prev_map = {}
    for core, task in enumerate(prev_assignments):
        if task != IDLE_TASK:
            prev_map[task] = core
    new_map = {}
    for core, task in enumerate(new_assignments):
        if task != IDLE_TASK:
            new_map[task] = core
    # Count tasks that moved (present in both maps and core changed)
    migrations = sum(1 for t in new_map.keys() if (t in prev_map and prev_map[t] != new_map[t]))
    return int(migrations)

def apply_migration_penalty(base_reward: float, prev_assign: List[int], new_assign: List[int], lambda_mig: float) -> float:
    """
    Subtract lambda_mig * migrations from base_reward, returning adjusted reward.
    """
    m = count_migrations(prev_assign, new_assign)
    return base_reward - lambda_mig * float(m)
