import math

import numpy as np

MAX_NUM_COLOR_GROUPS = 8


def preamble_variable_regions_greedy(**kwargs):
    prompt = []
    num_variable_regions = kwargs['num_variable_regions']
    grid_size = kwargs['grid_size']

    # ── context shortcuts ────────────────────────────────────────────────
    node_names = kwargs['node_name_list']  # list[str]
    placed_num_macro = kwargs['placed_num_macro']
    num_macro_placed = kwargs['num_macro_placed']
    color_cfg = kwargs['color_config']  # {macro:color}
    cg_count = kwargs['color_group_count']  # {color:int}
    cg_to_first_macro = kwargs['color_group_to_first_macro']  # {color:macro}
    node_shortname = kwargs['node_name_to_short_name']  # {macro:str}
    node_to_idx = kwargs['node_to_idx']  # {macro:int}
    dims_int = kwargs['node_dims_int']  # (M,2) ints
    dims_real = kwargs['node_dims_real']  # (M,2) µm
    ratio_x = kwargs['ratio_x']  # µm ↔ grid
    ratio_y = kwargs['ratio_y']

    # ── 1) Task description ─────────────────────────────────────────────
    prompt.append(
            "You are guiding a low-level placement policy for computer chip "
            "floorplanning. Your task is to suggest rectangular regions for "
            "placing macros on the chip canvas, which has been divided into a "
            "grid. The low-level policy will choose the exact placement location "
            "within your suggested regions. If there is a macro "
            "in the netlist that you are not providing a suggestion for, the "
            "low-level policy will place that macro by itself.\n\n"
            "The macros are grouped by colors based on their connectivity in the "
            "netlist graph, where macros with higher interconnectivity (more pin "
            "connections between them) are assigned similar colors. Your "
            "suggestions will provide a starting point for creating a complete "
            "chip floorplan.\n"
    )

    # ── 2) Choose the macros to suggest regions for ---------------------
    remaining_macros = node_names[num_macro_placed:placed_num_macro]

    colors, group_counts = zip(*cg_count.items())  # parallel tuples
    total_count = sum(group_counts)
    probs_by_grp = [cnt / total_count for cnt in group_counts]

    # a) one macro per colour group (without replacement)
    selected_groups = np.random.choice(
            colors,
            size=min(num_variable_regions, len(colors)),
            replace=False,
            p=probs_by_grp
    )

    selected_macros = set()
    for g in selected_groups:
        m = cg_to_first_macro[g]
        if m in remaining_macros:
            selected_macros.add(m)

    # b) add extra macros if we still need more (area-weighted)
    remaining_macros = list(set(remaining_macros) - selected_macros)
    if len(selected_macros) < num_variable_regions and remaining_macros:
        idxs = [node_to_idx[m] for m in remaining_macros]
        areas = np.array([dims_real[i, 0] * dims_real[i, 1] for i in idxs],
                         dtype=np.float64)
        probs = areas / areas.sum()

        need = min(num_variable_regions - len(selected_macros),
                   len(remaining_macros))
        extra = np.random.choice(remaining_macros, size=need,
                                 replace=False, p=probs)
        selected_macros.update(extra)

    # ── 3) Build first_macros list --------------------------------------
    first_macros = []
    for m in selected_macros:
        idx = node_to_idx[m]
        w_int, h_int = dims_int[idx]
        first_macros.append(dict(
                name=m,
                short_name=node_shortname[m],
                color=color_cfg[m],
                width=int(w_int),
                height=int(h_int),
                num_macros_in_group=cg_count[color_cfg[m]],
        ))

    # ── 4) Explanatory text ---------------------------------------------
    prompt.append(
            "This is a global optimization task where you need to consider:\n"
            "- The impact of your suggested regions on macros that will be placed "
            "in the future\n"
            "- The overall arrangement of the selected macros that minimizes "
            "wirelength\n\n"
    )

    prompt.append("\n\n# MACRO NAMES AND PROPERTIES FOR THIS NETLIST:\n\n")
    prompt.append(
            "THE TABLE BELOW DISPLAYS ALL MACROS IN THE ORDER THAT THEY WILL BE PLACED:\n\n"
    )

    # table describing every macro
    macro_data = []
    for m in node_names:
        idx = node_to_idx[m]
        macro_data.append(dict(
                name=node_shortname[m],
                full_name=m,
                color=color_cfg[m],
                width=int(dims_int[idx, 0]),
                height=int(dims_int[idx, 1]),
        ))

    hdr = "|| " + " | ".join(d['name'] for d in macro_data) + " |\n"
    hdr += "|:----------:|" + "|".join([":---:"] * len(macro_data)) + "|\n"
    row_color = "| **Color**  | " + " | ".join(
            f" {d['color']} " for d in macro_data) + " |\n"
    row_size = "| **W x H**  | " + " | ".join(
            f" {d['width']} x {d['height']} " for d in macro_data) + " |\n"
    prompt.append(hdr + row_color + row_size + "\n\n")

    # placement rules
    prompt.append("# IMPORTANT PLACEMENT RULES:\n")
    prompt.append(f"1. THE CHIP CANVAS IS {grid_size}x{grid_size}\n")
    prompt.append(
            "2. COORDINATE SYSTEM:\n"
            f"   - ORIGIN (0,0) IS AT BOTTOM-LEFT CORNER\n"
            f"   - TOP-LEFT CORNER IS (0,{grid_size})\n"
            f"   - BOTTOM-RIGHT CORNER IS ({grid_size},0)\n"
            f"   - TOP-RIGHT CORNER IS ({grid_size},{grid_size})\n"
    )
    prompt.append(
            "3. SUGGESTED REGIONS MUST BE DEFINED BY BOTTOM-LEFT AND TOP-RIGHT CORNERS OF THE RECTANGLE\n")
    prompt.append("4. SUGGESTED REGIONS MUST NOT OVERLAP WITH EACH OTHER\n")
    prompt.append("5. SUGGESTIONS ARE NEEDED FOR THESE SELECTED MACROS:\n")

    # list selected macros sorted by area (largest first)
    for info in sorted(first_macros,
                       key=lambda d: d['width'] * d['height'],
                       reverse=True):
        prompt.append(
                f"\t - {info['short_name']}\n"
                f"\t\t - Size: {info['width']:.0f} x {info['height']:.0f}\n"
                f"\t\t - Color: {info['color']}\n"
        )
    prompt.append('\n')

    prompt.append("# PLACEMENT QUALITY METRICS:\n")
    prompt.append("- LOWER WIRELENGTH IS BETTER\n")
    prompt.append("- MACRO OVERLAP MUST BE ZERO (overlapping placements are invalid)\n\n")

    return prompt, dict(
            selected_macros=selected_macros,
            first_macros=sorted(first_macros,
                                key=lambda d: d['width'] * d['height'],
                                reverse=True),
            macro_data=macro_data
    )


def preamble_recall_test(**kwargs):
    """
    Prompt variant used in the *Verbatim-Recall* ablation.
    Almost identical to `preamble_variable_regions`, but the task description
    makes clear that the model must **repeat the coordinates from a reference
    episode** instead of suggesting new regions, and the footer tells the
    model what output format to use.
    """
    prompt = []
    num_variable_regions = kwargs["num_variable_regions"]
    grid_size = kwargs["grid_size"]

    # ---------- context shortcuts ----------------------------------------
    node_names = kwargs["node_name_list"]
    placed_num_macro = kwargs["placed_num_macro"]
    num_macro_placed = kwargs["num_macro_placed"]
    color_cfg = kwargs["color_config"]  # {macro: color}
    cg_count = kwargs["color_group_count"]  # {color: int}
    cg_to_first_macro = kwargs["color_group_to_first_macro"]
    node_shortname = kwargs["node_name_to_short_name"]  # {macro: str}
    node_to_idx = kwargs["node_to_idx"]  # {macro: int}
    dims_int = kwargs["node_dims_int"]  # (M, 2) grid
    dims_real = kwargs["node_dims_real"]  # (M, 2) µm
    target_episode_index = kwargs["target_episode_index"]  # 1-based
    # ---------------------------------------------------------------------
    # 1) Task description  (changed: highlight “recall test”)
    # ---------------------------------------------------------------------
    prompt.append(
            "You are guiding a low-level placement policy for computer-chip "
            "floorplanning. **This is a *recall test*: do not optimise or invent "
            "new placements.  Simply repeat the exact macro locations from "
            f"reference episode #{target_episode_index + 1}.**\n\n"
            "The macros are grouped by colors based on their connectivity in the "
            "netlist graph (more pin connections → similar colors).  You will be "
            "asked to output the bottom-left corner of each selected macro.\n"
    )

    # ---------------------------------------------------------------------
    # 2) Choose which macros to “recall” (same logic as baseline)
    # ---------------------------------------------------------------------
    remaining_macros = node_names[num_macro_placed:placed_num_macro]

    colors, group_counts = zip(*cg_count.items())
    probs_by_group = np.array(group_counts) / sum(group_counts)

    selected_groups = np.random.choice(
            colors,
            size=min(num_variable_regions, len(colors)),
            replace=False,
            p=probs_by_group,
    )

    selected_macros = set()
    for g in selected_groups:
        m = cg_to_first_macro[g]
        if m in remaining_macros:
            selected_macros.add(m)

    remaining_macros = list(set(remaining_macros) - selected_macros)
    if len(selected_macros) < num_variable_regions and remaining_macros:
        idxs = [node_to_idx[m] for m in remaining_macros]
        areas = np.array(
                [dims_real[i, 0] * dims_real[i, 1] for i in idxs],
                dtype=np.float64
        )
        probs = areas / areas.sum()
        need = min(num_variable_regions - len(selected_macros),
                   len(remaining_macros))
        extras = np.random.choice(remaining_macros, size=need,
                                  replace=False, p=probs)
        selected_macros.update(extras)

    # ---------------------------------------------------------------------
    # Build first_macros list (unchanged)
    # ---------------------------------------------------------------------
    first_macros = []
    for m in selected_macros:
        idx = node_to_idx[m]
        first_macros.append(
                dict(
                        name=m,
                        short_name=node_shortname[m],
                        color=color_cfg[m],
                        width=int(dims_int[idx, 0]),  # grid units
                        height=int(dims_int[idx, 1]),
                        num_macros_in_group=cg_count[color_cfg[m]],
                )
        )

    # ---------------------------------------------------------------------
    # 3) Macro table (unchanged)
    # ---------------------------------------------------------------------
    prompt.append("\n\n# MACRO NAMES AND PROPERTIES FOR THIS NETLIST:\n\n")

    macro_data = []
    for m in node_names:
        idx = node_to_idx[m]
        macro_data.append(
                dict(
                        name=node_shortname[m],
                        full_name=m,
                        color=color_cfg[m],
                        width=int(dims_int[idx, 0]),
                        height=int(dims_int[idx, 1]),
                )
        )

    header = "|| " + " | ".join(d["name"] for d in macro_data) + " |\n"
    header += "|:----------:|" + "|".join([":---:"] * len(macro_data)) + "|\n"
    row_clr = "| **Color**  | " + " | ".join(
            f" {d['color']} " for d in macro_data
    ) + " |\n"
    row_sz = "| **W x H**  | " + " | ".join(
            f" {d['width']:.0f} x {d['height']:.0f} " for d in macro_data
    ) + " |\n"
    prompt.append(header + row_clr + row_sz + "\n\n")

    # ---------------------------------------------------------------------
    # 4) Placement rules (mostly same; trimmed optimisation bits)
    # ---------------------------------------------------------------------
    prompt.append("# IMPORTANT RULES / COORDINATE SYSTEM:\n")
    prompt.append(f"1. CHIP CANVAS SIZE: {grid_size} × {grid_size}\n")
    prompt.append(
            "2. ORIGIN (0,0) is bottom-left; (0,{g}) is top-left; "
            "({g},0) is bottom-right; ({g},{g}) is top-right.\n".format(
                    g=grid_size)
    )
    prompt.append("\n")

    # ---------------------------------------------------------------------
    # 5) Response format (replaces quality-metric block)
    # ---------------------------------------------------------------------
    prompt.append("# RESPONSE FORMAT:\n")
    prompt.append("Provide one line for each macro you are asked to recall:\n")
    prompt.append("    <SHORT_NAME>: (x, y)\n\n")

    # ---------------------------------------------------------------------
    return prompt, dict(
            selected_macros=selected_macros,
            first_macros=sorted(first_macros,
                                key=lambda d: d["width"] * d["height"],
                                reverse=True),
            macro_data=macro_data,
    )


def preamble_variable_regions(**kwargs):
    prompt = []
    num_variable_regions = kwargs['num_variable_regions']
    grid_size = kwargs['grid_size']

    # ---------- context shortcuts ----------------------------------------
    node_names = kwargs['node_name_list']
    placed_num_macro = kwargs['placed_num_macro']
    num_macro_placed = kwargs['num_macro_placed']
    color_cfg = kwargs['color_config']  # {macro:color}
    cg_count = kwargs['color_group_count']  # {color:int}
    cg_to_first_macro = kwargs['color_group_to_first_macro']  # {color:macro}
    node_shortname = kwargs['node_name_to_short_name']  # {macro:str}
    node_to_idx = kwargs['node_to_idx']  # {macro:int}
    dims_int = kwargs['node_dims_int']  # (M,2) ints
    dims_real = kwargs['node_dims_real']  # (M,2) µm

    # ---------------------------------------------------------------------
    # 1) Task description
    # ---------------------------------------------------------------------
    prompt.append(
            "You are guiding a low-level placement policy for computer chip "
            "floorplanning. Your primary goal is to create the most optimal chip "
            "floorplan possible that minimizes wirelength. Your task is to "
            "suggest rectangular regions for placing macros on the chip canvas, "
            "which has been divided into a grid. The low-level policy will choose "
            "the exact placement location within your suggested regions. Your "
            "suggestions should be highly precise and optimal. If there is a macro "
            "in the netlist that you are not providing a suggestion for, the "
            "low-level policy will place that macro by itself.\n\n"
            "The macros are grouped by colors based on their connectivity in the "
            "netlist graph, where macros with higher interconnectivity "
            "(more pin connections between them) are assigned similar colors. "
            "Your goal is to provide optimal region suggestions that will result "
            "in the best possible chip floorplan with minimal wirelength.\n\n"
            "After you place the macros, an analytical placer automatically "
            "positions the standard cells around them. Your macro placement "
            "directly affects how the standard cells are arranged.\n"
    )

    # ---------------------------------------------------------------------
    # 2) Choose which macros to suggest regions for
    # ---------------------------------------------------------------------
    remaining_macros = node_names[num_macro_placed:placed_num_macro]

    colors, group_counts = zip(*cg_count.items())
    probs_by_group = np.array(group_counts) / sum(group_counts)

    # One macro from each selected colour group
    selected_groups = np.random.choice(
            colors,
            size=min(num_variable_regions, len(colors)),
            replace=False,
            p=probs_by_group
    )

    selected_macros = set()
    for g in selected_groups:
        m = cg_to_first_macro[g]
        if m in remaining_macros:
            selected_macros.add(m)

    # Add extra macros (area-weighted) if needed
    remaining_macros = list(set(remaining_macros) - selected_macros)
    if len(selected_macros) < num_variable_regions and remaining_macros:
        idxs = [node_to_idx[m] for m in remaining_macros]
        areas = np.array([dims_real[i, 0] * dims_real[i, 1] for i in idxs],
                         dtype=np.float64)
        probs = areas / areas.sum()
        need = min(num_variable_regions - len(selected_macros),
                   len(remaining_macros))
        extras = np.random.choice(remaining_macros, size=need,
                                  replace=False, p=probs)
        selected_macros.update(extras)

    # Build first_macros list
    first_macros = []
    for m in selected_macros:
        idx = node_to_idx[m]
        first_macros.append(dict(
                name=m,
                short_name=node_shortname[m],
                color=color_cfg[m],
                width=int(dims_int[idx, 0]),  # grid units
                height=int(dims_int[idx, 1]),
                num_macros_in_group=cg_count[color_cfg[m]],
        ))

    # ---------------------------------------------------------------------
    # 3) Explanatory section & full macro table
    # ---------------------------------------------------------------------
    prompt.append(
            "This is a global optimization task where you need to consider:\n"
            "- The impact of your suggested regions on macros that will be placed in the future\n"
            "- The overall arrangement of the selected macros that minimizes wirelength\n\n"
    )

    prompt.append("\n\n# MACRO NAMES AND PROPERTIES FOR THIS NETLIST:\n\n")

    macro_data = []
    for m in node_names:
        idx = node_to_idx[m]
        macro_data.append(dict(
                name=node_shortname[m],
                full_name=m,
                color=color_cfg[m],
                width=int(dims_int[idx, 0]),
                height=int(dims_int[idx, 1]),
        ))

    header = "|| " + " | ".join(d["name"] for d in macro_data) + " |\n"
    header += "|:----------:|" + "|".join([":---:"] * len(macro_data)) + "|\n"
    row_clr = "| **Color**  | " + " | ".join(
            f" {d['color']} " for d in macro_data) + " |\n"
    row_sz = "| **W x H**  | " + " | ".join(
            f" {d['width']:.0f} x {d['height']:.0f} " for d in
            macro_data) + " |\n"
    prompt.append(header + row_clr + row_sz + "\n\n")

    # ---------------------------------------------------------------------
    # 4) Placement rules and list selected macros
    # ---------------------------------------------------------------------
    prompt.append("# IMPORTANT PLACEMENT RULES:\n")
    prompt.append(f"1. THE CHIP CANVAS IS {grid_size}x{grid_size}\n")
    prompt.append(
            "2. COORDINATE SYSTEM:\n"
            f"   - ORIGIN (0,0) IS AT BOTTOM-LEFT CORNER\n"
            f"   - TOP-LEFT CORNER IS (0,{grid_size})\n"
            f"   - BOTTOM-RIGHT CORNER IS ({grid_size},0)\n"
            f"   - TOP-RIGHT CORNER IS ({grid_size},{grid_size})\n"
    )
    prompt.append(
            "3. SUGGESTED REGIONS MUST BE DEFINED BY BOTTOM-LEFT AND TOP-RIGHT CORNERS OF THE RECTANGLE\n")
    prompt.append("4. SUGGESTED REGIONS MUST NOT OVERLAP WITH EACH OTHER\n")
    prompt.append("5. SUGGESTIONS ARE NEEDED FOR THESE SELECTED MACROS:\n")

    for info in sorted(first_macros,
                       key=lambda d: d['width'] * d['height'],
                       reverse=True):
        prompt.append(
                f"\t - {info['short_name']}\n"
                f"\t\t - Size: {info['width']:.0f} x {info['height']:.0f}\n"
                f"\t\t - Color: {info['color']}\n"
        )
    prompt.append('\n')

    prompt.append("# PLACEMENT QUALITY METRICS:\n")
    prompt.append("- LOWER WIRELENGTH IS BETTER\n")
    prompt.append("- MACRO OVERLAP MUST BE ZERO (overlapping placements are invalid)\n\n")

    return prompt, dict(
            selected_macros=selected_macros,
            first_macros=sorted(first_macros,
                                key=lambda d: d['width'] * d['height'],
                                reverse=True),
            macro_data=macro_data
    )


def preamble_all_regions(**kwargs):
    """
    Content-equivalent rewrite of the original function with **no `env`
    reference**.  All data come from the unpacked context dict.
    """
    prompt = []

    # ───────────────────── context shortcuts ──────────────────────────
    node_names = kwargs['node_name_list']
    placed_num_macro = kwargs['placed_num_macro']
    num_macro_placed = kwargs['num_macro_placed']
    color_group_count = kwargs['color_group_count']  # {color:int}
    first_macro_of_cg = kwargs['first_macro_of_color_group']  # {macro:color}
    node_shortname = kwargs['node_name_to_short_name']  # {macro:str}
    node_to_idx = kwargs['node_to_idx']  # {macro:int}
    dims_int = kwargs['node_dims_int']  # (M,2) ints
    color_cfg = kwargs['color_config']  # {macro:color}

    # ------------------------------------------------------------------
    #  Task description – identical text
    # ------------------------------------------------------------------
    prompt.append(
            "You are guiding a low-level placement policy for computer chip floorplanning. "
            "Your task is to suggest rectangular regions that can FULLY CONTAIN the first "
            "macro of each color group on the chip canvas, which has been divided into a grid. "
            "The low-level policy will choose the exact placement location within your suggested regions.\n\n"
            "The color groups are derived from analyzing the connectivity graph between macros, "
            "where macros with higher interconnectivity (more pin connections between them) "
            "are assigned the same color. Your guidance for the first macro of each color "
            "will help establish a pattern for placing all remaining macros of that color.\n"
    )

    # ------------------------------------------------------------------
    #  Select colour groups (weighted by group size) and gather macros
    # ------------------------------------------------------------------
    colors, group_counts = zip(*color_group_count.items())  # tuples
    total = sum(group_counts)
    probs = np.array(group_counts) / total

    chosen_groups = np.random.choice(
            colors,
            size=min(MAX_NUM_COLOR_GROUPS, len(colors)),
            replace=False,
            p=probs
    )
    chosen_groups = set(chosen_groups)

    selected_macros = set()
    first_macros = []

    for m in node_names[num_macro_placed:placed_num_macro]:
        if m in first_macro_of_cg and first_macro_of_cg[m] in chosen_groups:
            color = first_macro_of_cg[m]
            idx = node_to_idx[m]
            w_int, h_int = dims_int[idx]

            selected_macros.add(m)
            first_macros.append(dict(
                    name=m,
                    short_name=node_shortname[m],
                    color=color,
                    width=int(w_int),
                    height=int(h_int),
                    num_macros_in_group=color_group_count[color]
            ))

    # ------------------------------------------------------------------
    #  Additional explanatory text (unchanged)
    # ------------------------------------------------------------------
    prompt.append(
            "This is a global optimization task where you need to consider:\n"
            "- How each color group's first macro placement affects the remaining macros of that color\n"
            "- The impact of completed color groups on future color group placements\n"
            "- The overall arrangement of color groups to minimize wirelength\n\n"
            "Focus on suggesting regions that will EXPLORE the design space to further minimize overall wirelength.\n\n"
    )

    return prompt, dict(selected_macros=selected_macros,
                        first_macros=first_macros)


def preamble_random_regions(**kwargs):
    """
    Select up to MAX_NUM_COLOR_GROUPS colour groups (weighted by size) and
    return the first macro of each chosen group.  Produces **no prompt text**
    – the caller uses the metadata only.
    """
    # ── context shortcuts ────────────────────────────────────────────────
    node_names = kwargs['node_name_list']
    placed_num_macro = kwargs['placed_num_macro']
    num_macro_placed = kwargs['num_macro_placed']
    color_group_count = kwargs['color_group_count']  # {color:int}
    first_macro_of_cg = kwargs['first_macro_of_color_group']  # {macro:color}
    node_shortname = kwargs['node_name_to_short_name']  # {macro:str}
    node_to_idx = kwargs['node_to_idx']  # {macro:int}
    dims_int = kwargs['node_dims_int']  # (M,2) ints

    # ── choose colour groups (weighted by size) -------------------------
    colors, group_counts = zip(*color_group_count.items())  # parallel tuples
    probs = np.array(group_counts) / sum(group_counts)

    selected_groups = np.random.choice(
            colors,
            size=min(MAX_NUM_COLOR_GROUPS, len(colors)),
            replace=False,
            p=probs
    )
    selected_groups = set(selected_groups)

    # ── gather the first macro of each selected group -------------------
    selected_macros = set()
    first_macros = []

    for macro in node_names[num_macro_placed:placed_num_macro]:
        if (macro in first_macro_of_cg and
                first_macro_of_cg[macro] in selected_groups):
            color = first_macro_of_cg[macro]
            idx = node_to_idx[macro]
            width = int(math.ceil(dims_int[idx, 0]))
            height = int(math.ceil(dims_int[idx, 1]))

            selected_macros.add(macro)
            first_macros.append(dict(
                    name=macro,
                    short_name=node_shortname[macro],
                    color=color,
                    width=width,
                    height=height,
                    num_macros_in_group=color_group_count[color],
            ))

    # Return *empty* prompt plus metadata (matches original behaviour)
    return [], dict(selected_macros=selected_macros,
                    first_macros=first_macros)


def preamble_exploration(**kwargs):
    """
    Identical to preamble_variable_regions_greedy, but with instructions
    explicitly encouraging exploration and novelty.
    """
    prompt = []
    num_variable_regions = kwargs['num_variable_regions']
    grid_size = kwargs['grid_size']

    # ── context shortcuts ────────────────────────────────────────────────
    node_names = kwargs['node_name_list']  # list[str]
    placed_num_macro = kwargs['placed_num_macro']
    num_macro_placed = kwargs['num_macro_placed']
    color_cfg = kwargs['color_config']  # {macro:color}
    cg_count = kwargs['color_group_count']  # {color:int}
    cg_to_first_macro = kwargs['color_group_to_first_macro']  # {color:macro}
    node_shortname = kwargs['node_name_to_short_name']  # {macro:str}
    node_to_idx = kwargs['node_to_idx']  # {macro:int}
    dims_int = kwargs['node_dims_int']  # (M,2) ints
    dims_real = kwargs['node_dims_real']  # (M,2) µm
    ratio_x = kwargs['ratio_x']  # µm ↔ grid
    ratio_y = kwargs['ratio_y']

    # ── 1) Task description (MODIFIED FOR EXPLORATION) ──────────────────
    prompt.append(
            "You are guiding a low-level placement policy for computer chip "
            "floorplanning. Your primary goal is to EXPLORE NOVEL design configurations to discover new, optimal floorplans that minimize wirelength. "
            "The previous examples provided are for context only, to show you what has been tried. Do not be constrained by them. Your task is to suggest "
            "diverse and creative rectangular regions for placing macros on the chip canvas. Prioritize novelty and exploration to find potentially superior placements.\n\n"
            "The macros are grouped by colors based on their connectivity in the "
            "netlist graph, where macros with higher interconnectivity (more pin "
            "connections between them) are assigned similar colors. Your "
            "suggestions will provide a starting point for creating a complete "
            "chip floorplan.\n"
    )

    # ── 2) Choose the macros to suggest regions for (UNCHANGED) ---------------------
    remaining_macros = node_names[num_macro_placed:placed_num_macro]

    colors, group_counts = zip(*cg_count.items())  # parallel tuples
    total_count = sum(group_counts)
    probs_by_grp = [cnt / total_count for cnt in group_counts]

    # a) one macro per colour group (without replacement)
    selected_groups = np.random.choice(
            colors,
            size=min(num_variable_regions, len(colors)),
            replace=False,
            p=probs_by_grp
    )

    selected_macros = set()
    for g in selected_groups:
        m = cg_to_first_macro[g]
        if m in remaining_macros:
            selected_macros.add(m)

    # b) add extra macros if we still need more (area-weighted)
    remaining_macros = list(set(remaining_macros) - selected_macros)
    if len(selected_macros) < num_variable_regions and remaining_macros:
        idxs = [node_to_idx[m] for m in remaining_macros]
        areas = np.array([dims_real[i, 0] * dims_real[i, 1] for i in idxs],
                         dtype=np.float64)
        probs = areas / areas.sum()

        need = min(num_variable_regions - len(selected_macros),
                   len(remaining_macros))
        extra = np.random.choice(remaining_macros, size=need,
                                 replace=False, p=probs)
        selected_macros.update(extra)

    # ── 3) Build first_macros list (UNCHANGED) --------------------------------------
    first_macros = []
    for m in selected_macros:
        idx = node_to_idx[m]
        w_int, h_int = dims_int[idx]
        first_macros.append(dict(
                name=m,
                short_name=node_shortname[m],
                color=color_cfg[m],
                width=int(w_int),
                height=int(h_int),
                num_macros_in_group=cg_count[color_cfg[m]],
        ))

    # ── 4) Explanatory text (UNCHANGED) ---------------------------------------------
    prompt.append(
            "This is a global optimization task where you need to consider:\n"
            "- The impact of your suggested regions on macros that will be placed "
            "in the future\n"
            "- The overall arrangement of the selected macros that minimizes "
            "wirelength\n\n"
    )

    prompt.append("\n\n# MACRO NAMES AND PROPERTIES FOR THIS NETLIST:\n\n")
    prompt.append(
            "THE TABLE BELOW DISPLAYS ALL MACROS IN THE ORDER THAT THEY WILL BE PLACED:\n\n"
    )

    # table describing every macro
    macro_data = []
    for m in node_names:
        idx = node_to_idx[m]
        macro_data.append(dict(
                name=node_shortname[m],
                full_name=m,
                color=color_cfg[m],
                width=int(dims_int[idx, 0]),
                height=int(dims_int[idx, 1]),
        ))

    hdr = "|| " + " | ".join(d['name'] for d in macro_data) + " |\n"
    hdr += "|:----------:|" + "|".join([":---:"] * len(macro_data)) + "|\n"
    row_color = "| **Color**  | " + " | ".join(
            f" {d['color']} " for d in macro_data) + " |\n"
    row_size = "| **W x H**  | " + " | ".join(
            f" {d['width']} x {d['height']} " for d in macro_data) + " |\n"
    prompt.append(hdr + row_color + row_size + "\n\n")

    # placement rules
    prompt.append("# IMPORTANT PLACEMENT RULES:\n")
    prompt.append(f"1. THE CHIP CANVAS IS {grid_size}x{grid_size}\n")
    prompt.append(
            "2. COORDINATE SYSTEM:\n"
            f"   - ORIGIN (0,0) IS AT BOTTOM-LEFT CORNER\n"
            f"   - TOP-LEFT CORNER IS (0,{grid_size})\n"
            f"   - BOTTOM-RIGHT CORNER IS ({grid_size},0)\n"
            f"   - TOP-RIGHT CORNER IS ({grid_size},{grid_size})\n"
    )
    prompt.append(
            "3. SUGGESTED REGIONS MUST BE DEFINED BY BOTTOM-LEFT AND TOP-RIGHT CORNERS OF THE RECTANGLE\n")
    prompt.append("4. SUGGESTED REGIONS MUST NOT OVERLAP WITH EACH OTHER\n")
    prompt.append("5. SUGGESTIONS ARE NEEDED FOR THESE SELECTED MACROS:\n")

    # list selected macros sorted by area (largest first)
    for info in sorted(first_macros,
                       key=lambda d: d['width'] * d['height'],
                       reverse=True):
        prompt.append(
                f"\t - {info['short_name']}\n"
                f"\t\t - Size: {info['width']:.0f} x {info['height']:.0f}\n"
                f"\t\t - Color: {info['color']}\n"
        )
    prompt.append('\n')

    prompt.append("# PLACEMENT QUALITY METRICS:\n")
    prompt.append("- LOWER WIRELENGTH IS BETTER\n")
    prompt.append("- MACRO OVERLAP MUST BE ZERO (overlapping placements are invalid)\n\n")

    return prompt, dict(
            selected_macros=selected_macros,
            first_macros=sorted(first_macros,
                                key=lambda d: d['width'] * d['height'],
                                reverse=True),
            macro_data=macro_data
    )


def preamble_conservative(**kwargs):
    """
    Identical to preamble_variable_regions_greedy, but with instructions
    explicitly encouraging conservative, safe placements based on history.
    """
    prompt = []
    num_variable_regions = kwargs['num_variable_regions']
    grid_size = kwargs['grid_size']

    # ── context shortcuts ────────────────────────────────────────────────
    node_names = kwargs['node_name_list']  # list[str]
    placed_num_macro = kwargs['placed_num_macro']
    num_macro_placed = kwargs['num_macro_placed']
    color_cfg = kwargs['color_config']  # {macro:color}
    cg_count = kwargs['color_group_count']  # {color:int}
    cg_to_first_macro = kwargs['color_group_to_first_macro']  # {color:macro}
    node_shortname = kwargs['node_name_to_short_name']  # {macro:str}
    node_to_idx = kwargs['node_to_idx']  # {macro:int}
    dims_int = kwargs['node_dims_int']  # (M,2) ints
    dims_real = kwargs['node_dims_real']  # (M,2) µm
    ratio_x = kwargs['ratio_x']  # µm ↔ grid
    ratio_y = kwargs['ratio_y']

    # ── 1) Task description (MODIFIED FOR CONSERVATISM) ──────────────────
    prompt.append(
            "You are guiding a low-level placement policy for computer chip "
            "floorplanning. Your goal is to refine existing high-quality placements. "
            "The previous examples provided are high-quality solutions. Your task is to suggest regions that are VERY SIMILAR to these successful examples. "
            "Do not deviate significantly. The goal is to exploit the known good solutions, not explore new ones.\n\n"
            "The macros are grouped by colors based on their connectivity in the "
            "netlist graph, where macros with higher interconnectivity (more pin "
            "connections between them) are assigned similar colors. Your "
            "suggestions will provide a starting point for creating a complete "
            "chip floorplan.\n"
    )

    # ── 2) Choose the macros to suggest regions for (UNCHANGED) ---------------------
    remaining_macros = node_names[num_macro_placed:placed_num_macro]

    colors, group_counts = zip(*cg_count.items())  # parallel tuples
    total_count = sum(group_counts)
    probs_by_grp = [cnt / total_count for cnt in group_counts]

    # a) one macro per colour group (without replacement)
    selected_groups = np.random.choice(
            colors,
            size=min(num_variable_regions, len(colors)),
            replace=False,
            p=probs_by_grp
    )

    selected_macros = set()
    for g in selected_groups:
        m = cg_to_first_macro[g]
        if m in remaining_macros:
            selected_macros.add(m)

    # b) add extra macros if we still need more (area-weighted)
    remaining_macros = list(set(remaining_macros) - selected_macros)
    if len(selected_macros) < num_variable_regions and remaining_macros:
        idxs = [node_to_idx[m] for m in remaining_macros]
        areas = np.array([dims_real[i, 0] * dims_real[i, 1] for i in idxs],
                         dtype=np.float64)
        probs = areas / areas.sum()

        need = min(num_variable_regions - len(selected_macros),
                   len(remaining_macros))
        extra = np.random.choice(remaining_macros, size=need,
                                 replace=False, p=probs)
        selected_macros.update(extra)

    # ── 3) Build first_macros list (UNCHANGED) --------------------------------------
    first_macros = []
    for m in selected_macros:
        idx = node_to_idx[m]
        w_int, h_int = dims_int[idx]
        first_macros.append(dict(
                name=m,
                short_name=node_shortname[m],
                color=color_cfg[m],
                width=int(w_int),
                height=int(h_int),
                num_macros_in_group=cg_count[color_cfg[m]],
        ))

    # ── 4) Explanatory text (UNCHANGED) ---------------------------------------------
    prompt.append(
            "This is a global optimization task where you need to consider:\n"
            "- The impact of your suggested regions on macros that will be placed "
            "in the future\n"
            "- The overall arrangement of the selected macros that minimizes "
            "wirelength\n\n"
    )

    prompt.append("\n\n# MACRO NAMES AND PROPERTIES FOR THIS NETLIST:\n\n")
    prompt.append(
            "THE TABLE BELOW DISPLAYS ALL MACROS IN THE ORDER THAT THEY WILL BE PLACED:\n\n"
    )

    # table describing every macro
    macro_data = []
    for m in node_names:
        idx = node_to_idx[m]
        macro_data.append(dict(
                name=node_shortname[m],
                full_name=m,
                color=color_cfg[m],
                width=int(dims_int[idx, 0]),
                height=int(dims_int[idx, 1]),
        ))

    hdr = "|| " + " | ".join(d['name'] for d in macro_data) + " |\n"
    hdr += "|:----------:|" + "|".join([":---:"] * len(macro_data)) + "|\n"
    row_color = "| **Color**  | " + " | ".join(
            f" {d['color']} " for d in macro_data) + " |\n"
    row_size = "| **W x H**  | " + " | ".join(
            f" {d['width']} x {d['height']} " for d in macro_data) + " |\n"
    prompt.append(hdr + row_color + row_size + "\n\n")

    # placement rules
    prompt.append("# IMPORTANT PLACEMENT RULES:\n")
    prompt.append(f"1. THE CHIP CANVAS IS {grid_size}x{grid_size}\n")
    prompt.append(
            "2. COORDINATE SYSTEM:\n"
            f"   - ORIGIN (0,0) IS AT BOTTOM-LEFT CORNER\n"
            f"   - TOP-LEFT CORNER IS (0,{grid_size})\n"
            f"   - BOTTOM-RIGHT CORNER IS ({grid_size},0)\n"
            f"   - TOP-RIGHT CORNER IS ({grid_size},{grid_size})\n"
    )
    prompt.append(
            "3. SUGGESTED REGIONS MUST BE DEFINED BY BOTTOM-LEFT AND TOP-RIGHT CORNERS OF THE RECTANGLE\n")
    prompt.append("4. SUGGESTED REGIONS MUST NOT OVERLAP WITH EACH OTHER\n")
    prompt.append("5. SUGGESTIONS ARE NEEDED FOR THESE SELECTED MACROS:\n")

    # list selected macros sorted by area (largest first)
    for info in sorted(first_macros,
                       key=lambda d: d['width'] * d['height'],
                       reverse=True):
        prompt.append(
                f"\t - {info['short_name']}\n"
                f"\t\t - Size: {info['width']:.0f} x {info['height']:.0f}\n"
                f"\t\t - Color: {info['color']}\n"
        )
    prompt.append('\n')

    prompt.append("# PLACEMENT QUALITY METRICS:\n")
    prompt.append("- LOWER WIRELENGTH IS BETTER\n")
    prompt.append("- MACRO OVERLAP MUST BE ZERO (overlapping placements are invalid)\n\n")

    return prompt, dict(
            selected_macros=selected_macros,
            first_macros=sorted(first_macros,
                                key=lambda d: d['width'] * d['height'],
                                reverse=True),
            macro_data=macro_data
    )
