"""
Robot Ontology Generation Pipeline

This script generates:
1. output_robot_graph/: UR5 standalone ontology results
2. output_mapping/: Panda + UR5 aligned ontology results (cross-robot skill mapping)
3. guidance JSON files for structured infilling (auto-generated from skill_substitutions)

Usage:
    python generate_ontology.py [--use_llm] [--model MODEL_NAME]
"""

import argparse
import json
import sys
import re
from typing import Optional
from pathlib import Path
from copy import deepcopy
from difflib import SequenceMatcher

sys.path.insert(0, str(Path(__file__).parent))

from ontology import TripleGraph, Predicates, robot_id, skill_id, obj_id
from parse_robot import parse_robot
from reasoning import (
    infer_capabilities,
    infer_skill_substitutions,
    infer_object_mappings,
    generate_report
)
from llm_hf import create_llm, DummyLLM


# Base directory
BASE_DIR = Path(__file__).parent
PROJECT_ROOT = BASE_DIR.parent

# Robot configurations
ROBOTS_RLBENCH = {
    "panda": {
        "urdf": PROJECT_ROOT / "robots/panda/panda.urdf",
        "srdf": PROJECT_ROOT / "robots/panda/panda.srdf",
        "skills": BASE_DIR / "data/panda_skills.json"
    },
    "ur5": {
        "urdf": PROJECT_ROOT / "robots/ur5/ur5_robotiq85.urdf",
        "srdf": PROJECT_ROOT / "robots/ur5/ur5_robotiq85.srdf",
        "skills": BASE_DIR / "data/ur5_skills.json"
    },
    "sawyer": {
        "urdf": PROJECT_ROOT / "robots/sawyer/sawyer_with_baxter_gripper.urdf",
        "srdf": PROJECT_ROOT / "robots/sawyer/sawyer_with_baxter_gripper.srdf",
        "skills": BASE_DIR / "data/sawyer_skills.json"
    }
}

# Genesis robot configurations
ROBOTS_GENESIS = {
    "panda": {
        "urdf": PROJECT_ROOT / "robots/panda/panda.urdf",
        "srdf": PROJECT_ROOT / "robots/panda/panda.srdf",
        "skills": BASE_DIR / "data/panda_genesis_skills.json"
    },
    "robotiq": {
        "urdf": PROJECT_ROOT / "robots/robotiq/franka_robotiq85.urdf",
        "srdf": PROJECT_ROOT / "robots/robotiq/franka_robotiq85.srdf",
        "skills": BASE_DIR / "data/robotiq_skills.json"
    },
    "suction": {
        "urdf": PROJECT_ROOT / "robots/suction/franka_suction.urdf",
        "srdf": PROJECT_ROOT / "robots/suction/franka_suction.srdf",
        "skills": BASE_DIR / "data/suction_skills.json"
    }
}

# Default: RLBench robots (for backward compatibility)
ROBOTS = ROBOTS_RLBENCH

# Score threshold for considering skill equivalence
EQUIVALENCE_SCORE_THRESHOLD = 0.8


def load_skills(skills_path: Path) -> list:
    """Load skills from JSON file."""
    with open(skills_path, 'r') as f:
        data = json.load(f)
    return data.get('skills', [])


def load_skills_as_dict(skills_path: Path) -> dict:
    """Load skills as a dictionary keyed by skill name."""
    skills = load_skills(skills_path)
    return {s['name']: s for s in skills}


def load_scene(scene_path: Path) -> dict:
    """Load scene from JSON file."""
    with open(scene_path, 'r') as f:
        return json.load(f)


def predicate_to_string(pred_item) -> str:
    """Convert predicate (dict or string) to string representation."""
    if isinstance(pred_item, str):
        return pred_item
    if isinstance(pred_item, dict):
        # Format: predicate(arg1, arg2, ...) or not(predicate(...))
        predicate = pred_item.get('predicate', '')
        args = pred_item.get('args', [])
        positive = pred_item.get('positive', True)
        pred_str = f"{predicate}({', '.join(args)})"
        if not positive:
            pred_str = f"not({pred_str})"
        return pred_str
    return str(pred_item)


def add_skills_to_graph(graph: TripleGraph, robot_name: str, skills: list):
    """Add skill triples to the graph."""
    rid = robot_id(robot_name)

    for skill in skills:
        sid = skill_id(robot_name, skill['name'])
        graph.add(rid, Predicates.HAS_SKILL, sid)
        graph.add(sid, Predicates.HAS_DESCRIPTION, skill.get('description', ''))

        for param in skill.get('parameters', []):
            param_str = f"{param['name']}:{param.get('type', 'unknown')}"
            if 'semantic' in param:
                param_str += f":{param['semantic']}"
            graph.add(sid, Predicates.HAS_PARAM, param_str)

        for pre in skill.get('preconditions', []):
            graph.add(sid, Predicates.HAS_PRE, predicate_to_string(pre))

        for eff in skill.get('effects', []):
            graph.add(sid, Predicates.HAS_EFF, predicate_to_string(eff))

        for cap in skill.get('required_capabilities', []):
            graph.add(sid, Predicates.REQUIRES_CAP, cap)


def add_scene_to_graph(graph: TripleGraph, scene: dict):
    """Add scene objects and relations to the graph."""
    scene_id = scene.get('scene_id', 'default')

    for obj in scene.get('objects', []):
        oid = obj_id(scene_id, obj['id'])
        graph.add(f"scene:{scene_id}", Predicates.HAS_OBJECT, oid)
        graph.add(oid, Predicates.HAS_TYPE, obj['type'])

        if 'pose' in obj:
            graph.add(oid, Predicates.HAS_POSE, json.dumps(obj['pose']))

        for aff in obj.get('affordances', []):
            graph.add(oid, Predicates.HAS_AFFORDANCE, aff)

    for rel in scene.get('relations', []):
        sub_oid = obj_id(scene_id, rel['sub'])
        obj_oid = obj_id(scene_id, rel['obj'])
        pred = f"rel:{rel['pred']}"
        graph.add(sub_oid, pred, obj_oid)


# ============================================================================
# Semantic Categories for Validation
# ============================================================================

# Semantic groups that MUST match for valid parameter mapping
# If a semantic belongs to a strict group, it can ONLY map to another semantic in the same group
SEMANTIC_STRICT_GROUPS = {
    'position': {'position'},
    'quat': {'quaternion'},
    'orientation': {'orientation'},
    'gripper_state': {'gripper_state', 'gripper_open_value', 'gripper_close_value'},
    'time_limit': {'time_limit'},
    'distance': {'distance', 'approach_distance'},
    'tolerance': {'position_tolerance', 'orientation_tolerance'},
}


def get_strict_group(semantic: str) -> Optional[str]:
    """Get the strict group name for a semantic, or None if not in any strict group."""
    for group_name, members in SEMANTIC_STRICT_GROUPS.items():
        if semantic in members:
            return group_name
    return None


def is_strict_semantic_mismatch(sem1: str, sem2: str) -> bool:
    """
    Check if two semantics have a strict group mismatch.
    Returns True if one semantic is in a strict group but the other is in a different group
    (or not in the same group). This is a hard reject condition.
    """
    if sem1 == sem2:
        return False

    group1 = get_strict_group(sem1)
    group2 = get_strict_group(sem2)

    # If neither is in a strict group, no strict mismatch
    if group1 is None and group2 is None:
        return False

    # If one is in a strict group, they must be in the SAME group
    if group1 is not None and group2 is not None:
        return group1 != group2

    # One is in strict group, the other is not -> strict mismatch
    return True

# Semantic groups that are compatible (can map to each other)
SEMANTIC_COMPATIBLE = {
    'position': {'position'},
    'quat': {'quaternion'},
    'orientation': {'orientation'},
    'approach_axis': {'approach_axis'},
    'approach_distance': {'approach_distance', 'distance'},
    'position_tolerance': {'position_tolerance'},
    'orientation_tolerance': {'orientation_tolerance'},
    'time_limit': {'time_limit'},
    'iteration_limit': {'iteration_limit'},
    'trajectory_resolution': {'trajectory_resolution'},
    'gripper_state': {'gripper_state', 'gripper_open_value', 'gripper_close_value'},
    'gripper_open_value': {'gripper_state', 'gripper_open_value'},
    'gripper_close_value': {'gripper_state', 'gripper_close_value'},
    'gripper_action_steps': {'gripper_action_steps', 'stabilization_steps'},
    'stabilization_steps': {'stabilization_steps', 'gripper_action_steps'},
}

# Forbidden mappings (semantic pairs that should NEVER match)
SEMANTIC_FORBIDDEN = [
    ('time_limit', 'gripper_state'),
    ('time_limit', 'gripper_open_value'),
    ('time_limit', 'gripper_close_value'),
    ('position', 'orientation'),
    ('position_tolerance', 'orientation_tolerance'),
    ('iteration_limit', 'time_limit'),
]


# ============================================================================
# Parameter Mapping Inference (Semantic-based)
# ============================================================================

def get_semantic(param: dict) -> str:
    """Get semantic field from parameter, with fallback to type-based inference."""
    if 'semantic' in param:
        return param['semantic']

    # Fallback: infer from name/type
    name = param.get('name', '').lower()
    ptype = param.get('type', '').lower()

    if 'pos' in name and 'tol' not in name:
        return 'position'
    if 'quat' in name:
        return 'quaternion'
    if 'orientation' in name:
        return 'orientation'
    if 'timeout' in name or 'time' in name:
        return 'time_limit'
    if 'threshold' in name or 'tol' in name:
        if 'pos' in name:
            return 'position_tolerance'
        if 'ori' in name:
            return 'orientation_tolerance'
        return 'position_tolerance'  # default
    if 'gripper' in name:
        if 'open' in name:
            return 'gripper_open_value'
        if 'close' in name:
            return 'gripper_close_value'
        return 'gripper_state'
    if 'max_steps' in name or 'steps' in name:
        return 'iteration_limit'
    if 'axis' in name:
        return 'approach_axis'
    if 'distance' in name:
        return 'approach_distance'

    return 'unknown'


def semantic_compatible(sem1: str, sem2: str) -> bool:
    """
    Check if two semantics are compatible for mapping.
    Bidirectional: checks both sem1's and sem2's compatibility sets.
    """
    if sem1 == sem2:
        return True

    # Check forbidden pairs
    for (a, b) in SEMANTIC_FORBIDDEN:
        if (sem1 == a and sem2 == b) or (sem1 == b and sem2 == a):
            return False

    # Check compatible groups (bidirectional)
    # sem1 -> sem2 compatible OR sem2 -> sem1 compatible
    compat_set_1 = SEMANTIC_COMPATIBLE.get(sem1, set())
    compat_set_2 = SEMANTIC_COMPATIBLE.get(sem2, set())
    return sem2 in compat_set_1 or sem1 in compat_set_2


def semantic_similarity(sem1: str, sem2: str) -> float:
    """Calculate semantic similarity score."""
    if sem1 == sem2:
        return 1.0

    # Check if compatible
    if semantic_compatible(sem1, sem2):
        return 0.8

    # Check forbidden
    for (a, b) in SEMANTIC_FORBIDDEN:
        if (sem1 == a and sem2 == b) or (sem1 == b and sem2 == a):
            return 0.0

    return 0.2  # Unknown/weak relation


def normalize_param_name(name: str) -> str:
    """Normalize parameter name for comparison."""
    name = name.lower()
    name = re.sub(r'^(target_|grasp_|place_|approach_)', '', name)
    name = re.sub(r'(_s|_rad|_tol)$', '', name)
    return name


def param_name_similarity(name1: str, name2: str) -> float:
    """Calculate similarity between two parameter names."""
    n1 = normalize_param_name(name1)
    n2 = normalize_param_name(name2)

    if n1 == n2:
        return 1.0
    if n1 in n2 or n2 in n1:
        return 0.8
    return SequenceMatcher(None, n1, n2).ratio()


def type_compatible(type1: str, type2: str) -> bool:
    """Check if two parameter types are compatible."""
    type_groups = [
        {'vec3', 'position', 'pos', 'point'},
        {'quat', 'quat_xyzw', 'quaternion', 'orientation'},
        {'float', 'double', 'number'},
        {'int', 'integer'},
        {'string', 'str'},
        {'dict', 'object', 'map'},
    ]

    t1, t2 = type1.lower(), type2.lower()
    if t1 == t2:
        return True

    for group in type_groups:
        if t1 in group and t2 in group:
            return True

    return False


def units_compatible(units1: str, units2: str) -> bool:
    """Check if units are compatible."""
    if not units1 or not units2:
        return True  # No units specified, assume compatible

    return units1.lower() == units2.lower()


def infer_parameter_mapping(source_params: list, target_params: list) -> tuple:
    """
    Infer parameter mapping between source and target skills using semantic matching.

    Returns:
        tuple: (mappings, risk_flags)
        - mappings: list of mapping dicts with confidence breakdown
        - risk_flags: list of potential issues detected
    """
    mappings = []
    risk_flags = []
    used_targets = set()

    for sp in source_params:
        sp_name = sp['name']
        sp_type = sp.get('type', '')
        sp_semantic = get_semantic(sp)
        sp_units = sp.get('units', '')

        best_match = None
        best_score = 0.0
        best_breakdown = {}

        for tp in target_params:
            if tp['name'] in used_targets:
                continue

            tp_name = tp['name']
            tp_type = tp.get('type', '')
            tp_semantic = get_semantic(tp)
            tp_units = tp.get('units', '')

            # Check forbidden semantic pairs (hard filter)
            is_forbidden = False
            for (a, b) in SEMANTIC_FORBIDDEN:
                if (sp_semantic == a and tp_semantic == b) or (sp_semantic == b and tp_semantic == a):
                    is_forbidden = True
                    break

            if is_forbidden:
                continue

            # Check strict semantic group mismatch (hard reject)
            if is_strict_semantic_mismatch(sp_semantic, tp_semantic):
                continue

            # Multi-factor scoring
            name_score = param_name_similarity(sp_name, tp_name)
            semantic_score = semantic_similarity(sp_semantic, tp_semantic)

            # Type score: conservative when type info is missing
            if not sp_type or not tp_type:
                # Type info missing - use conservative score (no bonus)
                type_score = 0.3
            elif type_compatible(sp_type, tp_type):
                # Type explicitly compatible - give bonus
                type_score = 1.0
            else:
                # Type explicitly incompatible - penalty
                type_score = 0.2

            units_score = 1.0 if units_compatible(sp_units, tp_units) else 0.5

            # Weighted combination (semantic is most important)
            total_score = (
                name_score * 0.2 +
                semantic_score * 0.5 +
                type_score * 0.2 +
                units_score * 0.1
            )

            if total_score > best_score and total_score > 0.4:
                best_score = total_score
                best_match = tp_name
                best_breakdown = {
                    'name_similarity': round(name_score, 3),
                    'semantic_similarity': round(semantic_score, 3),
                    'type_compatibility': round(type_score, 3),
                    'units_compatibility': round(units_score, 3),
                    'source_semantic': sp_semantic,
                    'target_semantic': tp_semantic,
                }

        if best_match:
            used_targets.add(best_match)
            mappings.append({
                'source': sp_name,
                'target': best_match,
                'confidence': round(best_score, 3),
                'breakdown': best_breakdown
            })

            # Add risk flags for low confidence or semantic mismatch
            if best_score < 0.7:
                risk_flags.append({
                    'type': 'low_confidence',
                    'param': sp_name,
                    'target': best_match,
                    'score': best_score,
                    'message': f"Low confidence mapping: {sp_name} -> {best_match} ({best_score:.2f})"
                })

            if best_breakdown.get('semantic_similarity', 0) < 0.8:
                risk_flags.append({
                    'type': 'semantic_mismatch',
                    'param': sp_name,
                    'source_semantic': best_breakdown.get('source_semantic'),
                    'target_semantic': best_breakdown.get('target_semantic'),
                    'message': f"Semantic mismatch: {sp_name}({best_breakdown.get('source_semantic')}) -> {best_match}({best_breakdown.get('target_semantic')})"
                })

    return mappings, risk_flags


def generate_param_mapping_text(mappings: list) -> str:
    """Generate human-readable parameter mapping text."""
    if not mappings:
        return "No direct parameter mappings identified."

    lines = ["Parameter Mapping:"]
    for m in mappings:
        lines.append(f"- {m['source']} -> {m['target']}")
    return "\n".join(lines)


def generate_function_signature(skill: dict, robot_prefix: str = "") -> str:
    """Generate a Python function signature from skill definition."""
    name = skill['name']
    params = skill.get('parameters', [])
    desc = skill.get('description', '')

    # Build parameter list
    param_strs = ["env", "task"]
    for p in params:
        pname = p['name']
        ptype = p.get('type', 'Any')

        # Map types to Python type hints
        type_map = {
            'vec3': 'np.ndarray',
            'quat_xyzw': 'np.ndarray',
            'float': 'float',
            'int': 'int',
            'string': 'str',
            'dict': 'dict',
            'bool': 'bool',
            'object': 'Shape',  # PyRep Shape object
        }
        py_type = type_map.get(ptype, 'Any')

        # Add default value for optional-looking params
        if 'timeout' in pname.lower() or 'max' in pname.lower() or 'tol' in pname.lower():
            param_strs.append(f"{pname}: {py_type} = None")
        else:
            param_strs.append(f"{pname}: {py_type}")

    param_str = ",\n    ".join(param_strs)

    signature = f"""def {name}(
    {param_str}
) -> tuple[Observation, float, bool]:
    \"\"\"
    {desc}
    \"\"\"
    pass"""

    return signature


def generate_interface_example(skill: dict, param_mappings: list, example_vars: dict = None) -> str:
    """Generate an example interface call."""
    name = skill['name']
    params = skill.get('parameters', [])

    # Default example variable names
    if example_vars is None:
        example_vars = {
            'pos': 'target_position',
            'quat': 'target_quaternion',
            'distance': '0.15',
            'axis': "'z'",
            'timeout': '10.0',
            'object': 'target_object',
        }

    args = ["env", "task"]
    default_axis = "'z'"

    # First pass: add target_object parameter if exists (by semantic or name)
    for p in params:
        pname = p['name']
        semantic = p.get('semantic', '')

        # Handle target_object parameter specifically
        if semantic == 'target_object' or pname == 'target_object':
            args.append(f"{pname}={example_vars.get('object', 'target_object')}")

    # Second pass: add other parameters (limit to first 3 non-target_object params for brevity)
    non_object_count = 0
    for p in params:
        pname = p['name']
        semantic = p.get('semantic', '')

        # Skip target_object (already added)
        if semantic == 'target_object' or pname == 'target_object':
            continue

        if non_object_count >= 3:
            break

        # Try to find a sensible example value
        if 'pos' in pname.lower():
            args.append(f"{pname}={example_vars.get('pos', 'pos')}")
            non_object_count += 1
        elif 'quat' in pname.lower():
            args.append(f"{pname}={example_vars.get('quat', 'quat')}")
            non_object_count += 1
        elif 'distance' in pname.lower():
            args.append(f"{pname}={example_vars.get('distance', '0.15')}")
            non_object_count += 1
        elif 'axis' in pname.lower():
            args.append(f"{pname}={example_vars.get('axis', default_axis)}")
            non_object_count += 1
        elif 'timeout' in pname.lower():
            args.append(f"{pname}={example_vars.get('timeout', '10.0')}")
            non_object_count += 1

    return f"{name}({', '.join(args)})"


# ============================================================================
# Guidance Generation (Auto from skill_substitutions.json)
# ============================================================================

def get_ee_offset_from_graph(graph: TripleGraph, robot_name: str) -> Optional[list]:
    """
    Get end-effector offset (down direction) from the ontology graph.

    Args:
        graph: The TripleGraph containing robot ontology
        robot_name: Name of the robot (e.g., 'panda', 'sawyer')

    Returns:
        List of [x, y, z] offset values, or None if not found
    """
    robot_uri = robot_id(robot_name)
    offsets = graph.objects(robot_uri, Predicates.HAS_EE_OFFSET_DOWN)

    if offsets:
        # Parse the string representation "[x, y, z]" to list
        offset_str = list(offsets)[0]
        try:
            return json.loads(offset_str)
        except json.JSONDecodeError:
            return None
    return None


def compute_gripper_offset_adjustment(
    graph: TripleGraph,
    source_robot: str,
    target_robot: str
) -> Optional[dict]:
    """
    Compute the gripper offset adjustment needed when transferring skills
    from source robot to target robot.

    Args:
        graph: The TripleGraph containing robot ontology
        source_robot: Source robot name (e.g., 'panda')
        target_robot: Target robot name (e.g., 'sawyer')

    Returns:
        Dict with offset adjustment info, or None if offsets not available
    """
    source_offset = get_ee_offset_from_graph(graph, source_robot)
    target_offset = get_ee_offset_from_graph(graph, target_robot)

    if source_offset is None or target_offset is None:
        return None

    # Calculate axis differences (gripper offset differences)
    x_diff = round(target_offset[0] - source_offset[0], 5)
    y_diff = round(target_offset[1] - source_offset[1], 5)
    z_diff = round(target_offset[2] - source_offset[2], 5)

    # Check if any axis has significant difference (>= 1mm)
    has_significant_diff = (
        abs(x_diff) >= 0.001 or
        abs(y_diff) >= 0.001 or
        abs(z_diff) >= 0.001
    )

    if not has_significant_diff:
        return None

    # Generate human-readable note for each significant axis
    notes = []
    if abs(x_diff) >= 0.001:
        direction = "forward" if x_diff > 0 else "backward"
        notes.append(f"X-axis: {direction} by {abs(x_diff)*100:.1f}cm")
    if abs(y_diff) >= 0.001:
        direction = "left" if y_diff > 0 else "right"
        notes.append(f"Y-axis: {direction} by {abs(y_diff)*100:.1f}cm")
    if abs(z_diff) >= 0.001:
        direction = "up" if z_diff > 0 else "down"
        notes.append(f"Z-axis: {direction} by {abs(z_diff)*100:.1f}cm")

    note = f"Gripper offset adjustment needed ({source_robot} -> {target_robot}): " + ", ".join(notes)

    return {
        "source_robot": source_robot,
        "target_robot": target_robot,
        "source_ee_offset": source_offset,
        "target_ee_offset": target_offset,
        "x_adjustment": x_diff,
        "y_adjustment": y_diff,
        "z_adjustment": z_diff,
        "note": note
    }


def get_ee_type_from_graph(graph: TripleGraph, robot_name: str) -> Optional[str]:
    """
    Get end-effector type from the ontology graph.

    Args:
        graph: The TripleGraph containing robot ontology
        robot_name: Name of the robot

    Returns:
        EE type string (e.g., 'gripper', 'robotiq85', 'suction'), or None if not found
    """
    robot_uri = robot_id(robot_name)
    ee_types = graph.objects(robot_uri, Predicates.HAS_EE_TYPE)

    if ee_types:
        return list(ee_types)[0]
    return None


def check_primitive_match(name_a: str, name_b: str) -> bool:
    """
    Check if two skill names represent the same primitive.

    Args:
        name_a: Source skill name
        name_b: Target skill name

    Returns:
        True if primitives match (same name), False otherwise
    """
    return name_a == name_b


def create_primitive_match_warning(
    skill_name: str,
    source_robot: str,
    target_robot: str,
    source_ee_type: Optional[str],
    target_ee_type: Optional[str],
    offset_adjustment: Optional[dict]
) -> Optional[dict]:
    """
    Create a warning entry for primitive match cases where robot/gripper characteristics differ.

    Args:
        skill_name: Name of the matched primitive
        source_robot: Source robot name
        target_robot: Target robot name
        source_ee_type: Source robot's end-effector type
        target_ee_type: Target robot's end-effector type
        offset_adjustment: Gripper offset adjustment info

    Returns:
        Warning dict if characteristics differ, None otherwise
    """
    warnings = []

    # Check EE type difference
    if source_ee_type and target_ee_type and source_ee_type != target_ee_type:
        warnings.append({
            "type": "ee_type_mismatch",
            "source_ee_type": source_ee_type,
            "target_ee_type": target_ee_type,
            "message": f"End-effector type differs: {source_ee_type} -> {target_ee_type}. "
                       f"Behavior may vary (e.g., depth handling, grasp mechanics)."
        })

    # Check gripper offset difference
    if offset_adjustment is not None:
        x_adj = offset_adjustment.get('x_adjustment', 0)
        y_adj = offset_adjustment.get('y_adjustment', 0)
        z_adj = offset_adjustment.get('z_adjustment', 0)

        # Only warn if significant difference (>= 1cm)
        if abs(x_adj) >= 0.01 or abs(y_adj) >= 0.01 or abs(z_adj) >= 0.01:
            warnings.append({
                "type": "gripper_offset_difference",
                "source_ee_offset": offset_adjustment.get("source_ee_offset"),
                "target_ee_offset": offset_adjustment.get("target_ee_offset"),
                "adjustment": {"x": x_adj, "y": y_adj, "z": z_adj},
                "message": offset_adjustment.get("note", "Gripper offset differs between robots.")
            })

    if not warnings:
        return None

    return {
        "skill_name": skill_name,
        "source_robot": source_robot,
        "target_robot": target_robot,
        "primitive_match": True,
        "warnings": warnings
    }


def generate_guidance_from_substitutions(
    skill_substitutions: dict,
    all_skills: dict,
    output_dir: Path,
    score_threshold: float = EQUIVALENCE_SCORE_THRESHOLD
) -> dict:
    """
    Automatically generate structured infilling guidance from skill_substitutions.json.

    Args:
        skill_substitutions: The skill_substitutions.json content
        all_skills: Dict of {robot_name: {skill_name: skill_def}}
        output_dir: Where to save guidance files
        score_threshold: Minimum score to consider a skill equivalence

    Returns:
        Dict containing generated guidance for each direction
    """
    print(f"\n{'='*60}")
    print("Generating Structured Infilling Guidance (Auto)")
    print(f"{'='*60}")

    # Load graph from output_dir for ee_offset queries
    graph = None
    graph_path = output_dir / "graph.json"
    if graph_path.exists():
        graph = TripleGraph.load(str(graph_path))

    equivalences = skill_substitutions.get('equivalences', [])

    # Filter by score threshold
    valid_equivs = [e for e in equivalences if e.get('score', 0) >= score_threshold]
    print(f"  Found {len(equivalences)} equivalences, {len(valid_equivs)} above threshold {score_threshold}")

    # Group by source robot
    # Format: "robot:skill_name"
    guidance_by_direction = {}

    # Track primitive matches and mismatches
    primitive_match_count = 0
    primitive_mismatch_count = 0

    for equiv in valid_equivs:
        skill_a = equiv['skill_a']  # e.g., "panda:pick"
        skill_b = equiv['skill_b']  # e.g., "ur5:ur5_grasp_at"
        score = equiv['score']

        robot_a, name_a = skill_a.split(':', 1)
        robot_b, name_b = skill_b.split(':', 1)

        # Direction: robot_a -> robot_b
        direction_key = f"{robot_a}_to_{robot_b}"
        if direction_key not in guidance_by_direction:
            # Compute gripper offset adjustment for this robot pair
            offset_adjustment = None
            source_ee_type = None
            target_ee_type = None
            if graph is not None:
                offset_adjustment = compute_gripper_offset_adjustment(graph, robot_a, robot_b)
                source_ee_type = get_ee_type_from_graph(graph, robot_a)
                target_ee_type = get_ee_type_from_graph(graph, robot_b)

            guidance_by_direction[direction_key] = {
                "source_robot": robot_a,
                "target_robot": robot_b,
                "source_ee_type": source_ee_type,
                "target_ee_type": target_ee_type,
                "gripper_offset_adjustment": offset_adjustment,
                "skill_mappings": [],
                "warnings": []  # For primitive matches with characteristic differences
            }

        # Check if primitives match (same skill name)
        if check_primitive_match(name_a, name_b):
            primitive_match_count += 1

            # Check if there are robot/gripper characteristic differences that need warning
            offset_adjustment = guidance_by_direction[direction_key].get("gripper_offset_adjustment")
            source_ee_type = guidance_by_direction[direction_key].get("source_ee_type")
            target_ee_type = guidance_by_direction[direction_key].get("target_ee_type")

            warning_entry = create_primitive_match_warning(
                skill_name=name_a,
                source_robot=robot_a,
                target_robot=robot_b,
                source_ee_type=source_ee_type,
                target_ee_type=target_ee_type,
                offset_adjustment=offset_adjustment
            )

            if warning_entry:
                # Check if warning already exists for this skill
                existing_warning = next(
                    (w for w in guidance_by_direction[direction_key]["warnings"]
                     if w["skill_name"] == name_a),
                    None
                )
                if not existing_warning:
                    guidance_by_direction[direction_key]["warnings"].append(warning_entry)

            # Skip guidance generation for primitive matches
            continue

        # Primitive mismatch - generate guidance
        primitive_mismatch_count += 1

        # Get skill definitions
        skill_a_def = all_skills.get(robot_a, {}).get(name_a, {})
        skill_b_def = all_skills.get(robot_b, {}).get(name_b, {})

        if not skill_a_def or not skill_b_def:
            print(f"  Warning: Missing skill definition for {skill_a} or {skill_b}")
            continue

        # Infer parameter mapping (now returns tuple with risk_flags)
        param_mappings, risk_flags = infer_parameter_mapping(
            skill_a_def.get('parameters', []),
            skill_b_def.get('parameters', [])
        )

        # Get offset adjustment for this robot pair
        offset_adjustment = guidance_by_direction[direction_key].get("gripper_offset_adjustment")

        # Generate guidance entry with quality grade
        guidance_entry = create_guidance_entry(
            source_skill=skill_a_def,
            target_skill=skill_b_def,
            source_robot=robot_a,
            target_robot=robot_b,
            param_mappings=param_mappings,
            risk_flags=risk_flags,
            equiv_score=score,
            offset_adjustment=offset_adjustment
        )

        # Check if skill already has a mapping (keep highest score)
        existing = next(
            (m for m in guidance_by_direction[direction_key]["skill_mappings"]
             if m["skill_name"] == name_a),
            None
        )

        if existing:
            # Keep the one with higher score
            if score > existing.get("_score", 0):
                guidance_by_direction[direction_key]["skill_mappings"].remove(existing)
                guidance_entry["_score"] = score
                guidance_by_direction[direction_key]["skill_mappings"].append(guidance_entry)
        else:
            guidance_entry["_score"] = score
            guidance_by_direction[direction_key]["skill_mappings"].append(guidance_entry)

    print(f"  Primitive matches (skipped): {primitive_match_count}")
    print(f"  Primitive mismatches (guidance generated): {primitive_mismatch_count}")

    # Clean up internal score field and save
    for direction_key, guidance in guidance_by_direction.items():
        for mapping in guidance["skill_mappings"]:
            mapping.pop("_score", None)

        # Remove empty warnings list if no warnings
        if not guidance["warnings"]:
            del guidance["warnings"]

        # Save to file
        filename = f"guidance_{direction_key}.json"
        filepath = output_dir / filename
        with open(filepath, 'w') as f:
            json.dump(guidance, f, indent=2)

        warning_count = len(guidance.get("warnings", []))
        print(f"  Saved: {filename} ({len(guidance['skill_mappings'])} skill mappings, {warning_count} warnings)")

    return guidance_by_direction


def compute_quality_grade(equiv_score: float, param_mappings: list, risk_flags: list) -> dict:
    """
    Compute quality grade for the guidance based on multiple factors.

    Returns:
        dict with:
        - grade: 'A', 'B', 'C', 'D', 'F'
        - usable: bool (can be used directly without manual review)
        - confidence_breakdown: dict of individual scores
        - risk_summary: list of risk descriptions
    """
    # Calculate average parameter mapping confidence
    if param_mappings:
        avg_param_conf = sum(m.get('confidence', 0) for m in param_mappings) / len(param_mappings)
    else:
        avg_param_conf = 0.0

    # Count critical and warning risks
    critical_risks = [r for r in risk_flags if r.get('type') == 'semantic_mismatch']
    warning_risks = [r for r in risk_flags if r.get('type') == 'low_confidence']

    # Calculate risk penalties
    critical_penalty = len(critical_risks) * 0.2  # Semantic mismatch: -0.2 each
    warning_penalty = len(warning_risks) * 0.1    # Low confidence: -0.1 each

    # Calculate low-confidence mapping ratio (for usable_directly check)
    low_conf_ratio = len(warning_risks) / len(param_mappings) if param_mappings else 0.0

    # Compute overall score (now includes warning penalty)
    overall_score = (
        equiv_score * 0.4 +
        avg_param_conf * 0.4 +
        (1.0 - critical_penalty - warning_penalty) * 0.2
    )
    overall_score = max(0, min(1, overall_score))

    # Determine grade with warning_risks consideration
    if overall_score >= 0.9 and len(critical_risks) == 0 and len(warning_risks) == 0:
        grade = 'A'
        usable = True
    elif overall_score >= 0.8 and len(critical_risks) == 0 and len(warning_risks) <= 1:
        grade = 'B'
        usable = True
    elif overall_score >= 0.7:
        grade = 'C'
        # Usable only if no critical risks AND low-confidence ratio < 50%
        usable = len(critical_risks) == 0 and low_conf_ratio < 0.5
    elif overall_score >= 0.5:
        grade = 'D'
        usable = False
    else:
        grade = 'F'
        usable = False

    return {
        'grade': grade,
        'overall_score': round(overall_score, 3),
        'usable_directly': usable,
        'confidence_breakdown': {
            'skill_equivalence': round(equiv_score, 3),
            'param_mapping_avg': round(avg_param_conf, 3),
            'critical_risk_penalty': round(critical_penalty, 3),
            'warning_risk_penalty': round(warning_penalty, 3),
            'low_confidence_ratio': round(low_conf_ratio, 3)
        },
        'risk_summary': [r.get('message', '') for r in risk_flags]
    }


def create_guidance_entry(
    source_skill: dict,
    target_skill: dict,
    source_robot: str,
    target_robot: str,
    param_mappings: list,
    risk_flags: list,
    equiv_score: float,
    offset_adjustment: Optional[dict] = None
) -> dict:
    """Create a single guidance entry for skill transformation with quality grade."""

    source_name = source_skill['name']
    target_name = target_skill['name']
    source_params = source_skill.get('parameters', [])

    # Add offset adjustment to risk_flags if present and skill has position-related parameters
    if offset_adjustment is not None:
        x_adj = offset_adjustment.get('x_adjustment', 0)
        y_adj = offset_adjustment.get('y_adjustment', 0)
        z_adj = offset_adjustment.get('z_adjustment', 0)

        # Only add if any axis has significant difference (>= 1cm)
        has_significant_offset = (
            abs(x_adj) >= 0.01 or
            abs(y_adj) >= 0.01 or
            abs(z_adj) >= 0.01
        )

        if has_significant_offset:
            # Check if any parameter mapping involves position semantics
            position_semantics = {'position', 'target_position', 'grasp_position', 'place_position'}
            has_position_param = any(
                m.get('breakdown', {}).get('source_semantic') in position_semantics or
                m.get('breakdown', {}).get('target_semantic') in position_semantics
                for m in param_mappings
            )

            if has_position_param:
                risk_flags = risk_flags.copy()  # Don't modify original
                risk_flags.append({
                    'type': 'gripper_offset_adjustment',
                    'source_robot': offset_adjustment.get('source_robot'),
                    'target_robot': offset_adjustment.get('target_robot'),
                    'source_ee_offset': offset_adjustment.get('source_ee_offset'),
                    'target_ee_offset': offset_adjustment.get('target_ee_offset'),
                    'x_adjustment': x_adj,
                    'y_adjustment': y_adj,
                    'z_adjustment': z_adj,
                    'message': offset_adjustment.get('note', "Gripper offset adjustment needed")
                })

    # Compute quality grade
    quality_grade = compute_quality_grade(equiv_score, param_mappings, risk_flags)

    # Build keywords_required from source params
    keywords_required = [p['name'] for p in source_params[:4]]

    # Generate full content with function signature and mapping
    target_signature = generate_function_signature(target_skill)
    param_mapping_text = generate_param_mapping_text(param_mappings)

    full_content = f"""Replace the `{source_name}(env, task, ...)` call with a `{target_name}(...)` call using the following interface:

```python
{target_signature}
```

{param_mapping_text}
"""

    # Generate interface example
    interface_example = generate_interface_example(target_skill, param_mappings)

    return {
        "skill_name": source_name,
        "guidance": [
            {
                "line_start": "",
                "line_end": "",
                "match": {
                    "node": "call",
                    "func": {"type": "Name", "id": source_name},
                    "keywords_required": keywords_required
                },
                "type": "capabilities",
                "content": f"Replace the `{source_name}(env, task, ...)` call with a `{target_name}(...)` call.",
                "full_content": full_content,
                "interface": interface_example,
                "equivalence_score": equiv_score,
                "parameter_mappings": param_mappings,
                "quality_grade": quality_grade
            }
        ]
    }


# ============================================================================
# Single Robot Ontology Generation
# ============================================================================

def generate_single_robot_ontology(robot_name: str, config: dict, output_dir: Path, llm=None):
    """Generate ontology for a single robot."""
    print(f"\n{'='*60}")
    print(f"Generating ontology for {robot_name}")
    print(f"{'='*60}")

    output_dir.mkdir(exist_ok=True)
    graph = TripleGraph()

    urdf_path = str(config['urdf'])
    srdf_path = str(config['srdf'])

    if not Path(urdf_path).exists():
        print(f"  Warning: URDF not found: {urdf_path}")
        return None
    if not Path(srdf_path).exists():
        print(f"  Warning: SRDF not found: {srdf_path}")
        return None

    summary, robot_graph = parse_robot(
        robot_name,
        urdf_path,
        srdf_path,
        output_dir=str(output_dir)
    )
    graph.merge(robot_graph)

    print(f"  URDF: {summary['urdf']['joint_count']} joints, {summary['urdf']['link_count']} links")
    print(f"  SRDF: {len(summary['srdf']['groups'])} groups")
    print(f"  Joint mapping: {len(summary['joint_name_mapping'])} matched")

    skills = []
    if config['skills'].exists():
        skills = load_skills(config['skills'])
        add_skills_to_graph(graph, robot_name, skills)
        print(f"  Loaded {len(skills)} skills")

    caps = infer_capabilities(
        graph,
        robot_id(robot_name),
        summary,
        skills,
        llm=llm,
        output_dir=str(output_dir)
    )
    print(f"  Capabilities: {', '.join(caps['capabilities_final'])}")

    graph.save(str(output_dir / "graph.json"))
    graph.export_ttl_like(str(output_dir / "graph.ttl"))

    # Generate report
    report_content = f"""# {robot_name.upper()} Robot Ontology Report

## Robot Summary
- **Robot**: {robot_name}
- **URDF Joints**: {summary['urdf']['joint_count']}
- **URDF Links**: {summary['urdf']['link_count']}
- **SRDF Groups**: {len(summary['srdf']['groups'])}
- **Matched Joints**: {len(summary['joint_name_mapping'])}

## Capabilities
{chr(10).join(['- ' + c for c in caps['capabilities_final']])}

## Skills ({len(skills)} total)
{chr(10).join(['- ' + s['name'] + ': ' + s.get('description', '') for s in skills])}

## Joint Mapping
| SRDF Joint | URDF Joint | Confidence |
|------------|------------|------------|
"""
    for srdf_j, urdf_j in summary['joint_name_mapping'].items():
        report_content += f"| {srdf_j} | {urdf_j} | 1.0 |\n"

    with open(output_dir / "report.md", 'w') as f:
        f.write(report_content)

    return {
        'robot': robot_name,
        'summary': summary,
        'skills': skills,
        'capabilities': caps,
        'graph': graph
    }


# ============================================================================
# Cross-Robot Ontology Generation
# ============================================================================

def generate_cross_robot_ontology(robot_results: dict, output_dir: Path, llm=None):
    """Generate cross-robot aligned ontology."""
    print(f"\n{'='*60}")
    print("Generating cross-robot aligned ontology")
    print(f"{'='*60}")

    output_dir.mkdir(exist_ok=True)

    merged_graph = TripleGraph()
    for robot_name, result in robot_results.items():
        if result and 'graph' in result:
            merged_graph.merge(result['graph'])

    scene_path = BASE_DIR / "data" / "scene.json"
    scene = {"objects": [], "relations": []}
    if scene_path.exists():
        scene = load_scene(scene_path)
        add_scene_to_graph(merged_graph, scene)
        print(f"  Loaded scene: {scene.get('scene_id', 'unknown')}")

    # Infer skill substitutions
    skill_subs = {"equivalences": [], "decompositions": [], "summary": {}}
    robot_names = list(robot_results.keys())

    if len(robot_names) >= 2:
        robot_a, robot_b = robot_names[0], robot_names[1]
        skills_a = robot_results[robot_a]['skills']
        skills_b = robot_results[robot_b]['skills']

        skill_subs = infer_skill_substitutions(
            merged_graph,
            robot_a,
            robot_b,
            skills_a,
            skills_b,
            llm=llm,
            output_dir=str(output_dir)
        )
        print(f"  Equivalences found: {skill_subs['summary']['total_equivalences']}")
        print(f"  Decompositions found: {skill_subs['summary']['total_decompositions']}")

    obj_mappings = infer_object_mappings(
        merged_graph,
        scene,
        llm=llm,
        output_dir=str(output_dir)
    )
    print(f"  Objects analyzed: {obj_mappings['summary']['total_objects']}")

    merged_graph.save(str(output_dir / "graph.json"))
    merged_graph.export_ttl_like(str(output_dir / "graph.ttl"))

    all_caps = {}
    for robot_name, result in robot_results.items():
        if result and 'capabilities' in result:
            all_caps[robot_name] = result['capabilities']

    with open(output_dir / "all_capabilities.json", 'w') as f:
        json.dump(all_caps, f, indent=2)

    # Generate combined report
    robot_list = list(robot_results.keys())
    report_content = f"""# {' + '.join([r.upper() for r in robot_list])} Cross-Robot Ontology Report

## Overview
This report contains the aligned ontology results for {', '.join([r.upper() for r in robot_list])} robots.

"""
    for robot_name, result in robot_results.items():
        if result:
            summary = result['summary']
            caps = result['capabilities']
            skills = result['skills']
            report_content += f"""## {robot_name.upper()} Robot
- **URDF Joints**: {summary['urdf']['joint_count']}
- **URDF Links**: {summary['urdf']['link_count']}
- **Skills**: {len(skills)}
- **Capabilities**: {', '.join(caps['capabilities_final'])}

"""

    # Add skill substitution summary
    if skill_subs.get('equivalences'):
        report_content += """## Skill Equivalences (Auto-detected)

| Source Skill | Target Skill | Score |
|--------------|--------------|-------|
"""
        for eq in skill_subs['equivalences']:
            report_content += f"| {eq['skill_a']} | {eq['skill_b']} | {eq['score']:.2f} |\n"

    with open(output_dir / "report.md", 'w') as f:
        f.write(report_content)

    return merged_graph, skill_subs


# ============================================================================
# Main Pipeline
# ============================================================================

def generate_all_pairwise_skill_substitutions(robot_results: dict, merged_graph: TripleGraph, output_dir: Path, llm=None) -> dict:
    """
    Generate skill substitutions for all pairs of robots.

    Args:
        robot_results: Dict of {robot_name: result} from generate_single_robot_ontology
        merged_graph: The merged TripleGraph containing all robots (will be modified in-place with equivSkill/decompSkill)
        output_dir: Output directory
        llm: Optional LLM instance

    Returns:
        Dict with all skill substitutions combined
    """
    from itertools import combinations

    robot_names = list(robot_results.keys())
    all_equivalences = []
    all_decompositions = []

    # Generate for all pairs
    for robot_a, robot_b in combinations(robot_names, 2):
        print(f"\n  Processing pair: {robot_a} <-> {robot_b}")

        skills_a = robot_results[robot_a]['skills']
        skills_b = robot_results[robot_b]['skills']

        # Use the shared merged_graph so equivSkill/decompSkill triples are added to it
        pair_subs = infer_skill_substitutions(
            merged_graph,
            robot_a,
            robot_b,
            skills_a,
            skills_b,
            llm=llm,
            output_dir=str(output_dir)
        )

        all_equivalences.extend(pair_subs.get('equivalences', []))
        all_decompositions.extend(pair_subs.get('decompositions', []))

        print(f"    Equivalences: {len(pair_subs.get('equivalences', []))}")
        print(f"    Decompositions: {len(pair_subs.get('decompositions', []))}")

    # Combine all results
    combined_subs = {
        'equivalences': all_equivalences,
        'decompositions': all_decompositions,
        'summary': {
            'total_equivalences': len(all_equivalences),
            'total_decompositions': len(all_decompositions),
            'robot_pairs': len(list(combinations(robot_names, 2)))
        }
    }

    # Save combined substitutions
    with open(output_dir / "skill_substitutions.json", 'w') as f:
        json.dump(combined_subs, f, indent=2)

    return combined_subs


def main():
    parser = argparse.ArgumentParser(
        description="Robot Ontology Generation Pipeline"
    )
    parser.add_argument(
        '--use_llm',
        action='store_true',
        help='Enable LLM for enhanced reasoning'
    )
    parser.add_argument(
        '--model',
        type=str,
        default='',
        help='HuggingFace model name or path (e.g., "Qwen/Qwen2.5-Coder-7B"). If provided, LLM will be used automatically.'
    )
    parser.add_argument(
        '--score_threshold',
        type=float,
        default=EQUIVALENCE_SCORE_THRESHOLD,
        help=f'Minimum score for skill equivalence (default: {EQUIVALENCE_SCORE_THRESHOLD})'
    )
    parser.add_argument(
        '--robots',
        type=str,
        default='',
        help='Comma-separated list of robots to include (e.g., "ur5,sawyer,panda"). If empty, all robots are used.'
    )
    parser.add_argument(
        '--robot-type',
        type=str,
        choices=['rlbench', 'genesis', 'both'],
        default='rlbench',
        help='Robot type to generate ontology for: rlbench, genesis, or both (default: rlbench)'
    )
    parser.add_argument(
        '--verbose',
        action='store_true',
        help='Print detailed progress information'
    )

    args = parser.parse_args()

    # If --model is provided, automatically enable LLM
    if args.model:
        args.use_llm = True

    # Select ROBOTS configuration based on --robot-type
    if args.robot_type == 'both':
        ROBOTS = {**ROBOTS_RLBENCH, **ROBOTS_GENESIS}
    elif args.robot_type == 'genesis':
        ROBOTS = ROBOTS_GENESIS
    else:  # rlbench
        ROBOTS = ROBOTS_RLBENCH

    # Filter robots if --robots argument provided
    if args.robots:
        selected_robots = [r.strip() for r in args.robots.split(',')]
        # Validate robot names
        for r in selected_robots:
            if r not in ROBOTS:
                print(f"Warning: Unknown robot '{r}', skipping")
        selected_robots = [r for r in selected_robots if r in ROBOTS]
    else:
        selected_robots = list(ROBOTS.keys())

    print("=" * 70)
    print("Robot Ontology Generation Pipeline (Multi-Robot)")
    print("=" * 70)
    print(f"\nRobots to process: {', '.join(selected_robots)}")
    print("\nPipeline steps:")
    print("  1. Generate individual ontology for each robot")
    print("  2. Generate cross-robot skill mappings for all pairs")
    print("  3. Auto-generate guidance from substitutions")
    print("=" * 70)

    # Initialize LLM
    llm = None
    if args.use_llm:
        print(f"\nLoading LLM: {args.model}")
        try:
            llm = create_llm(args.model, fallback_to_dummy=True)
            if isinstance(llm, DummyLLM):
                print("  -> Fell back to DummyLLM (model load failed or not available)")
            else:
                print("  -> LLM loaded successfully")
        except Exception as e:
            print(f"  -> Failed to load LLM: {e}")
            llm = DummyLLM()
    else:
        print("\nRunning without LLM (deterministic only)")

    # Step 1: Generate individual ontology for each robot
    print("\n" + "=" * 70)
    print("STEP 1: Generating individual ontologies for all robots")
    print("=" * 70)

    robot_results = {}
    temp_dirs = []

    for robot_name in selected_robots:
        config = ROBOTS[robot_name]

        # Check if config files exist
        if not config['urdf'].exists():
            print(f"\n  Warning: Skipping {robot_name} - URDF not found: {config['urdf']}")
            continue
        if not config['srdf'].exists():
            print(f"\n  Warning: Skipping {robot_name} - SRDF not found: {config['srdf']}")
            continue
        if not config['skills'].exists():
            print(f"\n  Warning: Skipping {robot_name} - Skills file not found: {config['skills']}")
            continue

        # Use individual output directory for each robot
        output_dir = BASE_DIR / f"output_{robot_name}"
        temp_dirs.append(output_dir)

        print(f"\n  Processing {robot_name}...")
        result = generate_single_robot_ontology(
            robot_name,
            config,
            output_dir,
            llm=llm
        )

        if result:
            robot_results[robot_name] = result

    print(f"\n  Successfully processed: {list(robot_results.keys())}")

    # Step 2: Generate cross-robot aligned ontology
    print("\n" + "=" * 70)
    print("STEP 2: Generating cross-robot skill mappings for all pairs")
    print("=" * 70)

    output_mapping_dir = BASE_DIR / "output_mapping"
    output_mapping_dir.mkdir(exist_ok=True)

    skill_subs = {}

    if len(robot_results) >= 2:
        # Merge all graphs
        merged_graph = TripleGraph()
        for robot_name, result in robot_results.items():
            if result and 'graph' in result:
                merged_graph.merge(result['graph'])

        # Add scene if exists
        scene_path = BASE_DIR / "data" / "scene.json"
        scene = {"objects": [], "relations": []}
        if scene_path.exists():
            scene = load_scene(scene_path)
            add_scene_to_graph(merged_graph, scene)
            print(f"  Loaded scene: {scene.get('scene_id', 'unknown')}")

        # Generate pairwise skill substitutions (this also adds equivSkill/decompSkill to merged_graph)
        skill_subs = generate_all_pairwise_skill_substitutions(
            robot_results, merged_graph, output_mapping_dir, llm=llm
        )

        print(f"\n  Total equivalences found: {skill_subs['summary']['total_equivalences']}")
        print(f"  Total decompositions found: {skill_subs['summary']['total_decompositions']}")

        # Save merged graph
        merged_graph.save(str(output_mapping_dir / "graph.json"))
        merged_graph.export_ttl_like(str(output_mapping_dir / "graph.ttl"))

        # Save all capabilities
        all_caps = {}
        for robot_name, result in robot_results.items():
            if result and 'capabilities' in result:
                all_caps[robot_name] = result['capabilities']

        with open(output_mapping_dir / "all_capabilities.json", 'w') as f:
            json.dump(all_caps, f, indent=2)

        # Copy joint mappings from individual outputs
        import shutil
        for robot_name in robot_results.keys():
            src = BASE_DIR / f"output_{robot_name}" / f"joint_mapping_{robot_name}.json"
            if src.exists():
                shutil.copy(src, output_mapping_dir / f"joint_mapping_{robot_name}.json")

        # Generate combined report
        report_content = f"""# Multi-Robot Cross-Robot Ontology Report

## Overview
This report contains the aligned ontology results for {len(robot_results)} robots: {', '.join([r.upper() for r in robot_results.keys()])}.

"""
        for robot_name, result in robot_results.items():
            if result:
                summary = result['summary']
                caps = result['capabilities']
                skills = result['skills']
                report_content += f"""## {robot_name.upper()} Robot
- **URDF Joints**: {summary['urdf']['joint_count']}
- **URDF Links**: {summary['urdf']['link_count']}
- **Skills**: {len(skills)}
- **Capabilities**: {', '.join(caps['capabilities_final'])}

"""

        # Add skill substitution summary
        if skill_subs.get('equivalences'):
            report_content += """## Skill Equivalences (Auto-detected)

| Source Skill | Target Skill | Score |
|--------------|--------------|-------|
"""
            for eq in skill_subs['equivalences']:
                report_content += f"| {eq['skill_a']} | {eq['skill_b']} | {eq['score']:.2f} |\n"

        with open(output_mapping_dir / "report.md", 'w') as f:
            f.write(report_content)

    else:
        print("  Warning: Need at least 2 robots for cross-robot alignment")

    # Step 3: Auto-generate guidance from skill_substitutions
    print("\n" + "=" * 70)
    print("STEP 3: Auto-generating Guidance from skill_substitutions")
    print("=" * 70)

    if skill_subs and skill_subs.get('equivalences'):
        # Build all_skills dict
        all_skills = {}
        for robot_name, result in robot_results.items():
            skills_list = result.get('skills', [])
            all_skills[robot_name] = {s['name']: s for s in skills_list}

        generate_guidance_from_substitutions(
            skill_subs,
            all_skills,
            output_mapping_dir,
            score_threshold=args.score_threshold
        )
    else:
        print("  Skipped: No skill substitutions available")

    # Cleanup temporary folders (keep output_mapping as main output)
    import shutil
    for temp_dir in temp_dirs:
        if temp_dir.exists() and temp_dir.name != "output_mapping":
            # Keep individual robot outputs for reference
            pass

    # Summary
    print("\n" + "=" * 70)
    print("GENERATION COMPLETE")
    print("=" * 70)
    print("\nGenerated outputs:")

    for robot_name in robot_results.keys():
        output_dir = BASE_DIR / f"output_{robot_name}"
        print(f"\n  output_{robot_name}/: {robot_name.upper()} standalone ontology")
        if output_dir.exists():
            for f in sorted(output_dir.glob("*")):
                print(f"    - {f.name}")

    print(f"\n  output_mapping/: Cross-robot aligned ontology + Auto-generated guidance")
    if output_mapping_dir.exists():
        for f in sorted(output_mapping_dir.glob("*")):
            print(f"    - {f.name}")

    print("\nDone!")
    return 0


if __name__ == "__main__":
    sys.exit(main())
