import random
import json
import os
from typing import Dict, List, Any, Tuple
import re

class PolicyGenerator:
    def __init__(self, structure_complexity=1, args_num=5):
        self.task_types = 3
        self.layers = 3
        self.attribute_dict = [
            {  # Layer 1
                "1": "condition",
                "2": "condition", 
                "3": "reference_1",
                "4": "reference_2",
                "5": "lookup"
            },
            {  # Layer 2
                "1": "condition",
                "2": "condition", 
                "3": "condition",
                "4": "reference_2",
                "5": "reference_3",
                "6": "lookup"
            },
            {  # Layer 3
                "1": "condition",
                "2": "condition", 
                "3": "condition", 
                "4": "reference_3",
                "5": "lookup"
            }
        ]
        self.num_global_attributes = 3
        self.task_requirements = {}  # Store task layer requirements
        self.task_operations = {}  # Store executable operations for each task
        self.structure_complexity = structure_complexity
        self.args_num = args_num
        
    def generate_global_attributes(self) -> Dict[str, int]:
        """Generate random global attribute values between 0-100"""
        global_attrs = {}
        for i in range(1, self.num_global_attributes + 1):
            global_attrs[f"Global_Attribute_Value{i}"] = random.randint(0, 100)
        return global_attrs
    
    def generate_general_instructions(self, global_attrs: Dict[str, int]) -> Tuple[List[str], int]:
        """Generate the general instructions section and return the policy ID"""
        global_attr_str = ", ".join([f"{k} = {v}" for k, v in global_attrs.items()])
        
        # Generate task types dynamically based on self.task_types with highlights
        task_types_list = ", ".join([f"**Task_Type_{i}**" for i in range(1, self.task_types + 1)])
        
        # Generate unique policy ID
        policy_id = random.randint(1, 99999)
        
        instructions = [
            f"# Agent Policy Document #P{policy_id:05d}",
            "",
            "## General Instructions",
            f"The global attribute is currently: {global_attr_str}",
            "You are a helpful agent that can get access to profiles and attributes at different layers and indexes.",
            f"You can help users finish {task_types_list}."
        ]
        
        return instructions, policy_id
    
    def generate_domain_basic(self) -> List[str]:
        """Generate the domain basic structure explanation"""
        basic_structure = [
            "",
            "## Domain Basic",
            "### Profile Structure",
            "The jth profile instance at profile layer i has its primary key as profile_i_j",
            f"There are {self.layers} layers of profiles, and each profile layer has a number of profile instances. All the profile instances at the same layer have the same attributes."
        ]
        
        # Add profile attribute descriptions for each layer with their specific structures
        for layer in range(1, self.layers + 1):
            layer_dict = self.attribute_dict[layer - 1]
            layer_attrs = ", ".join([f"Profile_{layer}_Attribute_{j}" for j in layer_dict.keys()])
            basic_structure.append("")  # Add line break before each profile description
            basic_structure.append(f"**- Each profile at layer {layer} indexed j Profile_{layer}_j has attributes:** {layer_attrs}")
        
        basic_structure.append("")
        basic_structure.append("### Attribute Definitions")
        basic_structure.append("The jth attribute at layer i is denoted as profile_attribute_i_j.") # Add line break after attribute definition
        
        # Add layer-specific descriptions based on each layer's attribute types
        for layer in range(1, self.layers + 1):
            layer_dict = self.attribute_dict[layer - 1]
            
            # Group attributes by type for this specific layer
            condition_attrs = [f"attribute_{k}" for k, v in layer_dict.items() if v == "condition"]
            lookup_attrs = [f"attribute_{k}" for k, v in layer_dict.items() if v == "lookup"]
            
            # Group reference attributes by target layer
            reference_by_layer = {}
            for attr_num, attr_type in layer_dict.items():
                if attr_type.startswith("reference_"):
                    target_layer = attr_type.split("_")[1]
                    if target_layer not in reference_by_layer:
                        reference_by_layer[target_layer] = []
                    reference_by_layer[target_layer].append(f"attribute_{attr_num}")
            
            if condition_attrs or reference_by_layer or lookup_attrs:
                basic_structure.append("") 
                basic_structure.append(f"**At layer {layer}:**")
                
                if condition_attrs:
                    condition_str = " and ".join(condition_attrs)
                    basic_structure.append(f"  - The {condition_str} can serve as conditions")
                
                # Handle reference attributes grouped by target layer
                for target_layer, ref_attrs in reference_by_layer.items():
                    ref_str = " and ".join(ref_attrs)
                    basic_structure.append(f"  - The {ref_str} contain the primary keys to access profiles at layer {target_layer}")
                
                if lookup_attrs:
                    lookup_str = " and ".join(lookup_attrs)
                    basic_structure.append(f"  - The {lookup_str} can be used as an alternative way to access the profiles while searching.")
        
        # Add profile access explanation (removed adjacent instances definition)
        basic_structure.append("")
        basic_structure.append("### Profile Access Pattern")
        basic_structure.append("When the user specifies a profile_k_id, you should understand that this means the user wants to access the profile_k instance with the primary key's index being the given value. When the user specifies a profile_k_info, you should understand that this means the user wants to access the profile_k instance with the lookup attribute value of the provided string.")
        basic_structure.append("When referring to a user's profile_k, you should use the layer k-1 profile's reference attribute to get access to the primary keys of profile_k instances.")
        basic_structure.append("")
        basic_structure.append("**Relative Profile Access:**")
        basic_structure.append("When the user specifies getting a 'relative profile' or 'related profile', this means accessing other profile instances at the same layer as the current profile. To accomplish this, you should use the reference attributes from the current profile instance to find the primary keys of the target profile instances at the same layer. For example, if you are currently accessing a profile at layer 2, and the user asks for a relative profile, you should use the reference attributes in the current layer 2 profile to identify and access other layer 2 profile instances.")
        
        return basic_structure
    
    def generate_tool_calling_instructions(self) -> List[str]:
        """Generate tool calling instructions"""
        return [
            "",
            "## Tool Calling Instructions",
            "### General Rules",
            "- You should only make one tool call at a time, and if you make a tool call, you should not respond to the user simultaneously.",
            "- If you respond to the user, you should not make a tool call at the same time.",
            "- You should only call the tool Tool_Conflict when the request is not able to be handled within the policy and the user specifications.",
            "",
            "### Available Tools",
            "",
            "#### Profile Access Tools",
            "- **Get_Profile_Layer_k**: Use this tool to directly access a specific profile instance by its primary key.",
            "  - **Parameter**: `index_value` (string) - The full primary key of the profile instance (e.g., \"profile_1_5\", \"profile_2_10\", \"profile_3_1\")",
            "  - **When to use**: ",
            "    - When users specify a profile_id, such as \"my profile_id is profile_1_5\" or \"using profile_2_3\"",
            "    - When you obtain a reference attribute value from another profile instance that contains the primary key to access a different layer",
            "  - **Example call**: Get_Profile_Layer_1(index_value=\"profile_1_5\")",
            "",
            "- **Search_Profile_Layer_k**: Use this tool to find profile instances by their lookup attribute value.",
            "  - **Parameter**: `key_value` (string) - The lookup attribute value to search for",
            "  - **When to use**: When users specify a profile_info, such as \"my profile_info is 'engineering'\" or \"find profiles with lookup value 'sales'\"",
            "  - **Example call**: Search_Profile_Layer_1(key_value=\"engineering\")",
            "",
            "#### Task Completion Tools", 
            "- **finish_task_k**: Use this tool to complete Task_Type_k with the computed arguments.",
            "  - **Parameter**: `attributes` (list) - A list of computed argument values in the order specified by the task requirements",
            "  - **When to use**: After accessing all required profile instances and computing the task arguments according to task specifications",
            "  - **Example call**: finish_task_1(attributes=[25, 150, 42])",
            "",
            "#### Conflict Resolution Tool",
            "- **Tool_Conflict**: Use this tool when the user request cannot be handled within the policy constraints.",
            "  - **Parameters**: None",
            "  - **When to use**: If the user request violates policy or cannot be fulfilled with available tools and data",
            "  - **Example call**: Tool_Conflict()",
            "",
            "### Tool Parameter Mapping Guidelines",
            "- **profile_id references**: When users mention \"my profile_id is profile_k_X\" or \"profile_k_X\", use the Get_Profile_Layer_k tool with index_value=\"profile_k_X\"",
            "- **reference attribute usage**: When you access a profile instance and obtain reference attributes (e.g., reference_1, reference_2, reference_3), use those primary key values with Get_Profile_Layer_k to access the referenced profiles at the target layers",
            "- **profile_info references**: When users mention \"my profile_info is Y\" or provide lookup values, use the Search_Profile_Layer_k tool with key_value=\"Y\"",
            "- **Task completion**: Always pass computed arguments as a list to finish_task_k tools, ensuring the order matches task specifications",
            "",
            "### Usage Guidelines",
            "The user will specify the instance index at the first layer, and the agent shall go through the profile instances at different indexes and layers to obtain the attributes needed for the task."
        ]
    
    def generate_task_specifications(self) -> List[str]:
        """Generate dynamic task type specifications based on attribute structure"""
        tasks = [
            "",
            "## Task Specifications"
        ]
        
        for task_num in range(1, self.task_types + 1):
            tasks.append("")
            tasks.append(f"### Task_Type_{task_num}")
            
            # Dynamically determine which layers this task will use
            involved_layers = self._select_task_layers(task_num)
            
            # Generate profile instance requirements
            profile_requirements = self._generate_profile_requirements(involved_layers)
            tasks.extend(profile_requirements)
            
            # Generate input specifications based on selected instances
            input_specs = self._generate_input_specifications(task_num, involved_layers)
            tasks.extend(input_specs)
            
            # Add completion requirements
            completion_reqs = self._generate_completion_requirements(task_num, involved_layers)
            tasks.extend(completion_reqs)
            
        return tasks
    
    def generate_task_specifications_with_variant(self, modified_task_num: int, original_task_operations: Dict[int, List[Dict[str, Any]]]) -> List[str]:
        """Generate task specifications where only one task is modified, others use original operations"""
        tasks = [
            "",
            "## Task Specifications"
        ]
        
        for task_num in range(1, self.task_types + 1):
            tasks.append("")
            tasks.append(f"### Task_Type_{task_num}")
            
            # Use existing layer requirements (no changes)
            involved_layers = self.task_requirements[task_num]
            
            # Generate profile instance requirements
            profile_requirements = self._generate_profile_requirements(involved_layers)
            tasks.extend(profile_requirements)
            
            # Generate input specifications 
            if task_num == modified_task_num:
                # Use the newly generated operations for the modified task
                input_specs = self._generate_input_specifications_from_operations(task_num, involved_layers, self.task_operations[task_num])
            else:
                # Use the original operations for unchanged tasks
                input_specs = self._generate_input_specifications_from_operations(task_num, involved_layers, original_task_operations[task_num])
            
            tasks.extend(input_specs)
            
            # Add completion requirements
            completion_reqs = self._generate_completion_requirements(task_num, involved_layers)
            tasks.extend(completion_reqs)
            
        return tasks
    
    def _generate_input_specifications_from_operations(self, task_num: int, involved_layers: List[int], operations: List[Dict[str, Any]]) -> List[str]:
        """Generate input specification text from stored operations"""
        specs = []
        specs.append(f"- The agent should pass the following arguments into the finish_task_{task_num} tool call:")
        
        for operation in operations:
            arg_num = operation["arg_num"]
            
            if operation["type"] == "ifelse":
                # Reconstruct if-else structure text
                branches = operation['branches']
                conditions = operation['conditions']
                
                # Generate the text for this if-else structure
                text = f"arg_{arg_num}: "
                for cond_idx in range(len(conditions)):
                    left_expr, right_expr = conditions[cond_idx]
                    branch_text = self._operation_to_text(branches[cond_idx])
                    if cond_idx == 0:
                        text += f"If {left_expr} > {right_expr}, then {branch_text} else "
                    else:
                        text += f"if {left_expr} > {right_expr}, then {branch_text} else "
                
                # Add final branch
                final_branch_text = self._operation_to_text(branches[-1])
                text += final_branch_text
                
                specs.append(f"  - {text}")
            else:
                # Generate text for simple operations
                operation_text = self._operation_to_text(operation)
                specs.append(f"  - arg_{arg_num}: {operation_text}")
        
        return specs
    
    def _operation_to_text(self, operation: Dict[str, Any]) -> str:
        """Convert an operation dictionary back to its text representation"""
        if operation["type"] == "lookup":
            attr = operation["attribute"]
            return f"The original lookup value of {attr} from the selected profile."
        elif operation["type"] == "constant":
            value = operation["value"]
            return f"A constant value of {value}."
        elif operation["type"] == "two_element":
            op_type = operation["op_type"]
            operands = operation["operands"]
            op1, op2 = operands[0], operands[1]
            
            if op_type == "sum":
                return f"The sum of {op1} and {op2}."
            elif op_type == "product":
                return f"The product of {op1} and {op2}."
            elif op_type == "diff":
                return f"The result of {op1} minus {op2}."
            elif op_type == "max":
                return f"The maximum between {op1} and {op2}."
            elif op_type == "min":
                return f"The minimum between {op1} and {op2}."
            elif op_type == "modulo":
                return f"The result of {op1} modulo ({op2} + 1)."
            elif op_type == "avg":
                return f"The average of {op1} and {op2} (integer division)."
            elif op_type == "conditional":
                return f"{op1} if {op1} > {op2}, else {op2}."
            else:
                return f"A {op_type} operation on {op1} and {op2}."
        elif operation["type"] == "multi_element":
            op_type = operation["op_type"]
            operands = operation["operands"]
            elements_str = ', '.join(operands)
            
            if op_type == "sum_all":
                return f"The sum of all values: {elements_str}."
            elif op_type == "max_all":
                return f"The maximum among all values: {elements_str}."
            elif op_type == "min_all":
                return f"The minimum among all values: {elements_str}."
            elif op_type == "avg_all":
                return f"The average of all values: ({' + '.join(operands)}) divided by {len(operands)} (integer division)."
            elif op_type == "mod_sum":
                return f"The result of ({' + '.join(operands)}) modulo 100."
            elif op_type == "count_gt50":
                return f"The count of values greater than 50 among: {elements_str}."
            elif op_type == "range":
                return f"The range (max - min) among: {elements_str}."
            elif op_type == "sum_even":
                return f"The sum of even values among: {elements_str}."
            else:
                return f"A {op_type} operation on {elements_str}."
        else:
            return f"A computation operation of type {operation['type']}."
    
    def _select_task_layers(self, task_num: int) -> List[int]:
        """Select which layers a task will involve based on available layers"""
        # Generate any valid combination from available layers (1 to self.layers)
        available_layers = list(range(2, self.layers + 1))  # Start from layer 2 since layer 1 is always included
        
        # Randomly select how many additional layers to use (0 to all remaining layers)
        num_additional_layers = random.randint(0, len(available_layers))
        
        # Always include layer 1, then add randomly selected additional layers
        selected_layers = [1]  # Always include layer 1
        if num_additional_layers > 0:
            additional_layers = random.sample(available_layers, num_additional_layers)
            selected_layers.extend(additional_layers)
        
        # Sort and store the task requirements
        selected_layers = sorted(selected_layers)
        self.task_requirements[task_num] = selected_layers
        
        return selected_layers
    
    def _generate_profile_requirements(self, involved_layers: List[int]) -> List[str]:
        """Generate requirements for which profile instances to access"""
        requirements = []
        
        layer_list = ", ".join([f"layer {layer}" for layer in involved_layers])
        requirements.append(f"- The agent must access one profile instance at each of the {layer_list} according to the user request,")
        
        return requirements
    
    def _generate_input_specifications(self, task_num: int, involved_layers: List[int]) -> List[str]:
        """Generate input specifications based on all available condition attributes and global attributes, with if-else structure if structure_complexity > 1."""
        specs = []
        specs.append(f"- The agent should pass the following arguments into the finish_task_{task_num} tool call:")

        # Collect all condition and lookup attributes from all involved layers
        all_condition_attrs = []
        all_lookup_attrs = []

        for layer in involved_layers:
            layer_attrs = self.attribute_dict[layer - 1]
            for attr_num, attr_type in layer_attrs.items():
                if attr_type == "condition":
                    all_condition_attrs.append(f"layer_{layer}_attribute_{attr_num}")
                elif attr_type == "lookup":
                    all_lookup_attrs.append(f"layer_{layer}_attribute_{attr_num}")

        # Add global attributes to available pool
        global_attrs = [f"global_attribute_{i}" for i in range(1, self.num_global_attributes + 1)]

        # Use fixed number of input requirements based on args_num parameter
        #max_possible_inputs = len(all_condition_attrs) + len(all_lookup_attrs) + len(global_attrs)
        num_inputs = self.args_num

        # Initialize task operations storage
        self.task_operations[task_num] = []

        for i in range(1, num_inputs + 1):
            if self.structure_complexity == 1:
                input_req, operation = self._generate_complex_input_requirement(i, all_condition_attrs, all_lookup_attrs, global_attrs)
                specs.append(f"  - {input_req}")
                self.task_operations[task_num].append(operation)
            else:
                # For structure_complexity > 1, generate nested/sequential if-else logic
                branches = []
                branch_ops = []
                for branch in range(self.structure_complexity):
                    # For each branch, sample a new operation for the argument
                    branch_req, branch_op = self._generate_complex_input_requirement(i, all_condition_attrs, all_lookup_attrs, global_attrs)
                    branches.append((branch_req, branch_op))
                    branch_ops.append(branch_op)
                # Generate if-else conditions (comparisons between two sampled expressions)
                conditions = []
                cond_exprs = []
                # Only use numeric attributes for if-else conditions
                numeric_attrs = all_condition_attrs + global_attrs
                for cond_idx in range(self.structure_complexity - 1):
                    # Sample two expressions for comparison, but only from numeric attributes
                    left_req, left_op = self._generate_complex_input_requirement(i, numeric_attrs, [], global_attrs, for_condition=True)
                    right_req, right_op = self._generate_complex_input_requirement(i, numeric_attrs, [], global_attrs, for_condition=True)
                    # Use sum as the default operation for condition expressions
                    left_expr = left_op.get('code', '0') if 'code' in left_op else left_op.get('attribute', '0')
                    right_expr = right_op.get('code', '0') if 'code' in right_op else right_op.get('attribute', '0')
                    cond_exprs.append((left_expr, right_expr))
                    conditions.append((left_req, right_req))
                # Build the policy text for this argument
                text = f"arg_{i}: "
                for cond_idx in range(self.structure_complexity - 1):
                    left_req, right_req = conditions[cond_idx]
                    text += f"If {left_req.split(':',1)[-1].strip()} > {right_req.split(':',1)[-1].strip()}, then {branches[cond_idx][0]} else "
                text += f"{branches[-1][0]}"
                specs.append(f"  - {text}")
                # Store the if-else structure for code generation
                self.task_operations[task_num].append({
                    'type': 'ifelse',
                    'arg_num': i,
                    'branches': branch_ops,
                    'conditions': cond_exprs
                })
        return specs
    
    def _generate_complex_input_requirement(self, arg_num: int, condition_attrs: List[str], lookup_attrs: List[str], global_attrs: List[str], for_condition: bool = False) -> Tuple[str, Dict[str, Any]]:
        """Generate a complex input requirement using multiple attributes and operations. If for_condition is True, do not use lookup attributes."""
        # If for_condition is True, do not use lookup attributes at all
        if for_condition:
            lookup_attrs = []
        # Decide if this should be a lookup attribute (use original value) or computation
        if lookup_attrs and not for_condition and random.random() < 0.2:  # 20% chance for lookup
            lookup_attr = random.choice(lookup_attrs)
            operation = {
                "type": "lookup",
                "arg_num": arg_num,
                "attribute": lookup_attr
            }
            return f"arg_{arg_num}: The original lookup value of {lookup_attr} from the selected profile.", operation
        # Otherwise, create a complex computation
        available_attrs = condition_attrs + global_attrs
        if not available_attrs:
            operation = {
                "type": "constant",
                "arg_num": arg_num,
                "value": 1
            }
            return f"arg_{arg_num}: A constant value of 1.", operation
        # Sample 1-3 attributes and 1-2 constants, total should be 2 or more
        num_attrs = random.randint(1, min(3, len(available_attrs)))
        num_constants = random.randint(1, 2)
        # Ensure total is at least 2
        total_elements = num_attrs + num_constants
        if total_elements < 2:
            if len(available_attrs) >= 2:
                num_attrs = 2
                num_constants = 0
            else:
                num_attrs = 1
                num_constants = 1
        selected_attrs = random.sample(available_attrs, num_attrs) if available_attrs else []
        selected_constants = [random.randint(0, 100) for _ in range(num_constants)]
        # If we have exactly 2 elements (attr + constant or 2 attrs), use two-element operations
        if len(selected_attrs) + len(selected_constants) == 2:
            text, operation = self._generate_two_element_operation(arg_num, selected_attrs, selected_constants)
            return text, operation
        else:
            text, operation = self._generate_multi_element_operation(arg_num, selected_attrs, selected_constants)
            return text, operation
    
    def _generate_two_element_operation(self, arg_num: int, attrs: List[str], constants: List[int]) -> Tuple[str, Dict[str, Any]]:
        """Generate operation with exactly two elements (attributes and/or constants)"""
        # Combine attributes and constants into a single list of operands
        operands = attrs + [str(c) for c in constants]
        
        # Ensure we have exactly 2 operands
        if len(operands) != 2:
            # Fallback - this shouldn't happen with correct logic above
            if len(attrs) >= 2:
                operands = attrs[:2]
            elif len(attrs) == 1:
                operands = [attrs[0], str(random.randint(0, 100))]
            else:
                operands = [str(random.randint(0, 100)), str(random.randint(0, 100))]
        
        op1, op2 = operands[0], operands[1]
        
        # Define operations with both text and executable code
        operations = [
            ("sum", f"The sum of {op1} and {op2}", f"({op1}) + ({op2})"),
            ("product", f"The product of {op1} and {op2}", f"({op1}) * ({op2})"),
            ("diff", f"The result of {op1} minus {op2}", f"({op1}) - ({op2})"),
            ("max", f"The maximum between {op1} and {op2}", f"max({op1}, {op2})"),
            ("min", f"The minimum between {op1} and {op2}", f"min({op1}, {op2})"),
            ("modulo", f"The result of {op1} modulo ({op2} + 1)", f"({op1}) % (({op2}) + 1)"),
            ("avg", f"The average of {op1} and {op2} (integer division)", f"(({op1}) + ({op2})) // 2"),
            ("conditional", f"{op1} if {op1} > {op2}, else {op2}", f"({op1}) if ({op1}) > ({op2}) else ({op2})")
        ]
        
        op_type, text_desc, code_expr = random.choice(operations)
        
        operation = {
            "type": "two_element",
            "arg_num": arg_num,
            "op_type": op_type,
            "operands": [op1, op2],
            "code": code_expr,
            "attributes": [op for op in [op1, op2] if not op.isdigit()],
            "constants": [int(op) for op in [op1, op2] if op.isdigit()]
        }
        
        return f"arg_{arg_num}: {text_desc}.", operation
    
    def _generate_multi_element_operation(self, arg_num: int, attrs: List[str], constants: List[int]) -> Tuple[str, Dict[str, Any]]:
        """Generate operation with multiple elements (attributes and constants)"""
        # Combine attributes and constants
        all_elements = attrs + [str(c) for c in constants]
        elements_str = ', '.join(all_elements)
        
        # Define operations with both text and executable code
        operations = [
            ("sum_all", f"The sum of all values: {elements_str}", f"sum([{', '.join(all_elements)}])"),
            ("max_all", f"The maximum among all values: {elements_str}", f"max([{', '.join(all_elements)}])"),
            ("min_all", f"The minimum among all values: {elements_str}", f"min([{', '.join(all_elements)}])"),
            ("avg_all", f"The average of all values: ({' + '.join(all_elements)}) divided by {len(all_elements)} (integer division)", f"sum([{', '.join(all_elements)}]) // {len(all_elements)}"),
            ("mod_sum", f"The result of ({' + '.join(all_elements)}) modulo 100", f"sum([{', '.join(all_elements)}]) % 100"),
            ("count_gt50", f"The count of values greater than 50 among: {elements_str}", f"sum(1 for x in [{', '.join(all_elements)}] if x > 50)"),
            ("range", f"The range (max - min) among: {elements_str}", f"max([{', '.join(all_elements)}]) - min([{', '.join(all_elements)}])"),
            ("sum_even", f"The sum of even values among: {elements_str}", f"sum(x for x in [{', '.join(all_elements)}] if x % 2 == 0)")
        ]
        
        op_type, text_desc, code_expr = random.choice(operations)
        
        operation = {
            "type": "multi_element",
            "arg_num": arg_num,
            "op_type": op_type,
            "operands": all_elements,
            "code": code_expr,
            "attributes": attrs,
            "constants": constants
        }
        
        return f"arg_{arg_num}: {text_desc}.", operation
    
    def _generate_completion_requirements(self, task_num: int, involved_layers: List[int]) -> List[str]:
        """Generate completion requirements for the task"""
        requirements = []
        
        if len(involved_layers) == 1:
            requirements.append(f"- The agent should call the finish_task_{task_num} tool with the arguments above for the selected profile instance.")
        else:
            requirements.append(f"- Each task_{task_num} completion requires exactly one profile from each of the specified layers.")
            requirements.append(f"- The agent should call the finish_task_{task_num} tool with arguments from one instance per layer at a time.")
            
        if len(involved_layers) > 2:
            requirements.append("- Multiple function calls may be needed if multiple profile combinations are requested.")
        
        return requirements
    
    def generate_general_policies(self) -> List[str]:
        """Generate general policy constraints"""
        return [
            "",
            "## Policy Specifications",
            "",
            "### General Policy 1",
            "The agent must first get access to the profile instance at layer 1 according to the user specified primary key, alternatively, the agent may also search for the profile instance at layer 1 when the user did not provide a profile instance at layer 1 and instead provided a lookup field in profile layer 1.",
            "",
            "### General Policy 2", 
            "The agent should always finish the task with the task required attribute combinations at one time. If users specify multiple attribute combinations for the task (e.g., 'doing task i for all the instances accessd in layer 1.'), the agent must call the finish task tool multiple times and only address one attribute combination at a time."
        ]
    
    def generate_policy(self) -> str:
        """Generate a complete policy"""
        global_attrs = self.generate_global_attributes()
        
        policy_content = []
        instructions, policy_id = self.generate_general_instructions(global_attrs)
        policy_content.extend(instructions)
        policy_content.extend(self.generate_domain_basic())
        policy_content.extend(self.generate_tool_calling_instructions())
        policy_content.extend(self.generate_general_policies())
        policy_content.extend(self.generate_task_specifications())
        
        return "\n".join(policy_content)
    
    def get_task_requirements(self) -> Dict[int, List[int]]:
        """Get the generated task requirements dictionary"""
        return self.task_requirements.copy()
    
    def get_task_layer_mapping(self) -> Dict[str, List[int]]:
        """Get the task requirements as a dictionary with string keys mapping task numbers to their required layers"""
        return {str(task_num): layers for task_num, layers in self.task_requirements.items()}
    
    def generate_policy_qa(self, policy_id: int, global_attrs: Dict[str, int]) -> List[Dict[str, str]]:
        """Generate questions and answers about the policy content"""
        qa_pairs = []
        policy_id_str = f"#P{policy_id:05d}"
        
        # 1. Questions about global attributes
        for i in range(1, self.num_global_attributes + 1):
            attr_key = f"Global_Attribute_Value{i}"
            if attr_key in global_attrs:
                question = f"What is the value of global_attribute_{i} in Policy {policy_id_str}?"
                answer = str(global_attrs[attr_key])
                qa_pairs.append({
                    "question": question,
                    "answer": answer,
                    "category": "global_attributes"
                })
        
        # 2. Question about number of tasks
        question = f"How many tasks does Policy {policy_id_str} specify the agent to do?"
        answer = str(self.task_types)
        qa_pairs.append({
            "question": question,
            "answer": answer,
            "category": "task_count"
        })
        
        # 3. Questions about task argument computations
        for task_num in sorted(self.task_operations.keys()):
            operations = self.task_operations[task_num]
            for i, operation in enumerate(operations):
                arg_num = operation["arg_num"]
                question = f"How to compute arg_{arg_num} in task_{task_num} in Policy {policy_id_str}?"
                
                # Generate answer based on operation type
                if operation["type"] == "lookup":
                    attr = operation["attribute"]
                    answer = f"The original lookup value of {attr} from the selected profile."
                elif operation["type"] == "constant":
                    value = operation["value"]
                    answer = f"A constant value of {value}."
                elif operation["type"] == "two_element":
                    op_type = operation["op_type"]
                    operands = operation["operands"]
                    op1, op2 = operands[0], operands[1]
                    if op_type == "sum":
                        answer = f"The sum of {op1} and {op2}."
                    elif op_type == "product":
                        answer = f"The product of {op1} and {op2}."
                    elif op_type == "diff":
                        answer = f"The result of {op1} minus {op2}."
                    elif op_type == "max":
                        answer = f"The maximum between {op1} and {op2}."
                    elif op_type == "min":
                        answer = f"The minimum between {op1} and {op2}."
                    elif op_type == "modulo":
                        answer = f"The result of {op1} modulo ({op2} + 1)."
                    elif op_type == "avg":
                        answer = f"The average of {op1} and {op2} (integer division)."
                    elif op_type == "conditional":
                        answer = f"{op1} if {op1} > {op2}, else {op2}."
                    else:
                        answer = f"A {op_type} operation on {op1} and {op2}."
                elif operation["type"] == "multi_element":
                    op_type = operation["op_type"]
                    operands = operation["operands"]
                    elements_str = ', '.join(operands)
                    if op_type == "sum_all":
                        answer = f"The sum of all values: {elements_str}."
                    elif op_type == "max_all":
                        answer = f"The maximum among all values: {elements_str}."
                    elif op_type == "min_all":
                        answer = f"The minimum among all values: {elements_str}."
                    elif op_type == "avg_all":
                        answer = f"The average of all values: ({' + '.join(operands)}) divided by {len(operands)} (integer division)."
                    elif op_type == "mod_sum":
                        answer = f"The result of ({' + '.join(operands)}) modulo 100."
                    elif op_type == "count_gt50":
                        answer = f"The count of values greater than 50 among: {elements_str}."
                    elif op_type == "range":
                        answer = f"The range (max - min) among: {elements_str}."
                    elif op_type == "sum_even":
                        answer = f"The sum of even values among: {elements_str}."
                    else:
                        answer = f"A {op_type} operation on {elements_str}."
                elif operation["type"] == "ifelse":
                    # For if-else operations, reconstruct the full if-else structure text
                    branches = operation['branches']
                    conditions = operation['conditions']
                    
                    # Generate the text for this if-else structure (same logic as in policy generation)
                    text = ""
                    for cond_idx in range(len(conditions)):
                        left_expr, right_expr = conditions[cond_idx]
                        branch_text = self._operation_to_text(branches[cond_idx])
                        if cond_idx == 0:
                            text += f"If {left_expr} > {right_expr}, then {branch_text} else "
                        else:
                            text += f"if {left_expr} > {right_expr}, then {branch_text} else "
                    
                    # Add final branch
                    final_branch_text = self._operation_to_text(branches[-1])
                    text += final_branch_text
                    
                    answer = text
                else:
                    answer = f"A computation operation of type {operation['type']}."
                
                qa_pairs.append({
                    "question": question,
                    "answer": answer,
                    "category": "task_computation"
                })
        
        return qa_pairs
    
    def save_policy(self, output_path: str, generate_variants: bool = True):
        """Generate and save a policy to the specified path as markdown"""
        # Generate global attributes once and use for both policy and exec code
        global_attrs = self.generate_global_attributes()
        
        # Generate policy using these global attributes
        policy_content = []
        instructions, policy_id = self.generate_general_instructions(global_attrs)
        policy_content.extend(instructions)
        policy_content.extend(self.generate_domain_basic())
        policy_content.extend(self.generate_tool_calling_instructions())
        policy_content.extend(self.generate_general_policies())
        policy_content.extend(self.generate_task_specifications())
        
        policy_text = "\n".join(policy_content)
        
        # Create directory if it doesn't exist
        os.makedirs(os.path.dirname(output_path), exist_ok=True)
        
        with open(output_path, 'w', encoding='utf-8') as f:
            f.write(policy_text)
        
        print(f"Policy generated and saved to: {output_path}")
        
        # Generate and save Q&A pairs
        qa_pairs = self.generate_policy_qa(policy_id, global_attrs)
        qa_output_path = os.path.join(os.path.dirname(output_path), "Policy_QA.json")
        
        with open(qa_output_path, 'w', encoding='utf-8') as f:
            json.dump(qa_pairs, f, indent=2, ensure_ascii=False)
        
        print(f"Policy Q&A generated and saved to: {qa_output_path}")
        print(f"Generated {len(qa_pairs)} Q&A pairs covering:")
        print(f"  - {self.num_global_attributes} global attribute questions")
        print(f"  - 1 task count question") 
        print(f"  - {len(qa_pairs) - self.num_global_attributes - 1} task computation questions")
        
        # Generate and save executable code using the same base directory as the policy
        # Extract base directory from output_path (e.g., "Generated_data_layer_3_task_5/Policy/Policy.md" -> "Generated_data_layer_3_task_5")
        base_dir = os.path.dirname(os.path.dirname(output_path))
        exec_output_path = os.path.join(base_dir, "Task", "exec.py")
        self.save_exec_code(exec_output_path, global_attrs)
        
        # Generate variants if requested
        if generate_variants:
            self.generate_policy_variants(output_path, policy_id, global_attrs, base_dir)
        
        # Output the task requirements
        print(f"\nGenerated task requirements:")
        print("custom_task_requirements = {")
        for task_num in sorted(self.task_requirements.keys()):
            layers = self.task_requirements[task_num]
            if task_num == max(self.task_requirements.keys()):
                print(f"    {task_num}: {layers}     # Task_Type_{task_num}: {self._format_layers_description(layers)}")
            else:
                print(f"    {task_num}: {layers},    # Task_Type_{task_num}: {self._format_layers_description(layers)}")
        print("}")
        
        return policy_text
    
    def generate_policy_variants(self, original_output_path: str, original_policy_id: int, original_global_attrs: Dict[str, int], base_dir: str):
        """Generate policy and task level variants"""
        print(f"\n🔄 Generating policy variants...")
        
        # Generate policy-level variant
        self.generate_policy_level_variant(original_output_path, base_dir)
        
        # Generate task-level variant
        self.generate_task_level_variant(original_output_path, original_policy_id, original_global_attrs, base_dir)
        
        print(f"✅ Policy variants generated successfully!")
    
    def generate_policy_level_variant(self, original_output_path: str, base_dir: str):
        """Generate a completely different policy variant"""
        print(f"  📝 Generating policy-level variant...")
        
        # Store original state
        original_task_requirements = self.task_requirements.copy()
        original_task_operations = self.task_operations.copy()
        
        # Clear for fresh generation
        self.task_requirements = {}
        self.task_operations = {}
        
        # Generate new global attributes
        variant_global_attrs = self.generate_global_attributes()
        
        # Generate variant policy
        policy_content = []
        instructions, variant_policy_id = self.generate_general_instructions(variant_global_attrs)
        policy_content.extend(instructions)
        policy_content.extend(self.generate_domain_basic())
        policy_content.extend(self.generate_tool_calling_instructions())
        policy_content.extend(self.generate_general_policies())
        policy_content.extend(self.generate_task_specifications())
        
        variant_policy_text = "\n".join(policy_content)
        
        # Save variant policy
        variant_output_path = os.path.join(os.path.dirname(original_output_path), "overide_policy.md")
        with open(variant_output_path, 'w', encoding='utf-8') as f:
            f.write(variant_policy_text)
        
        print(f"    💾 Policy variant saved to: {variant_output_path}")
        
        # Generate Q&A for variant policy
        variant_qa_pairs = self.generate_policy_qa(variant_policy_id, variant_global_attrs)
        variant_qa_output_path = os.path.join(os.path.dirname(original_output_path), "Policy_QA_overide_policy.json")
        
        with open(variant_qa_output_path, 'w', encoding='utf-8') as f:
            json.dump(variant_qa_pairs, f, indent=2, ensure_ascii=False)
        
        print(f"    💾 Policy variant Q&A saved to: {variant_qa_output_path}")
        
        # Generate exec code for variant
        variant_exec_path = os.path.join(base_dir, "Task", "exec_overide_policy.py")
        self.save_exec_code(variant_exec_path, variant_global_attrs, function_name_suffix="_overide_policy")
        
        print(f"    💾 Policy variant exec saved to: {variant_exec_path}")
        
        # Restore original state
        self.task_requirements = original_task_requirements
        self.task_operations = original_task_operations
    
    def generate_task_level_variant(self, original_output_path: str, original_policy_id: int, original_global_attrs: Dict[str, int], base_dir: str):
        """Generate a policy variant with one task changed"""
        print(f"  📝 Generating task-level variant...")
        
        # Store original state
        original_task_requirements = self.task_requirements.copy()
        original_task_operations = self.task_operations.copy()
        
        # Choose a random task to modify
        task_to_modify = random.choice(list(self.task_requirements.keys()))
        print(f"    🎯 Modifying Task_Type_{task_to_modify}")
        
        # Store the original task operation for this task
        original_task_op = self.task_operations[task_to_modify].copy()
        
        # Clear only the selected task and regenerate it
        if task_to_modify in self.task_operations:
            del self.task_operations[task_to_modify]
        
        # Regenerate just this task with different parameters
        involved_layers = self.task_requirements[task_to_modify]
        
        # Generate new input specifications for this task only
        self._generate_input_specifications_for_task(task_to_modify, involved_layers)
        
        # Generate variant policy with modified task - preserve original content except for the modified task
        policy_content = []
        instructions, variant_policy_id = self.generate_general_instructions(original_global_attrs)
        # Update policy ID to indicate task variant
        instructions[0] = f"# Agent Policy Document #P{original_policy_id:05d}-T{task_to_modify}"
        
        policy_content.extend(instructions)
        policy_content.extend(self.generate_domain_basic())
        policy_content.extend(self.generate_tool_calling_instructions())
        policy_content.extend(self.generate_general_policies())
        
        # Generate task specifications with only the modified task changed
        policy_content.extend(self.generate_task_specifications_with_variant(task_to_modify, original_task_operations))
        
        variant_policy_text = "\n".join(policy_content)
        
        # Save variant policy
        variant_output_path = os.path.join(os.path.dirname(original_output_path), "overide_task.md")
        with open(variant_output_path, 'w', encoding='utf-8') as f:
            f.write(variant_policy_text)
        
        print(f"    💾 Task variant saved to: {variant_output_path}")
        
        # Generate Q&A for variant policy
        variant_qa_pairs = self.generate_policy_qa(variant_policy_id, original_global_attrs)
        variant_qa_output_path = os.path.join(os.path.dirname(original_output_path), "Policy_QA_overide_task.json")
        
        with open(variant_qa_output_path, 'w', encoding='utf-8') as f:
            json.dump(variant_qa_pairs, f, indent=2, ensure_ascii=False)
        
        print(f"    💾 Task variant Q&A saved to: {variant_qa_output_path}")
        
        # Generate exec code for variant - need to temporarily set up all task operations
        # Combine original operations with the modified task operation
        variant_task_operations = original_task_operations.copy()
        variant_task_operations[task_to_modify] = self.task_operations[task_to_modify]
        
        # Temporarily set task_operations to include all tasks for exec generation
        temp_task_operations = self.task_operations
        self.task_operations = variant_task_operations
        
        variant_exec_path = os.path.join(base_dir, "Task", "exec_overide_task.py")
        self.save_exec_code(variant_exec_path, original_global_attrs, function_name_suffix="_overide_task")
        
        print(f"    💾 Task variant exec saved to: {variant_exec_path}")
        
        # Restore original state
        self.task_requirements = original_task_requirements
        self.task_operations = original_task_operations
    
    def _generate_input_specifications_for_task(self, task_num: int, involved_layers: List[int]) -> List[str]:
        """Generate input specifications for a single task (used in task variant generation)"""
        # Collect all condition and lookup attributes from all involved layers
        all_condition_attrs = []
        all_lookup_attrs = []

        for layer in involved_layers:
            layer_attrs = self.attribute_dict[layer - 1]
            for attr_num, attr_type in layer_attrs.items():
                if attr_type == "condition":
                    all_condition_attrs.append(f"layer_{layer}_attribute_{attr_num}")
                elif attr_type == "lookup":
                    all_lookup_attrs.append(f"layer_{layer}_attribute_{attr_num}")

        # Add global attributes to available pool
        global_attrs = [f"global_attribute_{i}" for i in range(1, self.num_global_attributes + 1)]

        # Use fixed number of input requirements based on args_num parameter
        num_inputs = self.args_num

        # Initialize task operations storage for this task
        self.task_operations[task_num] = []

        for i in range(1, num_inputs + 1):
            if self.structure_complexity == 1:
                input_req, operation = self._generate_complex_input_requirement(i, all_condition_attrs, all_lookup_attrs, global_attrs)
                self.task_operations[task_num].append(operation)
            else:
                # For structure_complexity > 1, generate nested/sequential if-else logic
                branches = []
                branch_ops = []
                for branch in range(self.structure_complexity):
                    # For each branch, sample a new operation for the argument
                    branch_req, branch_op = self._generate_complex_input_requirement(i, all_condition_attrs, all_lookup_attrs, global_attrs)
                    branches.append((branch_req, branch_op))
                    branch_ops.append(branch_op)
                # Generate if-else conditions (comparisons between two sampled expressions)
                conditions = []
                cond_exprs = []
                # Only use numeric attributes for if-else conditions
                numeric_attrs = all_condition_attrs + global_attrs
                for cond_idx in range(self.structure_complexity - 1):
                    # Sample two expressions for comparison, but only from numeric attributes
                    left_req, left_op = self._generate_complex_input_requirement(i, numeric_attrs, [], global_attrs, for_condition=True)
                    right_req, right_op = self._generate_complex_input_requirement(i, numeric_attrs, [], global_attrs, for_condition=True)
                    # Use sum as the default operation for condition expressions
                    left_expr = left_op.get('code', '0') if 'code' in left_op else left_op.get('attribute', '0')
                    right_expr = right_op.get('code', '0') if 'code' in right_op else right_op.get('attribute', '0')
                    cond_exprs.append((left_expr, right_expr))
                    conditions.append((left_req, right_req))
                # Store the if-else structure for code generation
                self.task_operations[task_num].append({
                    'type': 'ifelse',
                    'arg_num': i,
                    'branches': branch_ops,
                    'conditions': cond_exprs
                })
    
    def _format_layers_description(self, layers: List[int]) -> str:
        """Format layer description for the comment"""
        if len(layers) == 1:
            return f"layer {layers[0]} only"
        elif len(layers) == self.layers:
            return "all layers"
        else:
            layer_str = ", ".join(map(str, layers[:-1])) + f" and {layers[-1]}"
            return f"layers {layer_str}"
    
    def generate_exec_code(self, global_attrs: Dict[str, int], function_name_suffix: str = "") -> str:
        """Generate executable Python code for computing task arguments"""
        code_lines = [
            "# Auto-generated task computation functions",
            "# This file contains functions to compute task arguments based on instance values",
            "",
            "# Global attributes (generated during policy creation)",
        ]
        
        # Add global attributes as constants
        for attr_name, attr_value in global_attrs.items():
            code_lines.append(f"{attr_name.upper()} = {attr_value}")
        
        code_lines.extend([
            "",
            f"def get_attribute_value{function_name_suffix}(instances, attr_name):",
            "    \"\"\"",
            "    Extract attribute value from instances or global attributes.",
            "    ",
            "    Args:",
            "        instances: Dict mapping layer numbers to instance data",
            "        attr_name: String like 'layer_{1}_attribute_{2}' or 'global_attribute_1'",
            "    \"\"\"",
            "    if attr_name.startswith('global_attribute_'):",
            "        attr_num = attr_name.split('_')[-1]",
            "        global_var_name = f'GLOBAL_ATTRIBUTE_VALUE{attr_num}'.upper()",
            "        return globals().get(global_var_name, 0)",
            "    ",
            "    # Parse layer_{X}_attribute_{Y} format",
            "    parts = attr_name.replace('{', '').replace('}', '').split('_')",
            "    if len(parts) >= 4 and parts[0] == 'layer' and parts[2] == 'attribute':",
            "        layer_num = int(parts[1])",
            "        attr_num = parts[3]",
            "        if layer_num in instances and f'Profile_{layer_num}_Attribute_{attr_num}' in instances[layer_num]:",
            "            return instances[layer_num][f'Profile_{layer_num}_Attribute_{attr_num}']",
            "    ",
            "    return 0  # Default value if attribute not found",
            "",
            ""
        ])
        
        # Generate individual task functions
        for task_num in sorted(self.task_operations.keys()):
            operations = self.task_operations[task_num]
            code_lines.extend(self._generate_task_function(task_num, operations, function_name_suffix))
            code_lines.append("")
        
        # Generate master function that calls all task functions
        code_lines.extend([
            f"def compute_all_tasks{function_name_suffix}(instances):",
            "    \"\"\"",
            "    Compute arguments for all tasks.",
            "    ",
            "    Args:",
            "        instances: Dict mapping layer numbers to instance data",
            "    ",
            "    Returns:",
            "        Dict mapping task numbers to their computed arguments",
            "    \"\"\"",
            "    results = {}",
        ])
        
        for task_num in sorted(self.task_operations.keys()):
            code_lines.append(f"    results[{task_num}] = compute_task_{task_num}{function_name_suffix}(instances)")
        
        code_lines.extend([
            "    return results",
            "",
            "# Example usage:",
            "# instances = {",
            "#     1: {'Profile_1_Attribute_1': 25, 'Profile_1_Attribute_2': 75, ...},",
            "#     2: {'Profile_2_Attribute_1': 50, 'Profile_2_Attribute_2': 30, ...},",
            "# }",
            f"# results = compute_all_tasks{function_name_suffix}(instances)"
        ])
        
        return "\n".join(code_lines)
    
    def _extract_attribute_vars(self, code_str: str) -> set:
        """Extract all attribute variable names from a code string."""
        # Matches layer_1_attribute_2, global_attribute_1, etc.
        pattern = r'(layer_\d+_attribute_\d+|global_attribute_\d+)'
        return set(re.findall(pattern, code_str))
    
    def _generate_task_function(self, task_num: int, operations: List[Dict[str, Any]], function_name_suffix: str = "") -> List[str]:
        """Generate a function for computing one task's arguments, supporting if-else structure if needed. All attribute values are obtained at the beginning."""
        function_lines = [
            f"def compute_task_{task_num}{function_name_suffix}(instances):",
            f"    \"\"\"",
            f"    Compute arguments for Task_Type_{task_num}.",
            f"    ",
            f"    Args:",
            f"        instances: Dict mapping layer numbers to instance data",
            f"    ",
            f"    Returns:",
            f"        List of computed argument values",
            f"    \"\"\"",
            f"    args = []",
            f""
        ]
        # --- Collect all attributes used in all operations and conditions ---
        used_attrs = set()
        for operation in operations:
            if operation["type"] == "ifelse":
                all_ops = operation['branches']
                all_conds = operation['conditions']
                for op in all_ops:
                    if op["type"] in ["two_element", "multi_element"]:
                        # Extract from code
                        used_attrs.update(self._extract_attribute_vars(op["code"]))
                    elif op["type"] == "lookup":
                        used_attrs.add(op["attribute"])
                for left_expr, right_expr in all_conds:
                    used_attrs.update(self._extract_attribute_vars(left_expr))
                    used_attrs.update(self._extract_attribute_vars(right_expr))
            else:
                if operation["type"] == "lookup":
                    used_attrs.add(operation["attribute"])
                elif operation["type"] in ["two_element", "multi_element"]:
                    used_attrs.update(self._extract_attribute_vars(operation["code"]))
        # --- Generate code to get all needed attribute values at the top ---
        for attr in sorted(used_attrs):
            clean_attr = attr.replace('{', '').replace('}', '')
            function_lines.append(f"    {clean_attr} = get_attribute_value{function_name_suffix}(instances, '{attr}')")
        function_lines.append("")
        # --- Now generate the logic for each argument ---
        for i, operation in enumerate(operations):
            arg_num = operation["arg_num"]
            if operation["type"] == "ifelse":
                all_ops = operation['branches']
                all_conds = operation['conditions']
                indent = "    "
                for cond_idx, (left_expr, right_expr) in enumerate(operation['conditions']):
                    left_code = left_expr
                    right_code = right_expr
                    for attr in used_attrs:
                        clean_attr = attr.replace('{', '').replace('}', '')
                        left_code = left_code.replace(attr, clean_attr)
                        right_code = right_code.replace(attr, clean_attr)
                    function_lines.append(f"{indent}if {left_code} > {right_code}:")
                    branch_op = operation['branches'][cond_idx]
                    branch_lines = self._generate_task_function_branch(arg_num, branch_op, used_attrs, indent + "    ")
                    function_lines.extend(branch_lines)
                    function_lines.append(f"{indent}    args.append(value_{arg_num})")
                    function_lines.append(f"{indent}else:")
                    indent += "    "
                branch_op = operation['branches'][-1]
                branch_lines = self._generate_task_function_branch(arg_num, branch_op, used_attrs, indent)
                function_lines.extend(branch_lines)
                function_lines.append(f"{indent}args.append(value_{arg_num})")
            else:
                if operation["type"] == "lookup":
                    attr = operation["attribute"]
                    clean_attr = attr.replace('{', '').replace('}', '')
                    function_lines.extend([
                        f"    # arg_{arg_num}: Lookup operation",
                        f"    value_{arg_num} = {clean_attr}",
                        f"    args.append(value_{arg_num})",
                        f""
                    ])
                elif operation["type"] == "constant":
                    value = operation["value"]
                    function_lines.extend([
                        f"    # arg_{arg_num}: Constant value",
                        f"    value_{arg_num} = {value}",
                        f"    args.append(value_{arg_num})",
                        f""
                    ])
                elif operation["type"] in ["two_element", "multi_element"]:
                    code_expr = operation["code"]
                    attributes = operation.get("attributes", [])
                    function_lines.append(f"    # arg_{arg_num}: {operation['op_type']} operation")
                    clean_code = code_expr
                    for attr in attributes:
                        if not attr.isdigit():
                            clean_attr = attr.replace('{', '').replace('}', '')
                            clean_code = clean_code.replace(f"({attr})", clean_attr).replace(attr, clean_attr)
                    function_lines.extend([
                        f"    value_{arg_num} = {clean_code}",
                        f"    args.append(value_{arg_num})",
                        f""
                    ])
        function_lines.append("    return args")
        return function_lines

    def _generate_task_function_branch(self, arg_num, operation, used_attrs, indent):
        """Helper to generate code for a branch in an if-else structure."""
        lines = []
        if operation["type"] == "lookup":
            attr = operation["attribute"]
            clean_attr = attr.replace('{', '').replace('}', '')
            lines.append(f"{indent}value_{arg_num} = {clean_attr}")
        elif operation["type"] == "constant":
            value = operation["value"]
            lines.append(f"{indent}value_{arg_num} = {value}")
        elif operation["type"] in ["two_element", "multi_element"]:
            code_expr = operation["code"]
            attributes = operation.get("attributes", [])
            clean_code = code_expr
            for attr in attributes:
                if not attr.isdigit():
                    clean_attr = attr.replace('{', '').replace('}', '')
                    clean_code = clean_code.replace(f"({attr})", clean_attr).replace(attr, clean_attr)
            lines.append(f"{indent}value_{arg_num} = {clean_code}")
        return lines
    
    def save_exec_code(self, output_path: str, global_attrs: Dict[str, int], function_name_suffix: str = ""):
        """Generate and save the executable code to the specified path"""
        exec_code = self.generate_exec_code(global_attrs, function_name_suffix)
        
        # Create directory if it doesn't exist
        os.makedirs(os.path.dirname(output_path), exist_ok=True)
        
        with open(output_path, 'w', encoding='utf-8') as f:
            f.write(exec_code)
        
        print(f"Executable code generated and saved to: {output_path}")

if __name__ == "__main__":
    # Generate a policy
    generator = PolicyGenerator()
    output_path = "Generated_data/Policy/Policy.md"
    
    policy_content = generator.save_policy(output_path)
    
    print(f"\nGenerated files:")
    print(f"- Policy: {output_path}")
    print(f"- Executable code: Generated_data/Task/exec.py")
    print(f"\nThe executable code contains functions to compute task arguments from instance values.")
    print(f"Use compute_all_tasks(instances) to get results for all tasks.") 