# Configuration for the interestingness-guided (heuristic) policy.
# This policy uses HR interestingness functions to guide concept selection.

# Dotted path of the policy class this config points at.
# NOTE(review): `_target_` looks like the Hydra instantiate convention - confirm.
_target_: frame.policies.interestingness_guided_policy.InterestingnessGuidedPolicy
# Policy type identifier.
type: interestingness_guided

params:
  # How many of the top concepts are considered for production rules.
  top_k_concepts: 10

  # Sampling temperature; larger values make sampling more uniform.
  temperature: 1.5

  # Strategy used to select concepts.
  concept_selection: INTERESTINGNESS

  # Action selection is RULE_BASED_RANDOM so that it matches the original
  # heuristic behavior.
  action_selection: RULE_BASED_RANDOM

  # File that supplies the HR interestingness functions.
  # NOTE(review): path looks relative - confirm what directory it resolves against.
  interestingness_function_path: 'frame/interestingness/learning/generated_programs/hr_weighted.py'