# Interaction definitions. Each list item gives a name, a dotted class path,
# and the config mapping written for that class.
interaction:
  - name: 'ver_k_retry'
    class_name: 'verl.interactions.ver_k_retry_interaction.VerKRetryInteraction'
    config:
      # Maze verifier: a callable that validates the path on the maze grid.
      verifier_type: 'callable'
      # NOTE(review): looks like a "module.path:attribute" reference to the
      # verifier callable -- confirm the expected format against the loader.
      verifier_fn_path: 'examples.reward_fns.maze_path_reward:verifier_fn'

      # Only used for logging/history; the callable verifier works on the
      # full attempt_text rather than on the extracted answer.
      answer_extraction: 'answer_tag'

      # History settings.
      # NOTE(review): presumably history_max_chars is irrelevant while
      # include_history is false -- confirm.
      include_history: false
      history_max_chars: 0

      # Turn metadata and attempt logging.
      # NOTE(review): the 0 values below look like "no limit" sentinels, and
      # the relative log path presumably resolves against the working
      # directory -- confirm both against the interaction class.
      track_turn_metadata: true
      log_attempts: true
      log_attempts_num_samples: 3
      log_attempts_max_per_instance: 0
      log_max_chars: 0
      log_file: './outputs/ver_k_retry_attempts_maze.log'
      log_file_overwrite: true

      # Feedback strings keyed by outcome. `incorrect` is a literal block
      # scalar, so its line breaks and a single trailing newline are part of
      # the value.
      feedback:
        correct: 'Correct. Stop.'
        incorrect: |
          Your previous attempt(s) were incorrect. Review them and try again.
          Solve the maze again from scratch, correcting any mistakes.
          Final answer must be a move string over U,D,L,R only in <answer>...</answer>.
        max_attempts_reached: 'Incorrect and maximum attempts reached. Stop.'
