{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "The autoreload extension is already loaded. To reload it, use:\n",
      "  %reload_ext autoreload\n"
     ]
    }
   ],
   "source": [
    "import sys\n",
    "sys.path.insert(0, '../')\n",
    "\n",
    "%load_ext autoreload\n",
    "%autoreload 2\n",
    "from src.self_improve.self_improve_search import *\n",
    "from src.searchlight.datastructures.graphs import ValueGraph2\n",
    "from src.GOPS.value_heuristic_evaluators import *\n",
    "from src.self_improve.self_improve_search import SelfImprovementInitialInferencer\n",
    "from src.llm_utils.llm_api_models import GPT35Multi\n",
    "from src.self_improve.proposers import LLMImprovementProposer\n",
    "from src.self_improve.prompts.improvement_prompts import *\n",
    "from src.searchlight.datastructures.adjusters import QValueAdjuster\n",
    "from src.searchlight.datastructures.estimators import UtilityEstimatorLast\n",
    "from src.GOPS.baseline_models_GOPS import *\n",
    "from src.llm_utils.func_list import *\n",
    "from src.searchlight.gameplay.simulators import GameSimulator\n",
    "from src.GOPS.examples.abstract_list3 import abstract_list\n",
    "from src.GOPS.examples.func_list3 import func_list\n",
    "from src.self_improve.analyzers import HeuristicsAnalyzer\n",
    "from src.self_improve.headers import *"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "An exception occurred: invalid syntax (<string>, line 53)\n"
     ]
    }
   ],
   "source": [
    "# create improvement proposer\n",
    "gpt = GPT35Multi(temperature=0.7, num_responses=2)\n",
    "proposer = LLMImprovementProposer(gpt, IMPROVEMENT_PROMPTS)\n",
    "\n",
    "# create GOPSValueHeuristicsSSGEvaluator\n",
    "transitor=GOPSForwardTransitor2()\n",
    "actor_enumerator=GOPSActorEnumerator()\n",
    "action_enumerator=GOPSActionEnumerator()\n",
    "start_state=GOPSState2({-1}, tuple(),tuple(), tuple(), 5)\n",
    "\n",
    "# create game simulator\n",
    "simulator = GameSimulator(transitor=transitor, actor_enumerator=actor_enumerator, action_enumerator=action_enumerator, start_state=start_state)\n",
    "\n",
    "# create evaluator\n",
    "evaluator = GOPSValueHeuristicsSSGEvaluator(simulator=simulator, num_batch_runs=1, players = {0,1}, against_benchmark=True)\n",
    "\n",
    "# create analyzer\n",
    "analyzer = HeuristicsAnalyzer()\n",
    "\n",
    "seed_functions = [(func_list[0], abstract_list[0]), (func_list[1], abstract_list[1]), (func_list[2], abstract_list[2])]\n",
    "\n",
    "# create evolver\n",
    "evolver = Evolver(evaluator=evaluator, proposer=proposer, analyzer=analyzer, seed_functions=seed_functions)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[0.0, -4.5, -2.5]\n"
     ]
    }
   ],
   "source": [
    "scores, notes = evaluator.evaluate([func_list[0], func_list[1], func_list[2]])\n",
    "print(scores)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(\"def evaluate_state(state) -> tuple[tuple[float, float], dict]:\\n    score_cards = state[0]\\n    player_0_played_cards = state[1]\\n    player_1_played_cards = state[2]\\n    is_turn = state[3]\\n    player_0_score = state[4]\\n    player_1_score = state[5]\\n    score_deck = state[6]\\n    player_0_hand = state[7]\\n    player_1_hand = state[8]\\n    \\n    # Calculate the potential scores for each player based on the remaining score cards\\n    player_potential_score = player_0_score\\n    opponent_potential_score = player_1_score\\n    \\n    if len(score_deck) > 0:\\n        remaining_score_cards = len(score_deck)\\n        if len(player_0_played_cards) > len(player_1_played_cards):\\n            player_potential_score += remaining_score_cards / 2\\n        elif len(player_1_played_cards) > len(player_0_played_cards):\\n            opponent_potential_score += remaining_score_cards / 2\\n    \\n    player_advantage = player_potential_score - opponent_potential_score\\n    \\n    return (player_potential_score, opponent_potential_score), {'player_advantage': player_advantage}\",\n",
       " ('Thoughts:\\n- In GOPS, the value of a state can be determined by the current total score of each player.\\n- The number of score cards remaining in the deck can also impact the value of a state, as it affects the potential for each player to increase their score.\\n- The difference in total scores between the two players can indicate the current advantage one player has over the other.\\n- The distribution of high-value score cards among the remaining cards can influence the potential for high-scoring rounds.\\n- The player who has won more rounds so far may have a higher chance of winning the game.\\n- The strategy of each player in terms of playing high or low cards can also affect the value of a state.\\n-----\\n\\nPseudocode:\\n```\\nfunction evaluate_state(player_score, opponent_score, remaining_score_cards, player_rounds_won, opponent_rounds_won):\\n    player_potential_score = player_score\\n    opponent_potential_score = opponent_score\\n    \\n    if player_rounds_won > opponent_rounds_won:\\n        player_potential_score += remaining_score_cards / 2\\n    elif opponent_rounds_won > player_rounds_won:\\n        opponent_potential_score += remaining_score_cards / 2\\n    \\n    player_advantage = player_potential_score - opponent_potential_score\\n    \\n    return (player_potential_score, opponent_potential_score, player_advantage)\\n```\\nThis function takes as input the current total scores of the player and opponent, the number of remaining score cards in the deck, the number of rounds won by each player, and calculates the potential scores for each player based on the remaining score cards. It also calculates the advantage one player has over the other based on their potential scores.',\n",
       "  \"--------------------------\\n    Example 0:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (4, 1)\\n    - The cards that player 0 has played are: (5,)\\n    - The cards that player 1 has played are: (4,)\\n    - Player 0's score so far is: 4\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: {2, 3, 5}\\n    - The cards left in player 0's hand are: {1, 2, 3, 4}\\n    - The cards left in player 1's hand are: {1, 2, 3, 5}\\n    \\n\\n    The function you generated returned the following values:\\n    {}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 3.0, 1: 0.0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 1.0, 1: -1.0}\\n    --------------------------\\n    --------------------------\\n    Example 1:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (4, 1)\\n    - The cards that player 0 has played are: (5, 4)\\n    - The cards that player 1 has played are: (4, 1)\\n    - Player 0's score so far is: 5\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: {2, 3, 5}\\n    - The cards left in player 0's hand are: {1, 2, 3}\\n    - The cards left in player 1's hand are: {2, 3, 5}\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 5, 1: -5}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_advantage': 5}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 5, 1: -5}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 1.0, 1: -1.0}\\n    --------------------------\\n    --------------------------\\n    Example 2:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (4, 1, 3, 5, 2)\\n    - The cards that player 0 has played are: (5, 4, 3, 1)\\n    - The cards that player 1 has played are: (4, 1, 2, 3)\\n    - Player 0's score so far is: 8\\n    - Player 1's score so far is: 5\\n    - The score cards left in the deck are: set()\\n    - The cards left in player 0's hand are: {2}\\n    - The cards left in player 1's hand are: {5}\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 3, 1: -3}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_advantage': 3}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 1, 1: -3}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 1.0, 1: -1.0}\\n    --------------------------\\n    --------------------------\\n    Example 3:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (4, 1, 3)\\n    - The cards that player 0 has played are: (5, 4, 3)\\n    - The cards that player 1 has played are: (4, 1, 2)\\n    - Player 0's score so far is: 8\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: {2, 5}\\n    - The cards left in player 0's hand are: {1, 2}\\n    - The cards left in player 1's hand are: {3, 5}\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 8, 1: -8}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_advantage': 8}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 8, 1: -8}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 1.0, 1: -1.0}\\n    --------------------------\\n    --------------------------\\n    Example 4:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (4, 1, 3, 5, 2)\\n    - The cards that player 0 has played are: (5, 4, 3, 1, 2)\\n    - The cards that player 1 has played are: (4, 1, 2, 3, 5)\\n    - Player 0's score so far is: 8\\n    - Player 1's score so far is: 7\\n    - The score cards left in the deck are: set()\\n    - The cards left in player 0's hand are: set()\\n    - The cards left in player 1's hand are: set()\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 1, 1: -1}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_advantage': 1}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0, 1: -1}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 1.0, 1: -1.0}\\n    --------------------------\\n    --------------------------\\n    Example 5:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (4, 1)\\n    - The cards that player 0 has played are: (5,)\\n    - The cards that player 1 has played are: (4,)\\n    - Player 0's score so far is: 4\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: {2, 3, 5}\\n    - The cards left in player 0's hand are: {1, 2, 3, 4}\\n    - The cards left in player 1's hand are: {1, 2, 3, 5}\\n    \\n\\n    The function you generated returned the following values:\\n    {}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 3.0, 1: 0.0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 1.0, 1: -1.0}\\n    --------------------------\\n    \",\n",
       "  0),\n",
       " 0.5)"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "evolver.get_fittest(1)[0]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "\"You are a function engineer trying to write a function that can evaluate the value of a state in a game. \\nThis is known as a value heuristic, and will be used in reinforcement learning and Monte Carlo Tree Search to evaluate the value of a state. \\nThe game you want to write a function for is GOPS (game of pure strategy), also known as Goofspiel. The game has two players, and is played with a deck of score cards. Each player is dealt the same hand of cards at the beginning. The goal of the game is to get a score higher than your opponent. At the beginning of each round, a score card is randomly drawn without replacement from the score deck. Then each player plays a card simultaneously from their hand. The player who plays the higher card wins the round and gets the score card. They add the score of the score card to their total score. If the two cards played are the same, the person who wins the next round will get both score cards. The game continues until all score cards have been played. The player with the highest total score wins the game.\\n\\n    Previously you generated the following function to evaluate the value of a state in the game of GOPS.\\n\\n    Previous function: \\n\\n    \\n Below is some feedback on how the function you generated performed when we tested it. Note that simulations involve high variance and the actual scores may not match the expected scores exactly.\\n    \\n    Feedback: \\nBased on the feedback given and the function you generated previously, what's one specific improvement we can make to the function to make it better? Be as specific and conrete as possible.\\n >>>>>>>>>>>>>>>>>>>>>>>>>> \\n\""
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "\"--------------------------\\n    Example 0:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3)\\n    - The cards that player 0 has played are: (2, 5)\\n    - The cards that player 1 has played are: (2, 5)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: {1, 4, 5}\\n    - The cards left in player 0's hand are: {1, 3, 4}\\n    - The cards left in player 1's hand are: {1, 3, 4}\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 5, 'opponent_potential_score': 5}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0.0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    --------------------------\\n    Example 1:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3, 4)\\n    - The cards that player 0 has played are: (2, 5)\\n    - The cards that player 1 has played are: (2, 5)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: {1, 5}\\n    - The cards left in player 0's hand are: {1, 3, 4}\\n    - The cards left in player 1's hand are: {1, 3, 4}\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 1, 'opponent_potential_score': 1}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0.0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    --------------------------\\n    Example 2:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3, 4)\\n    - The cards that player 0 has played are: (2, 5)\\n    - The cards that player 1 has played are: (2, 5)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: {1, 5}\\n    - The cards left in player 0's hand are: {1, 3, 4}\\n    - The cards left in player 1's hand are: {1, 3, 4}\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 1, 'opponent_potential_score': 1}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0.0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    --------------------------\\n    Example 3:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3, 4, 1, 5)\\n    - The cards that player 0 has played are: (2, 5, 4, 3, 1)\\n    - The cards that player 1 has played are: (2, 5, 4, 3, 1)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: set()\\n    - The cards left in player 0's hand are: set()\\n    - The cards left in player 1's hand are: set()\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 0, 'opponent_potential_score': 0}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    --------------------------\\n    Example 4:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3, 4, 1, 5)\\n    - The cards that player 0 has played are: (2, 5, 4, 3, 1)\\n    - The cards that player 1 has played are: (2, 5, 4, 3, 1)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: set()\\n    - The cards left in player 0's hand are: set()\\n    - The cards left in player 1's hand are: set()\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 0, 'opponent_potential_score': 0}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    --------------------------\\n    Example 5:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3, 4, 1, 5)\\n    - The cards that player 0 has played are: (2, 5, 4, 3, 1)\\n    - The cards that player 1 has played are: (2, 5, 4, 3, 1)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: set()\\n    - The cards left in player 0's hand are: set()\\n    - The cards left in player 1's hand are: set()\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 0, 'opponent_potential_score': 0}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    --------------------------\\n    Example 6:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3, 4, 1)\\n    - The cards that player 0 has played are: (2, 5, 4)\\n    - The cards that player 1 has played are: (2, 5, 4)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: {5}\\n    - The cards left in player 0's hand are: {1, 3}\\n    - The cards left in player 1's hand are: {1, 3}\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 0, 'opponent_potential_score': 0}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0.0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    --------------------------\\n    Example 7:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3, 4, 1, 5)\\n    - The cards that player 0 has played are: (2, 5, 4, 3)\\n    - The cards that player 1 has played are: (2, 5, 4, 3)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: set()\\n    - The cards left in player 0's hand are: {1}\\n    - The cards left in player 1's hand are: {1}\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 0, 'opponent_potential_score': 0}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    --------------------------\\n    Example 8:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3, 4, 1)\\n    - The cards that player 0 has played are: (2, 5, 4)\\n    - The cards that player 1 has played are: (2, 5, 4)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: {5}\\n    - The cards left in player 0's hand are: {1, 3}\\n    - The cards left in player 1's hand are: {1, 3}\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 0, 'opponent_potential_score': 0}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0.0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    --------------------------\\n    Example 9:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3)\\n    - The cards that player 0 has played are: (2, 5)\\n    - The cards that player 1 has played are: (2, 5)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: {1, 4, 5}\\n    - The cards left in player 0's hand are: {1, 3, 4}\\n    - The cards left in player 1's hand are: {1, 3, 4}\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 5, 'opponent_potential_score': 5}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0.0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    \""
      ]
     },
     "execution_count": 21,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "analyzer.num_samples = 10\n",
    "feedback0 = analyzer.translate(notes[0])\n",
    "feedback0"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "We want to generate $k$ possible improvements now based on the feedback, function, and function abstract. These improvements should be as specific as possible"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[\"1.) One specific improvement that can be made to the function is to incorporate a more sophisticated strategy for evaluating the potential score of each player. This could involve considering the distribution of score cards remaining in the deck, as well as the cards already played and the cards remaining in each player's hand. By taking into account the probabilities of different card combinations and potential outcomes, the function can provide a more accurate evaluation of the state. This could potentially involve using statistical methods or machine learning techniques to estimate the potential score more effectively.\"]"
      ]
     },
     "execution_count": 23,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "prompt_imp = gen_specific_improvement_prompt(func_list[0], feedback0, num_improvements=1)\n",
    "gpt.generate(prompt_imp, 1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "\"You are a function engineer trying to write a function that can evaluate the value of a state in a game. This is known as a value heuristic, and will be used in lookahead search algorithms to evaluate the value of unexplored states. Your goal is to develop a heuristic that is as accurate as possible without being too expensive to compute. Hence, you are not allowed to runs simulations in the function.\\nThe game you want to write a function for is GOPS (game of pure strategy), also known as Goofspiel. The game has two players, and is played with a deck of score cards. Each player is dealt the same hand of cards at the beginning. The goal of the game is to get a score higher than your opponent. At the beginning of each round, a score card is randomly drawn without replacement from the score deck. Then each player plays a card simultaneously from their hand. The player who plays the higher card wins the round and gets the score card. They add the score of the score card to their total score. If the two cards played are the same, the person who wins the next round will get both score cards. The game continues until all score cards have been played. The player with the highest total score wins the game.\\nPreviously you generated the following function to evaluate the value of a state in the game of GOPS.\\n\\n    Previous function: \\ndef evaluate_state(state) -> tuple[tuple[float, float], dict]:\\n    score_cards = state[0]\\n    player_0_played_cards = state[1]\\n    player_1_played_cards = state[2]\\n    is_turn = state[3]\\n    player_0_score = state[4]\\n    player_1_score = state[5]\\n    score_deck = state[6]\\n    player_0_hand = state[7]\\n    player_1_hand = state[8]\\n    \\n    # Calculate the total score of each player\\n    def calculate_total_score(state, player):\\n        if player == 0:\\n            return state[4]\\n        else:\\n            return state[5]\\n    \\n    # Get the remaining score cards in the deck\\n    remaining_score_cards = set(score_deck)\\n    \\n    # Calculate the potential score for a player based on their current state\\n    def calculate_potential_score(player_score, player_hand, remaining_score_cards):\\n        potential_score = player_score\\n        for card in player_hand:\\n            if card in remaining_score_cards:\\n                potential_score += card\\n        return potential_score\\n    \\n    # Evaluate the potential value of the state\\n    player_potential_score = calculate_potential_score(player_0_score, player_0_hand, remaining_score_cards)\\n    opponent_potential_score = calculate_potential_score(player_1_score, player_1_hand, remaining_score_cards)\\n    \\n    return (player_potential_score, opponent_potential_score), {'player_potential_score': player_potential_score, 'opponent_potential_score': opponent_potential_score}\\n Below is some feedback on how the function you generated performed when we tested it. Note that simulations involve high variance and the actual scores may not match the expected scores exactly.\\n    \\n    Feedback: \\n--------------------------\\n    Example 0:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3)\\n    - The cards that player 0 has played are: (2, 5)\\n    - The cards that player 1 has played are: (2, 5)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: {1, 4, 5}\\n    - The cards left in player 0's hand are: {1, 3, 4}\\n    - The cards left in player 1's hand are: {1, 3, 4}\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 5, 'opponent_potential_score': 5}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0.0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    --------------------------\\n    Example 1:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3, 4)\\n    - The cards that player 0 has played are: (2, 5)\\n    - The cards that player 1 has played are: (2, 5)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: {1, 5}\\n    - The cards left in player 0's hand are: {1, 3, 4}\\n    - The cards left in player 1's hand are: {1, 3, 4}\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 1, 'opponent_potential_score': 1}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0.0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    --------------------------\\n    Example 2:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3, 4)\\n    - The cards that player 0 has played are: (2, 5)\\n    - The cards that player 1 has played are: (2, 5)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: {1, 5}\\n    - The cards left in player 0's hand are: {1, 3, 4}\\n    - The cards left in player 1's hand are: {1, 3, 4}\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 1, 'opponent_potential_score': 1}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0.0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    --------------------------\\n    Example 3:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3, 4, 1, 5)\\n    - The cards that player 0 has played are: (2, 5, 4, 3, 1)\\n    - The cards that player 1 has played are: (2, 5, 4, 3, 1)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: set()\\n    - The cards left in player 0's hand are: set()\\n    - The cards left in player 1's hand are: set()\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 0, 'opponent_potential_score': 0}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    --------------------------\\n    Example 4:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3, 4, 1, 5)\\n    - The cards that player 0 has played are: (2, 5, 4, 3, 1)\\n    - The cards that player 1 has played are: (2, 5, 4, 3, 1)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: set()\\n    - The cards left in player 0's hand are: set()\\n    - The cards left in player 1's hand are: set()\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 0, 'opponent_potential_score': 0}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    --------------------------\\n    Example 5:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3, 4, 1, 5)\\n    - The cards that player 0 has played are: (2, 5, 4, 3, 1)\\n    - The cards that player 1 has played are: (2, 5, 4, 3, 1)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: set()\\n    - The cards left in player 0's hand are: set()\\n    - The cards left in player 1's hand are: set()\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 0, 'opponent_potential_score': 0}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    --------------------------\\n    Example 6:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3, 4, 1)\\n    - The cards that player 0 has played are: (2, 5, 4)\\n    - The cards that player 1 has played are: (2, 5, 4)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: {5}\\n    - The cards left in player 0's hand are: {1, 3}\\n    - The cards left in player 1's hand are: {1, 3}\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 0, 'opponent_potential_score': 0}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0.0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    --------------------------\\n    Example 7:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3, 4, 1, 5)\\n    - The cards that player 0 has played are: (2, 5, 4, 3)\\n    - The cards that player 1 has played are: (2, 5, 4, 3)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: set()\\n    - The cards left in player 0's hand are: {1}\\n    - The cards left in player 1's hand are: {1}\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 0, 'opponent_potential_score': 0}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    --------------------------\\n    Example 8:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3, 4, 1)\\n    - The cards that player 0 has played are: (2, 5, 4)\\n    - The cards that player 1 has played are: (2, 5, 4)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: {5}\\n    - The cards left in player 0's hand are: {1, 3}\\n    - The cards left in player 1's hand are: {1, 3}\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 0, 'opponent_potential_score': 0}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0.0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    --------------------------\\n    Example 9:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3)\\n    - The cards that player 0 has played are: (2, 5)\\n    - The cards that player 1 has played are: (2, 5)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: {1, 4, 5}\\n    - The cards left in player 0's hand are: {1, 3, 4}\\n    - The cards left in player 1's hand are: {1, 3, 4}\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 5, 'opponent_potential_score': 5}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0.0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    \\n Based on the feedback given and the function you generated previously, what are 1 specific improvement we can make to the function to make it better? Be as specific and concrete as possible, and enumerate each improvement using 1.), 2.), ...\\n\""
      ]
     },
     "execution_count": 24,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "prompt_imp"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "\"You are a function engineer trying to write a function that can evaluate the value of a state in a game. \\nThis is known as a value heuristic, and will be used in reinforcement learning and Monte Carlo Tree Search to evaluate the value of a state. \\nThe game you want to write a function for is GOPS (game of pure strategy), also known as Goofspiel. The game has two players, and is played with a deck of score cards. Each player is dealt the same hand of cards at the beginning. The goal of the game is to get a score higher than your opponent. At the beginning of each round, a score card is randomly drawn without replacement from the score deck. Then each player plays a card simultaneously from their hand. The player who plays the higher card wins the round and gets the score card. They add the score of the score card to their total score. If the two cards played are the same, the person who wins the next round will get both score cards. The game continues until all score cards have been played. The player with the highest total score wins the game.\\n\\n    Previously you generated the following function to evaluate the value of a state in the game of GOPS.\\n\\n    Previous function: \\n\\n    def evaluate_state(state) -> tuple[tuple[float, float], dict]:\\n    score_cards = state[0]\\n    player_0_played_cards = state[1]\\n    player_1_played_cards = state[2]\\n    is_turn = state[3]\\n    player_0_score = state[4]\\n    player_1_score = state[5]\\n    score_deck = state[6]\\n    player_0_hand = state[7]\\n    player_1_hand = state[8]\\n    \\n    # Calculate the total score of each player\\n    def calculate_total_score(state, player):\\n        if player == 0:\\n            return state[4]\\n        else:\\n            return state[5]\\n    \\n    # Get the remaining score cards in the deck\\n    remaining_score_cards = set(score_deck)\\n    \\n    # Calculate the potential score for a player based on their current state\\n    def calculate_potential_score(player_score, player_hand, remaining_score_cards):\\n        potential_score = player_score\\n        for card in player_hand:\\n            if card in remaining_score_cards:\\n                potential_score += card\\n        return potential_score\\n    \\n    # Evaluate the potential value of the state\\n    player_potential_score = calculate_potential_score(player_0_score, player_0_hand, remaining_score_cards)\\n    opponent_potential_score = calculate_potential_score(player_1_score, player_1_hand, remaining_score_cards)\\n    \\n    return (player_potential_score, opponent_potential_score), {'player_potential_score': player_potential_score, 'opponent_potential_score': opponent_potential_score}\\n Below is some feedback on how the function you generated performed when we tested it. Note that simulations involve high variance and the actual scores may not match the expected scores exactly.\\n    \\n    Feedback: \\n--------------------------\\n    Example 0:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3, 4)\\n    - The cards that player 0 has played are: (2, 5)\\n    - The cards that player 1 has played are: (2, 5)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: {1, 5}\\n    - The cards left in player 0's hand are: {1, 3, 4}\\n    - The cards left in player 1's hand are: {1, 3, 4}\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 1, 'opponent_potential_score': 1}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0.0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    --------------------------\\n    Example 1:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3, 4, 1, 5)\\n    - The cards that player 0 has played are: (2, 5, 4, 3, 1)\\n    - The cards that player 1 has played are: (2, 5, 4, 3, 1)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: set()\\n    - The cards left in player 0's hand are: set()\\n    - The cards left in player 1's hand are: set()\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 0, 'opponent_potential_score': 0}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    --------------------------\\n    Example 2:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3, 4, 1, 5)\\n    - The cards that player 0 has played are: (2, 5, 4, 3)\\n    - The cards that player 1 has played are: (2, 5, 4, 3)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: set()\\n    - The cards left in player 0's hand are: {1}\\n    - The cards left in player 1's hand are: {1}\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 0, 'opponent_potential_score': 0}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    --------------------------\\n    Example 3:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3)\\n    - The cards that player 0 has played are: (2,)\\n    - The cards that player 1 has played are: (2,)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: {1, 4, 5}\\n    - The cards left in player 0's hand are: {1, 3, 4, 5}\\n    - The cards left in player 1's hand are: {1, 3, 4, 5}\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 10, 'opponent_potential_score': 10}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0.0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    --------------------------\\n    Example 4:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3, 4, 1, 5)\\n    - The cards that player 0 has played are: (2, 5, 4, 3)\\n    - The cards that player 1 has played are: (2, 5, 4, 3)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: set()\\n    - The cards left in player 0's hand are: {1}\\n    - The cards left in player 1's hand are: {1}\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 0, 'opponent_potential_score': 0}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    --------------------------\\n    Example 5:\\n    The state you were trying to estimate a value for is:\\n    The state of a GOPS (game of pure strategy) game is as follows:\\n    - The score cards that have been revealed are: (2, 3, 4, 1, 5)\\n    - The cards that player 0 has played are: (2, 5, 4, 3, 1)\\n    - The cards that player 1 has played are: (2, 5, 4, 3, 1)\\n    - Player 0's score so far is: 0\\n    - Player 1's score so far is: 0\\n    - The score cards left in the deck are: set()\\n    - The cards left in player 0's hand are: set()\\n    - The cards left in player 1's hand are: set()\\n    \\n\\n    The function you generated returned the following values:\\n    {0: 0, 1: 0}\\n    for the expected end of game scores of the players. \\n\\n    Some intermediate values that you used to calculate the scores were:\\n    {'player_potential_score': 0, 'opponent_potential_score': 0}\\n\\n    The estimated end of game scores of the players using lookahead search with your function was:\\n    {0: 0, 1: 0}\\n\\n    The actual scores of the players at the end of the game in the simulation were:\\n    {0: 0.0, 1: 0.0}\\n    --------------------------\\n    Please think about what conclusions we can draw from this feedback. What parts of the function do you think we can adjust so that it performs better? Be concrete and specific, citing the feedback examples given.\\n >>>>>>>>>>>>>>>>>>>>>>>>>> \\n\""
      ]
     },
     "execution_count": 13,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "gen_feedback_analyze_prompt(func_list[0], feedback0)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "LLMgames",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.5"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
