{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 32,
   "id": "e03983c0",
   "metadata": {},
   "outputs": [],
   "source": [
    "from alfworld.agents.environment.alfred_tw_env import AlfredTWEnv\n",
    "import numpy as np\n",
    "from pettingllms.multi_agent_env.alfworld.utils import load_config_file"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "id": "6ed78341",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Initializing AlfredTWEnv...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "100%|██████████| 8810/8810 [00:04<00:00, 1929.96it/s]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Overall we have 790 games in split=train\n",
      "Training with 790 games\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\n"
     ]
    }
   ],
   "source": [
    "\n",
    "config = load_config_file()\n",
    "#env_type = config['env']['type']\n",
    "base_env = AlfredTWEnv(config, train_eval='train')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 41,
   "id": "51e7f17c",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Task description: ('-= Welcome to TextWorld, ALFRED! =-\\n\\nYou are in the middle of a room. Looking quickly around you, you see a bathtubbasin 1, a countertop 2, a countertop 1, a drawer 4, a drawer 3, a drawer 2, a drawer 1, a garbagecan 1, a handtowelholder 1, a sinkbasin 1, a toilet 1, a toiletpaperhanger 1, a towelholder 2, and a towelholder 1.\\n\\nYour task is to: put a candle in drawer.',)\n",
      "==================================================\n",
      "Step 1: action=go to drawer 4, reward=0, done=False\n",
      "Step 2: action=go to handtowelholder 1, reward=0, done=False\n",
      "Step 3: action=go to drawer 3, reward=0, done=False\n",
      "Step 4: action=go to drawer 2, reward=0, done=False\n",
      "Step 5: action=go to drawer 4, reward=0, done=False\n",
      "Step 6: action=go to sinkbasin 1, reward=0, done=False\n",
      "Step 7: action=go to drawer 3, reward=0, done=False\n",
      "Step 8: action=open drawer 3, reward=0, done=False\n",
      "Step 9: action=go to towelholder 1, reward=0, done=False\n",
      "Step 10: action=go to toiletpaperhanger 1, reward=0, done=False\n",
      "Step 11: action=examine toiletpaperhanger 1, reward=0, done=False\n",
      "Step 12: action=go to toilet 1, reward=0, done=False\n",
      "Step 13: action=go to drawer 3, reward=0, done=False\n",
      "Step 14: action=go to handtowelholder 1, reward=0, done=False\n",
      "Step 15: action=go to sinkbasin 1, reward=0, done=False\n",
      "Step 16: action=go to handtowelholder 1, reward=0, done=False\n",
      "Step 17: action=go to drawer 4, reward=0, done=False\n",
      "Step 18: action=go to bathtubbasin 1, reward=0, done=False\n",
      "Step 19: action=go to towelholder 2, reward=0, done=False\n",
      "Step 20: action=go to countertop 2, reward=0, done=False\n",
      "==================================================\n",
      "Total reward: 0\n"
     ]
    }
   ],
   "source": [
    "env=base_env.init_env(batch_size=1)\n",
    "# 4. Reset 环境\n",
    "obs, infos = env.reset()\n",
    "done = False\n",
    "step_count = 0\n",
    "total_reward = 0\n",
    "\n",
    "print(\"Task description:\", obs)\n",
    "print(\"=\"*50)\n",
    "\n",
    "# 5. 随机 roll out，打印 reward\n",
    "while not done and step_count < 20:   # 最多跑 20 步\n",
    "    random_action = np.random.choice(infos['admissible_commands'][0])\n",
    "    action = random_action  # 随便取一个可行动作\n",
    "    obs, reward, done_list, infos = env.step([action])\n",
    "    done = done_list[0]\n",
    "    step_count += 1\n",
    "    total_reward += reward[0]\n",
    "    print(f\"Step {step_count}: action={action}, reward={reward[0]}, done={done_list[0]}\")\n",
    "\n",
    "print(\"=\"*50)\n",
    "print(\"Total reward:\", total_reward)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "954612e6",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "('-= Welcome to TextWorld, ALFRED! =-\\n\\nYou are in the middle of a room. Looking quickly around you, you see a bathtubbasin 1, a countertop 2, a countertop 1, a drawer 4, a drawer 3, a drawer 2, a drawer 1, a garbagecan 1, a handtowelholder 1, a sinkbasin 1, a toilet 1, a toiletpaperhanger 1, a towelholder 2, and a towelholder 1.\\n\\nYour task is to: put some soapbottle on garbagecan.',)\n"
     ]
    }
   ],
   "source": [
    "env=base_env.init_env(batch_size=1)\n",
    "env.seed(0)\n",
    "obs, infos=env.reset()\n",
    "print(obs)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "9824ae4a",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "{'won': [False], 'extra.gamefile': ['/home/lah003/.cache/alfworld/json_2.1.1/train/pick_and_place_simple-SoapBottle-None-GarbageCan-411/trial_T20190908_051634_985936/game.tw-pddl'], 'admissible_commands': [['go to bathtubbasin 1', 'go to countertop 1', 'go to countertop 2', 'go to drawer 1', 'go to drawer 2', 'go to drawer 3', 'go to drawer 4', 'go to garbagecan 1', 'go to handtowelholder 1', 'go to sinkbasin 1', 'go to toilet 1', 'go to toiletpaperhanger 1', 'go to towelholder 1', 'go to towelholder 2', 'help', 'inventory', 'look']], 'facts': [[Proposition('pickupable', (Variable('cloth 2', 'object'),)), Proposition('pickupable', (Variable('candle 1', 'object'),)), Proposition('pickupable', (Variable('soapbottle 1', 'object'),)), Proposition('pickupable', (Variable('towel 1', 'object'),)), Proposition('pickupable', (Variable('scrubbrush 1', 'object'),)), Proposition('pickupable', (Variable('cloth 1', 'object'),)), Proposition('pickupable', (Variable('soapbar 1', 'object'),)), Proposition('pickupable', (Variable('soapbottle 2', 'object'),)), Proposition('pickupable', (Variable('handtowel 1', 'object'),)), Proposition('pickupable', (Variable('toiletpaper 2', 'object'),)), Proposition('pickupable', (Variable('plunger 1', 'object'),)), Proposition('pickupable', (Variable('cloth 3', 'object'),)), Proposition('pickupable', (Variable('toiletpaper 1', 'object'),)), Proposition('pickupable', (Variable('candle 2', 'object'),)), Proposition('pickupable', (Variable('spraybottle 1', 'object'),)), Proposition('receptacletype', (Variable('drawer 4', 'receptacle'), Variable('drawertype ', 'rtype'))), Proposition('receptacletype', (Variable('toiletpaperhanger 1', 'receptacle'), Variable('toiletpaperhangertype ', 'rtype'))), Proposition('receptacletype', (Variable('handtowelholder 1', 'receptacle'), Variable('handtowelholdertype ', 'rtype'))), Proposition('receptacletype', (Variable('towelholder 2', 'receptacle'), Variable('towelholdertype ', 'rtype'))), Proposition('receptacletype', (Variable('countertop 2', 'receptacle'), Variable('countertoptype ', 'rtype'))), Proposition('receptacletype', (Variable('bathtubbasin 1', 'receptacle'), Variable('bathtubbasintype ', 'rtype'))), Proposition('receptacletype', (Variable('garbagecan 1', 'receptacle'), Variable('garbagecantype ', 'rtype'))), Proposition('receptacletype', (Variable('countertop 1', 'receptacle'), Variable('countertoptype ', 'rtype'))), Proposition('receptacletype', (Variable('drawer 2', 'receptacle'), Variable('drawertype ', 'rtype'))), Proposition('receptacletype', (Variable('drawer 1', 'receptacle'), Variable('drawertype ', 'rtype'))), Proposition('receptacletype', (Variable('towelholder 1', 'receptacle'), Variable('towelholdertype ', 'rtype'))), Proposition('receptacletype', (Variable('toilet 1', 'receptacle'), Variable('toilettype ', 'rtype'))), Proposition('receptacletype', (Variable('drawer 3', 'receptacle'), Variable('drawertype ', 'rtype'))), Proposition('receptacletype', (Variable('sinkbasin 1', 'receptacle'), Variable('sinkbasintype ', 'rtype'))), Proposition('cancontain', (Variable('bathtubbasintype ', 'rtype'), Variable('handtoweltype ', 'otype'))), Proposition('cancontain', (Variable('garbagecantype ', 'rtype'), Variable('handtoweltype ', 'otype'))), Proposition('cancontain', (Variable('garbagecantype ', 'rtype'), Variable('spraybottletype ', 'otype'))), Proposition('cancontain', (Variable('handtowelholdertype ', 'rtype'), Variable('handtoweltype ', 'otype'))), Proposition('cancontain', (Variable('garbagecantype ', 'rtype'), Variable('toiletpapertype ', 'otype'))), Proposition('cancontain', (Variable('countertoptype ', 'rtype'), Variable('soapbartype ', 'otype'))), Proposition('cancontain', (Variable('toilettype ', 'rtype'), Variable('soapbartype ', 'otype'))), Proposition('cancontain', (Variable('drawertype ', 'rtype'), Variable('toiletpapertype ', 'otype'))), Proposition('cancontain', (Variable('drawertype ', 'rtype'), Variable('spraybottletype ', 'otype'))), Proposition('cancontain', (Variable('countertoptype ', 'rtype'), Variable('clothtype ', 'otype'))), Proposition('cancontain', (Variable('towelholdertype ', 'rtype'), Variable('toweltype ', 'otype'))), Proposition('cancontain', (Variable('toilettype ', 'rtype'), Variable('clothtype ', 'otype'))), Proposition('cancontain', (Variable('drawertype ', 'rtype'), Variable('candletype ', 'otype'))), Proposition('cancontain', (Variable('countertoptype ', 'rtype'), Variable('spraybottletype ', 'otype'))), Proposition('cancontain', (Variable('garbagecantype ', 'rtype'), Variable('soapbartype ', 'otype'))), Proposition('cancontain', (Variable('drawertype ', 'rtype'), Variable('handtoweltype ', 'otype'))), Proposition('cancontain', (Variable('countertoptype ', 'rtype'), Variable('toiletpapertype ', 'otype'))), Proposition('cancontain', (Variable('garbagecantype ', 'rtype'), Variable('clothtype ', 'otype'))), Proposition('cancontain', (Variable('toilettype ', 'rtype'), Variable('toiletpapertype ', 'otype'))), Proposition('cancontain', (Variable('bathtubbasintype ', 'rtype'), Variable('clothtype ', 'otype'))), Proposition('cancontain', (Variable('toilettype ', 'rtype'), Variable('spraybottletype ', 'otype'))), Proposition('cancontain', (Variable('sinkbasintype ', 'rtype'), Variable('handtoweltype ', 'otype'))), Proposition('cancontain', (Variable('countertoptype ', 'rtype'), Variable('candletype ', 'otype'))), Proposition('cancontain', (Variable('garbagecantype ', 'rtype'), Variable('soapbottletype ', 'otype'))), Proposition('cancontain', (Variable('toilettype ', 'rtype'), Variable('candletype ', 'otype'))), Proposition('cancontain', (Variable('drawertype ', 'rtype'), Variable('soapbottletype ', 'otype'))), Proposition('cancontain', (Variable('bathtubbasintype ', 'rtype'), Variable('soapbartype ', 'otype'))), Proposition('cancontain', (Variable('countertoptype ', 'rtype'), Variable('handtoweltype ', 'otype'))), Proposition('cancontain', (Variable('toilettype ', 'rtype'), Variable('handtoweltype ', 'otype'))), Proposition('cancontain', (Variable('drawertype ', 'rtype'), Variable('soapbartype ', 'otype'))), Proposition('cancontain', (Variable('drawertype ', 'rtype'), Variable('clothtype ', 'otype'))), Proposition('cancontain', (Variable('sinkbasintype ', 'rtype'), Variable('soapbartype ', 'otype'))), Proposition('cancontain', (Variable('toiletpaperhangertype ', 'rtype'), Variable('toiletpapertype ', 'otype'))), Proposition('cancontain', (Variable('sinkbasintype ', 'rtype'), Variable('clothtype ', 'otype'))), Proposition('cancontain', (Variable('countertoptype ', 'rtype'), Variable('soapbottletype ', 'otype'))), Proposition('cancontain', (Variable('toilettype ', 'rtype'), Variable('soapbottletype ', 'otype'))), Proposition('receptacleatlocation', (Variable('drawer 1', 'receptacle'), Variable('loc 9', 'location'))), Proposition('receptacleatlocation', (Variable('drawer 3', 'receptacle'), Variable('loc 10', 'location'))), Proposition('receptacleatlocation', (Variable('towelholder 1', 'receptacle'), Variable('loc 21', 'location'))), Proposition('receptacleatlocation', (Variable('drawer 2', 'receptacle'), Variable('loc 12', 'location'))), Proposition('receptacleatlocation', (Variable('countertop 2', 'receptacle'), Variable('loc 4', 'location'))), Proposition('receptacleatlocation', (Variable('towelholder 2', 'receptacle'), Variable('loc 20', 'location'))), Proposition('receptacleatlocation', (Variable('garbagecan 1', 'receptacle'), Variable('loc 17', 'location'))), Proposition('receptacleatlocation', (Variable('sinkbasin 1', 'receptacle'), Variable('loc 19', 'location'))), Proposition('receptacleatlocation', (Variable('drawer 4', 'receptacle'), Variable('loc 6', 'location'))), Proposition('receptacleatlocation', (Variable('bathtubbasin 1', 'receptacle'), Variable('loc 11', 'location'))), Proposition('receptacleatlocation', (Variable('toilet 1', 'receptacle'), Variable('loc 2', 'location'))), Proposition('receptacleatlocation', (Variable('handtowelholder 1', 'receptacle'), Variable('loc 16', 'location'))), Proposition('receptacleatlocation', (Variable('toiletpaperhanger 1', 'receptacle'), Variable('loc 5', 'location'))), Proposition('receptacleatlocation', (Variable('countertop 1', 'receptacle'), Variable('loc 14', 'location'))), Proposition('openable', (Variable('drawer 1', 'receptacle'),)), Proposition('openable', (Variable('drawer 3', 'receptacle'),)), Proposition('openable', (Variable('drawer 4', 'receptacle'),)), Proposition('openable', (Variable('drawer 2', 'receptacle'),)), Proposition('inreceptacle', (Variable('toiletpaper 1', 'object'), Variable('toiletpaperhanger 1', 'receptacle'))), Proposition('inreceptacle', (Variable('sink 1', 'object'), Variable('sinkbasin 1', 'receptacle'))), Proposition('inreceptacle', (Variable('cloth 3', 'object'), Variable('bathtubbasin 1', 'receptacle'))), Proposition('inreceptacle', (Variable('spraybottle 1', 'object'), Variable('toilet 1', 'receptacle'))), Proposition('inreceptacle', (Variable('candle 2', 'object'), Variable('drawer 1', 'receptacle'))), Proposition('inreceptacle', (Variable('toiletpaper 2', 'object'), Variable('toilet 1', 'receptacle'))), Proposition('inreceptacle', (Variable('cloth 1', 'object'), Variable('countertop 2', 'receptacle'))), Proposition('inreceptacle', (Variable('towel 1', 'object'), Variable('towelholder 1', 'receptacle'))), Proposition('inreceptacle', (Variable('soapbar 1', 'object'), Variable('countertop 2', 'receptacle'))), Proposition('inreceptacle', (Variable('soapbottle 2', 'object'), Variable('countertop 2', 'receptacle'))), Proposition('inreceptacle', (Variable('candle 1', 'object'), Variable('drawer 3', 'receptacle'))), Proposition('inreceptacle', (Variable('bathtub 1', 'object'), Variable('bathtubbasin 1', 'receptacle'))), Proposition('inreceptacle', (Variable('soapbottle 1', 'object'), Variable('countertop 1', 'receptacle'))), Proposition('inreceptacle', (Variable('handtowel 1', 'object'), Variable('handtowelholder 1', 'receptacle'))), Proposition('inreceptacle', (Variable('cloth 2', 'object'), Variable('bathtubbasin 1', 'receptacle'))), Proposition('objectatlocation', (Variable('window 1', 'object'), Variable('loc 5', 'location'))), Proposition('objectatlocation', (Variable('soapbottle 2', 'object'), Variable('loc 4', 'location'))), Proposition('objectatlocation', (Variable('spraybottle 1', 'object'), Variable('loc 2', 'location'))), Proposition('objectatlocation', (Variable('bathtub 1', 'object'), Variable('loc 11', 'location'))), Proposition('objectatlocation', (Variable('window 2', 'object'), Variable('loc 7', 'location'))), Proposition('objectatlocation', (Variable('soapbottle 1', 'object'), Variable('loc 14', 'location'))), Proposition('objectatlocation', (Variable('candle 1', 'object'), Variable('loc 10', 'location'))), Proposition('objectatlocation', (Variable('cloth 1', 'object'), Variable('loc 4', 'location'))), Proposition('objectatlocation', (Variable('cloth 3', 'object'), Variable('loc 11', 'location'))), Proposition('objectatlocation', (Variable('lightswitch 1', 'object'), Variable('loc 15', 'location'))), Proposition('objectatlocation', (Variable('showerdoor 1', 'object'), Variable('loc 3', 'location'))), Proposition('objectatlocation', (Variable('toiletpaper 2', 'object'), Variable('loc 2', 'location'))), Proposition('objectatlocation', (Variable('scrubbrush 1', 'object'), Variable('loc 1', 'location'))), Proposition('objectatlocation', (Variable('sink 1', 'object'), Variable('loc 19', 'location'))), Proposition('objectatlocation', (Variable('mirror 1', 'object'), Variable('loc 18', 'location'))), Proposition('objectatlocation', (Variable('plunger 1', 'object'), Variable('loc 1', 'location'))), Proposition('objectatlocation', (Variable('showerglass 1', 'object'), Variable('loc 8', 'location'))), Proposition('objectatlocation', (Variable('soapbar 1', 'object'), Variable('loc 4', 'location'))), Proposition('objectatlocation', (Variable('candle 2', 'object'), Variable('loc 9', 'location'))), Proposition('objectatlocation', (Variable('cloth 2', 'object'), Variable('loc 11', 'location'))), Proposition('objectatlocation', (Variable('toiletpaper 1', 'object'), Variable('loc 5', 'location'))), Proposition('objectatlocation', (Variable('handtowel 1', 'object'), Variable('loc 16', 'location'))), Proposition('objectatlocation', (Variable('towel 1', 'object'), Variable('loc 21', 'location'))), Proposition('objecttype', (Variable('showerglass 1', 'object'), Variable('showerglasstype ', 'otype'))), Proposition('objecttype', (Variable('cloth 2', 'object'), Variable('clothtype ', 'otype'))), Proposition('objecttype', (Variable('cloth 1', 'object'), Variable('clothtype ', 'otype'))), Proposition('objecttype', (Variable('showerdoor 1', 'object'), Variable('showerdoortype ', 'otype'))), Proposition('objecttype', (Variable('window 2', 'object'), Variable('windowtype ', 'otype'))), Proposition('objecttype', (Variable('soapbottle 1', 'object'), Variable('soapbottletype ', 'otype'))), Proposition('objecttype', (Variable('soapbar 1', 'object'), Variable('soapbartype ', 'otype'))), Proposition('objecttype', (Variable('sink 1', 'object'), Variable('sinktype ', 'otype'))), Proposition('objecttype', (Variable('lightswitch 1', 'object'), Variable('lightswitchtype ', 'otype'))), Proposition('objecttype', (Variable('candle 2', 'object'), Variable('candletype ', 'otype'))), Proposition('objecttype', (Variable('toiletpaper 2', 'object'), Variable('toiletpapertype ', 'otype'))), Proposition('objecttype', (Variable('cloth 3', 'object'), Variable('clothtype ', 'otype'))), Proposition('objecttype', (Variable('scrubbrush 1', 'object'), Variable('scrubbrushtype ', 'otype'))), Proposition('objecttype', (Variable('plunger 1', 'object'), Variable('plungertype ', 'otype'))), Proposition('objecttype', (Variable('bathtub 1', 'object'), Variable('bathtubtype ', 'otype'))), Proposition('objecttype', (Variable('towel 1', 'object'), Variable('toweltype ', 'otype'))), Proposition('objecttype', (Variable('handtowel 1', 'object'), Variable('handtoweltype ', 'otype'))), Proposition('objecttype', (Variable('soapbottle 2', 'object'), Variable('soapbottletype ', 'otype'))), Proposition('objecttype', (Variable('window 1', 'object'), Variable('windowtype ', 'otype'))), Proposition('objecttype', (Variable('spraybottle 1', 'object'), Variable('spraybottletype ', 'otype'))), Proposition('objecttype', (Variable('toiletpaper 1', 'object'), Variable('toiletpapertype ', 'otype'))), Proposition('objecttype', (Variable('mirror 1', 'object'), Variable('mirrortype ', 'otype'))), Proposition('objecttype', (Variable('candle 1', 'object'), Variable('candletype ', 'otype'))), Proposition('cleanable', (Variable('cloth 2', 'object'),)), Proposition('cleanable', (Variable('cloth 1', 'object'),)), Proposition('cleanable', (Variable('cloth 3', 'object'),)), Proposition('cleanable', (Variable('soapbar 1', 'object'),)), Proposition('atlocation', (Variable('agent1 ', 'agent'), Variable('loc 13', 'location')))]], 'extra.expert_plan': [['look']]}\n"
     ]
    }
   ],
   "source": [
    "\n",
    "print(infos)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "e88f5642",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[['go to bathtubbasin 1', 'go to countertop 1', 'go to countertop 2', 'go to drawer 1', 'go to drawer 2', 'go to drawer 3', 'go to drawer 4', 'go to garbagecan 1', 'go to handtowelholder 1', 'go to sinkbasin 1', 'go to toilet 1', 'go to toiletpaperhanger 1', 'go to towelholder 1', 'go to towelholder 2', 'help', 'inventory', 'look']]\n"
     ]
    }
   ],
   "source": [
    "print(infos['admissible_commands'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "1d6e3e06",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[False]\n"
     ]
    }
   ],
   "source": [
    "print(infos['won'])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "49a39feb",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "{'won': [False], 'extra.gamefile': [None], 'admissible_commands': [['go to bathtubbasin 1', 'go to countertop 1', 'go to countertop 2', 'go to drawer 1', 'go to drawer 2', 'go to drawer 3', 'go to drawer 4', 'go to garbagecan 1', 'go to handtowelholder 1', 'go to sinkbasin 1', 'go to toilet 1', 'go to toiletpaperhanger 1', 'go to towelholder 1', 'go to towelholder 2', 'help', 'inventory', 'look']], 'facts': [[Proposition('pickupable', (Variable('cloth 2', 'object'),)), Proposition('pickupable', (Variable('candle 1', 'object'),)), Proposition('pickupable', (Variable('soapbottle 1', 'object'),)), Proposition('pickupable', (Variable('towel 1', 'object'),)), Proposition('pickupable', (Variable('scrubbrush 1', 'object'),)), Proposition('pickupable', (Variable('cloth 1', 'object'),)), Proposition('pickupable', (Variable('soapbar 1', 'object'),)), Proposition('pickupable', (Variable('soapbottle 2', 'object'),)), Proposition('pickupable', (Variable('handtowel 1', 'object'),)), Proposition('pickupable', (Variable('toiletpaper 2', 'object'),)), Proposition('pickupable', (Variable('plunger 1', 'object'),)), Proposition('pickupable', (Variable('cloth 3', 'object'),)), Proposition('pickupable', (Variable('toiletpaper 1', 'object'),)), Proposition('pickupable', (Variable('candle 2', 'object'),)), Proposition('pickupable', (Variable('spraybottle 1', 'object'),)), Proposition('receptacletype', (Variable('drawer 4', 'receptacle'), Variable('drawertype ', 'rtype'))), Proposition('receptacletype', (Variable('toiletpaperhanger 1', 'receptacle'), Variable('toiletpaperhangertype ', 'rtype'))), Proposition('receptacletype', (Variable('handtowelholder 1', 'receptacle'), Variable('handtowelholdertype ', 'rtype'))), Proposition('receptacletype', (Variable('towelholder 2', 'receptacle'), Variable('towelholdertype ', 'rtype'))), Proposition('receptacletype', (Variable('countertop 2', 'receptacle'), Variable('countertoptype ', 'rtype'))), Proposition('receptacletype', (Variable('bathtubbasin 1', 'receptacle'), Variable('bathtubbasintype ', 'rtype'))), Proposition('receptacletype', (Variable('garbagecan 1', 'receptacle'), Variable('garbagecantype ', 'rtype'))), Proposition('receptacletype', (Variable('countertop 1', 'receptacle'), Variable('countertoptype ', 'rtype'))), Proposition('receptacletype', (Variable('drawer 2', 'receptacle'), Variable('drawertype ', 'rtype'))), Proposition('receptacletype', (Variable('drawer 1', 'receptacle'), Variable('drawertype ', 'rtype'))), Proposition('receptacletype', (Variable('towelholder 1', 'receptacle'), Variable('towelholdertype ', 'rtype'))), Proposition('receptacletype', (Variable('toilet 1', 'receptacle'), Variable('toilettype ', 'rtype'))), Proposition('receptacletype', (Variable('drawer 3', 'receptacle'), Variable('drawertype ', 'rtype'))), Proposition('receptacletype', (Variable('sinkbasin 1', 'receptacle'), Variable('sinkbasintype ', 'rtype'))), Proposition('cancontain', (Variable('bathtubbasintype ', 'rtype'), Variable('handtoweltype ', 'otype'))), Proposition('cancontain', (Variable('garbagecantype ', 'rtype'), Variable('handtoweltype ', 'otype'))), Proposition('cancontain', (Variable('garbagecantype ', 'rtype'), Variable('spraybottletype ', 'otype'))), Proposition('cancontain', (Variable('handtowelholdertype ', 'rtype'), Variable('handtoweltype ', 'otype'))), Proposition('cancontain', (Variable('garbagecantype ', 'rtype'), Variable('toiletpapertype ', 'otype'))), Proposition('cancontain', (Variable('countertoptype ', 'rtype'), Variable('soapbartype ', 'otype'))), Proposition('cancontain', (Variable('toilettype ', 'rtype'), Variable('soapbartype ', 'otype'))), Proposition('cancontain', (Variable('drawertype ', 'rtype'), Variable('toiletpapertype ', 'otype'))), Proposition('cancontain', (Variable('drawertype ', 'rtype'), Variable('spraybottletype ', 'otype'))), Proposition('cancontain', (Variable('countertoptype ', 'rtype'), Variable('clothtype ', 'otype'))), Proposition('cancontain', (Variable('towelholdertype ', 'rtype'), Variable('toweltype ', 'otype'))), Proposition('cancontain', (Variable('toilettype ', 'rtype'), Variable('clothtype ', 'otype'))), Proposition('cancontain', (Variable('drawertype ', 'rtype'), Variable('candletype ', 'otype'))), Proposition('cancontain', (Variable('countertoptype ', 'rtype'), Variable('spraybottletype ', 'otype'))), Proposition('cancontain', (Variable('garbagecantype ', 'rtype'), Variable('soapbartype ', 'otype'))), Proposition('cancontain', (Variable('drawertype ', 'rtype'), Variable('handtoweltype ', 'otype'))), Proposition('cancontain', (Variable('countertoptype ', 'rtype'), Variable('toiletpapertype ', 'otype'))), Proposition('cancontain', (Variable('garbagecantype ', 'rtype'), Variable('clothtype ', 'otype'))), Proposition('cancontain', (Variable('toilettype ', 'rtype'), Variable('toiletpapertype ', 'otype'))), Proposition('cancontain', (Variable('bathtubbasintype ', 'rtype'), Variable('clothtype ', 'otype'))), Proposition('cancontain', (Variable('toilettype ', 'rtype'), Variable('spraybottletype ', 'otype'))), Proposition('cancontain', (Variable('sinkbasintype ', 'rtype'), Variable('handtoweltype ', 'otype'))), Proposition('cancontain', (Variable('countertoptype ', 'rtype'), Variable('candletype ', 'otype'))), Proposition('cancontain', (Variable('garbagecantype ', 'rtype'), Variable('soapbottletype ', 'otype'))), Proposition('cancontain', (Variable('toilettype ', 'rtype'), Variable('candletype ', 'otype'))), Proposition('cancontain', (Variable('drawertype ', 'rtype'), Variable('soapbottletype ', 'otype'))), Proposition('cancontain', (Variable('bathtubbasintype ', 'rtype'), Variable('soapbartype ', 'otype'))), Proposition('cancontain', (Variable('countertoptype ', 'rtype'), Variable('handtoweltype ', 'otype'))), Proposition('cancontain', (Variable('toilettype ', 'rtype'), Variable('handtoweltype ', 'otype'))), Proposition('cancontain', (Variable('drawertype ', 'rtype'), Variable('soapbartype ', 'otype'))), Proposition('cancontain', (Variable('drawertype ', 'rtype'), Variable('clothtype ', 'otype'))), Proposition('cancontain', (Variable('sinkbasintype ', 'rtype'), Variable('soapbartype ', 'otype'))), Proposition('cancontain', (Variable('toiletpaperhangertype ', 'rtype'), Variable('toiletpapertype ', 'otype'))), Proposition('cancontain', (Variable('sinkbasintype ', 'rtype'), Variable('clothtype ', 'otype'))), Proposition('cancontain', (Variable('countertoptype ', 'rtype'), Variable('soapbottletype ', 'otype'))), Proposition('cancontain', (Variable('toilettype ', 'rtype'), Variable('soapbottletype ', 'otype'))), Proposition('receptacleatlocation', (Variable('drawer 1', 'receptacle'), Variable('loc 9', 'location'))), Proposition('receptacleatlocation', (Variable('drawer 3', 'receptacle'), Variable('loc 10', 'location'))), Proposition('receptacleatlocation', (Variable('towelholder 1', 'receptacle'), Variable('loc 21', 'location'))), Proposition('receptacleatlocation', (Variable('drawer 2', 'receptacle'), Variable('loc 12', 'location'))), Proposition('receptacleatlocation', (Variable('countertop 2', 'receptacle'), Variable('loc 4', 'location'))), Proposition('receptacleatlocation', (Variable('towelholder 2', 'receptacle'), Variable('loc 20', 'location'))), Proposition('receptacleatlocation', (Variable('garbagecan 1', 'receptacle'), Variable('loc 17', 'location'))), Proposition('receptacleatlocation', (Variable('sinkbasin 1', 'receptacle'), Variable('loc 19', 'location'))), Proposition('receptacleatlocation', (Variable('drawer 4', 'receptacle'), Variable('loc 6', 'location'))), Proposition('receptacleatlocation', (Variable('bathtubbasin 1', 'receptacle'), Variable('loc 11', 'location'))), Proposition('receptacleatlocation', (Variable('toilet 1', 'receptacle'), Variable('loc 2', 'location'))), Proposition('receptacleatlocation', (Variable('handtowelholder 1', 'receptacle'), Variable('loc 16', 'location'))), Proposition('receptacleatlocation', (Variable('toiletpaperhanger 1', 'receptacle'), Variable('loc 5', 'location'))), Proposition('receptacleatlocation', (Variable('countertop 1', 'receptacle'), Variable('loc 14', 'location'))), Proposition('openable', (Variable('drawer 1', 'receptacle'),)), Proposition('openable', (Variable('drawer 3', 'receptacle'),)), Proposition('openable', (Variable('drawer 4', 'receptacle'),)), Proposition('openable', (Variable('drawer 2', 'receptacle'),)), Proposition('inreceptacle', (Variable('toiletpaper 1', 'object'), Variable('toiletpaperhanger 1', 'receptacle'))), Proposition('inreceptacle', (Variable('sink 1', 'object'), Variable('sinkbasin 1', 'receptacle'))), Proposition('inreceptacle', (Variable('cloth 3', 'object'), Variable('bathtubbasin 1', 'receptacle'))), Proposition('inreceptacle', (Variable('spraybottle 1', 'object'), Variable('toilet 1', 'receptacle'))), Proposition('inreceptacle', (Variable('candle 2', 'object'), Variable('drawer 1', 'receptacle'))), Proposition('inreceptacle', (Variable('toiletpaper 2', 'object'), Variable('toilet 1', 'receptacle'))), Proposition('inreceptacle', (Variable('cloth 1', 'object'), Variable('countertop 2', 'receptacle'))), Proposition('inreceptacle', (Variable('towel 1', 'object'), Variable('towelholder 1', 'receptacle'))), Proposition('inreceptacle', (Variable('soapbar 1', 'object'), Variable('countertop 2', 'receptacle'))), Proposition('inreceptacle', (Variable('soapbottle 2', 'object'), Variable('countertop 2', 'receptacle'))), Proposition('inreceptacle', (Variable('candle 1', 'object'), Variable('drawer 3', 'receptacle'))), Proposition('inreceptacle', (Variable('bathtub 1', 'object'), Variable('bathtubbasin 1', 'receptacle'))), Proposition('inreceptacle', (Variable('soapbottle 1', 'object'), Variable('countertop 1', 'receptacle'))), Proposition('inreceptacle', (Variable('handtowel 1', 'object'), Variable('handtowelholder 1', 'receptacle'))), Proposition('inreceptacle', (Variable('cloth 2', 'object'), Variable('bathtubbasin 1', 'receptacle'))), Proposition('objectatlocation', (Variable('window 1', 'object'), Variable('loc 5', 'location'))), Proposition('objectatlocation', (Variable('soapbottle 2', 'object'), Variable('loc 4', 'location'))), Proposition('objectatlocation', (Variable('spraybottle 1', 'object'), Variable('loc 2', 'location'))), Proposition('objectatlocation', (Variable('bathtub 1', 'object'), Variable('loc 11', 'location'))), Proposition('objectatlocation', (Variable('window 2', 'object'), Variable('loc 7', 'location'))), Proposition('objectatlocation', (Variable('soapbottle 1', 'object'), Variable('loc 14', 'location'))), Proposition('objectatlocation', (Variable('candle 1', 'object'), Variable('loc 10', 'location'))), Proposition('objectatlocation', (Variable('cloth 1', 'object'), Variable('loc 4', 'location'))), Proposition('objectatlocation', (Variable('cloth 3', 'object'), Variable('loc 11', 'location'))), Proposition('objectatlocation', (Variable('lightswitch 1', 'object'), Variable('loc 15', 'location'))), Proposition('objectatlocation', (Variable('showerdoor 1', 'object'), Variable('loc 3', 'location'))), Proposition('objectatlocation', (Variable('toiletpaper 2', 'object'), Variable('loc 2', 'location'))), Proposition('objectatlocation', (Variable('scrubbrush 1', 'object'), Variable('loc 1', 'location'))), Proposition('objectatlocation', (Variable('sink 1', 'object'), Variable('loc 19', 'location'))), Proposition('objectatlocation', (Variable('mirror 1', 'object'), Variable('loc 18', 'location'))), Proposition('objectatlocation', (Variable('plunger 1', 'object'), Variable('loc 1', 'location'))), Proposition('objectatlocation', (Variable('showerglass 1', 'object'), Variable('loc 8', 'location'))), Proposition('objectatlocation', (Variable('soapbar 1', 'object'), Variable('loc 4', 'location'))), Proposition('objectatlocation', (Variable('candle 2', 'object'), Variable('loc 9', 'location'))), Proposition('objectatlocation', (Variable('cloth 2', 'object'), Variable('loc 11', 'location'))), Proposition('objectatlocation', (Variable('toiletpaper 1', 'object'), Variable('loc 5', 'location'))), Proposition('objectatlocation', (Variable('handtowel 1', 'object'), Variable('loc 16', 'location'))), Proposition('objectatlocation', (Variable('towel 1', 'object'), Variable('loc 21', 'location'))), Proposition('objecttype', (Variable('showerglass 1', 'object'), Variable('showerglasstype ', 'otype'))), Proposition('objecttype', (Variable('cloth 2', 'object'), Variable('clothtype ', 'otype'))), Proposition('objecttype', (Variable('cloth 1', 'object'), Variable('clothtype ', 'otype'))), Proposition('objecttype', (Variable('showerdoor 1', 'object'), Variable('showerdoortype ', 'otype'))), Proposition('objecttype', (Variable('window 2', 'object'), Variable('windowtype ', 'otype'))), Proposition('objecttype', (Variable('soapbottle 1', 'object'), Variable('soapbottletype ', 'otype'))), Proposition('objecttype', (Variable('soapbar 1', 'object'), Variable('soapbartype ', 'otype'))), Proposition('objecttype', (Variable('sink 1', 'object'), Variable('sinktype ', 'otype'))), Proposition('objecttype', (Variable('lightswitch 1', 'object'), Variable('lightswitchtype ', 'otype'))), Proposition('objecttype', (Variable('candle 2', 'object'), Variable('candletype ', 'otype'))), Proposition('objecttype', (Variable('toiletpaper 2', 'object'), Variable('toiletpapertype ', 'otype'))), Proposition('objecttype', (Variable('cloth 3', 'object'), Variable('clothtype ', 'otype'))), Proposition('objecttype', (Variable('scrubbrush 1', 'object'), Variable('scrubbrushtype ', 'otype'))), Proposition('objecttype', (Variable('plunger 1', 'object'), Variable('plungertype ', 'otype'))), Proposition('objecttype', (Variable('bathtub 1', 'object'), Variable('bathtubtype ', 'otype'))), Proposition('objecttype', (Variable('towel 1', 'object'), Variable('toweltype ', 'otype'))), Proposition('objecttype', (Variable('handtowel 1', 'object'), Variable('handtoweltype ', 'otype'))), Proposition('objecttype', (Variable('soapbottle 2', 'object'), Variable('soapbottletype ', 'otype'))), Proposition('objecttype', (Variable('window 1', 'object'), Variable('windowtype ', 'otype'))), Proposition('objecttype', (Variable('spraybottle 1', 'object'), Variable('spraybottletype ', 'otype'))), Proposition('objecttype', (Variable('toiletpaper 1', 'object'), Variable('toiletpapertype ', 'otype'))), Proposition('objecttype', (Variable('mirror 1', 'object'), Variable('mirrortype ', 'otype'))), Proposition('objecttype', (Variable('candle 1', 'object'), Variable('candletype ', 'otype'))), Proposition('cleanable', (Variable('cloth 2', 'object'),)), Proposition('cleanable', (Variable('cloth 1', 'object'),)), Proposition('cleanable', (Variable('cloth 3', 'object'),)), Proposition('cleanable', (Variable('soapbar 1', 'object'),)), Proposition('atlocation', (Variable('agent1 ', 'agent'), Variable('loc 13', 'location')))]], 'extra.expert_plan': [['go to toilet 1']]}\n"
     ]
    }
   ],
   "source": [
    "obs, scores, dones, infos=env.step(['examine bed 1'])\n",
    "print(infos)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "400e331d",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[False]\n",
      "(0,)\n"
     ]
    }
   ],
   "source": [
    "print(infos['won'])\n",
    "print(scores)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "8e28dbbd",
   "metadata": {},
   "outputs": [
    {
     "ename": "AttributeError",
     "evalue": "module 'alfworld.agents.environment.alfred_tw_env' has no attribute 'load_env'",
     "output_type": "error",
     "traceback": [
      "\u001b[31m---------------------------------------------------------------------------\u001b[39m",
      "\u001b[31mAttributeError\u001b[39m                            Traceback (most recent call last)",
      "\u001b[36mCell\u001b[39m\u001b[36m \u001b[39m\u001b[32mIn[19]\u001b[39m\u001b[32m, line 3\u001b[39m\n\u001b[32m      1\u001b[39m \u001b[38;5;28;01mfrom\u001b[39;00m\u001b[38;5;250m \u001b[39m\u001b[34;01malfworld\u001b[39;00m\u001b[34;01m.\u001b[39;00m\u001b[34;01magents\u001b[39;00m\u001b[34;01m.\u001b[39;00m\u001b[34;01menvironment\u001b[39;00m\u001b[38;5;250m \u001b[39m\u001b[38;5;28;01mimport\u001b[39;00m alfred_tw_env\n\u001b[32m----> \u001b[39m\u001b[32m3\u001b[39m env = \u001b[43malfred_tw_env\u001b[49m\u001b[43m.\u001b[49m\u001b[43mload_env\u001b[49m(\n\u001b[32m      4\u001b[39m     split=\u001b[33m\"\u001b[39m\u001b[33mtrain\u001b[39m\u001b[33m\"\u001b[39m, \n\u001b[32m      5\u001b[39m     reward=\u001b[33m\"\u001b[39m\u001b[33mdense\u001b[39m\u001b[33m\"\u001b[39m,   \u001b[38;5;66;03m# dense reward\u001b[39;00m\n\u001b[32m      6\u001b[39m     task_type=\u001b[33m\"\u001b[39m\u001b[33mpick_and_place\u001b[39m\u001b[33m\"\u001b[39m\n\u001b[32m      7\u001b[39m )\n\u001b[32m      9\u001b[39m obs, info = env.reset()\n\u001b[32m     10\u001b[39m done = \u001b[38;5;28;01mFalse\u001b[39;00m\n",
      "\u001b[31mAttributeError\u001b[39m: module 'alfworld.agents.environment.alfred_tw_env' has no attribute 'load_env'"
     ]
    }
   ],
   "source": [
    "from alfworld.agents.environment import alfred_tw_env\n",
    "\n",
    "env = alfred_tw_env.load_env(\n",
    "    split=\"train\", \n",
    "    reward=\"dense\",   # dense reward\n",
    "    task_type=\"pick_and_place\"\n",
    ")\n",
    "\n",
    "obs, info = env.reset()\n",
    "done = False\n",
    "total_reward = 0\n",
    "while not done:\n",
    "    action = env.action_space.sample()\n",
    "    obs, reward, done, info = env.step(action)\n",
    "    print(\"Reward:\", reward)\n",
    "    total_reward += reward"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "7b757143",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "pettingllms-venv",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.12.3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
