{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## CWMB (Code World Models Benchmark)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Generate the environments"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "!python3 code-world-models/src/experiments/run_agentic_world_model_cwm.py \\\n",
    "--model openai/gpt-4.1-mini \\\n",
    "--save_dir \"results/cwm/agentic_world_model\" \\\n",
    "--num_processes=1"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "!python3 code-world-models/src/experiments/run_agentic_world_model_cwm.py \\\n",
    "--model gpt-4.1-mini \\\n",
    "--save_dir \"results/cwm/agentic_world_model\" \\\n",
    "--num_processes=4"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "!python3 code-world-models/src/experiments/run_mcts_cwm.py \\\n",
    "--idx 0 \\\n",
    "--model gpt-4.1-mini \\\n",
    "--save_dir \"results/cwm/mcts\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "!python3 code-world-models/src/experiments/run_world_coder_cwm.py \\\n",
    "--idx 0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17 \\\n",
    "--budget 10 \\\n",
    "--model gpt-4.1-mini \\\n",
    "--save_dir \"results/cwm/world_coder\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "!python3 code-world-models/src/experiments/get_best_code_from_json.py \\\n",
    "--world_coder_dir \"results/cwm/world_coder\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "!python3 code-world-models/src/experiments/run_text2world_cwm.py \\\n",
    "--world_coder_dir \"results/cwm/text2world\""
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Evaluate planning with the generated world models"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "!python3 code-world-models/src/experiments/eval_planning.py \\\n",
    "--save_dir results/awm \\\n",
    "--experiment_name \"agentic_world_model\" \\\n",
    "--n_episodes 10"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "!python3 code-world-models/src/experiments/eval_planning.py \\\n",
    "--save_dir results/mcts \\\n",
    "--experiment_name \"mcts\" \\\n",
    "--n_episodes 10"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "!python3 code-world-models/src/experiments/eval_planning.py \\\n",
    "--save_dir results/world_coder \\\n",
    "--experiment_name \"world_coder\" \\\n",
    "--n_episodes 10"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "!python3 code-world-models/src/experiments/eval_planning.py \\\n",
    "--save_dir results/text2world \\\n",
    "--experiment_name \"text2world\" \\\n",
    "--n_episodes 10"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Summary statistics of the final metrics"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "!python3 code-world-models/analyze_results.py \\\n",
    "code-world-models/results/text2world/results.json"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "!python3 code-world-models/compute.py \\\n",
    "--json_file_path \"code-world-models/results/text2world/results.json\""
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "agenticworldmodel",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.18"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
