{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "996db35c",
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import numpy as np\n",
    "from io import StringIO\n",
    "\n",
    "# Input CSV data as string\n",
    "data_exp = \"\"\"env,reward,seed,success_rate,avg_return\n",
    "button-press-topdown-v3,expert,0,1.0000,142.54\n",
    "button-press-topdown-v3,expert,1,1.0000,127.91\n",
    "button-press-topdown-v3,expert,2,0.8000,182.33\n",
    "button-press-topdown-v3,expert,3,1.0000,130.18\n",
    "button-press-topdown-v3,expert,4,1.0000,144.35\n",
    "button-press-topdown-v3,expert,5,0.6000,228.29\n",
    "button-press-topdown-v3,expert,6,1.0000,130.78\n",
    "button-press-topdown-v3,expert,7,0.7500,196.89\n",
    "button-press-topdown-v3,expert,8,0.6500,216.86\n",
    "button-press-topdown-v3,expert,9,1.0000,123.49\n",
    "door-open-v3,expert,0,1.0000,313.76\n",
    "door-open-v3,expert,1,1.0000,300.78\n",
    "door-open-v3,expert,2,1.0000,308.55\n",
    "door-open-v3,expert,3,1.0000,286.59\n",
    "door-open-v3,expert,4,1.0000,307.19\n",
    "door-open-v3,expert,5,1.0000,293.26\n",
    "door-open-v3,expert,6,1.0000,331.17\n",
    "door-open-v3,expert,7,1.0000,292.38\n",
    "door-open-v3,expert,8,1.0000,265.20\n",
    "door-open-v3,expert,9,1.0000,314.42\n",
    "drawer-close-v3,expert,0,1.0000,29.45\n",
    "drawer-close-v3,expert,1,1.0000,41.29\n",
    "drawer-close-v3,expert,2,1.0000,37.83\n",
    "drawer-close-v3,expert,3,1.0000,28.54\n",
    "drawer-close-v3,expert,4,1.0000,24.38\n",
    "drawer-close-v3,expert,5,1.0000,41.23\n",
    "drawer-close-v3,expert,6,1.0000,27.29\n",
    "drawer-close-v3,expert,7,1.0000,29.40\n",
    "drawer-close-v3,expert,8,1.0000,21.87\n",
    "drawer-close-v3,expert,9,1.0000,43.39\n",
    "drawer-open-v3,expert,0,1.0000,336.27\n",
    "drawer-open-v3,expert,1,1.0000,319.70\n",
    "drawer-open-v3,expert,2,0.9500,369.03\n",
    "drawer-open-v3,expert,3,1.0000,336.97\n",
    "drawer-open-v3,expert,4,1.0000,336.90\n",
    "drawer-open-v3,expert,5,1.0000,332.18\n",
    "drawer-open-v3,expert,6,1.0000,327.39\n",
    "drawer-open-v3,expert,7,1.0000,434.44\n",
    "drawer-open-v3,expert,8,1.0000,327.03\n",
    "drawer-open-v3,expert,9,0.9000,352.49\n",
    "peg-insert-side-v3,expert,0,0.2000,254.81\n",
    "peg-insert-side-v3,expert,1,0.1500,161.00\n",
    "peg-insert-side-v3,expert,2,0.3000,274.93\n",
    "peg-insert-side-v3,expert,3,0.0000,103.76\n",
    "peg-insert-side-v3,expert,4,0.3500,175.40\n",
    "peg-insert-side-v3,expert,5,0.3000,321.07\n",
    "peg-insert-side-v3,expert,6,0.2500,167.92\n",
    "peg-insert-side-v3,expert,7,0.2500,180.90\n",
    "peg-insert-side-v3,expert,8,0.0000,113.81\n",
    "peg-insert-side-v3,expert,9,0.1000,242.43\n",
    "pick-place-v3,expert,0,0.0000,1.60\n",
    "pick-place-v3,expert,1,0.0000,1.84\n",
    "pick-place-v3,expert,2,0.0000,1.99\n",
    "pick-place-v3,expert,3,0.0000,2.06\n",
    "pick-place-v3,expert,4,0.0500,1.60\n",
    "pick-place-v3,expert,5,0.0000,1.83\n",
    "pick-place-v3,expert,6,0.0000,1.55\n",
    "pick-place-v3,expert,7,0.0000,1.66\n",
    "pick-place-v3,expert,8,0.0000,1.89\n",
    "pick-place-v3,expert,9,0.0000,1.50\n",
    "push-v3,expert,0,0.5000,106.64\n",
    "push-v3,expert,1,0.3000,60.86\n",
    "push-v3,expert,2,0.1000,28.88\n",
    "push-v3,expert,3,0.0500,18.09\n",
    "push-v3,expert,4,0.2500,37.16\n",
    "push-v3,expert,5,0.5000,66.49\n",
    "push-v3,expert,6,0.5500,63.76\n",
    "push-v3,expert,7,0.2500,56.45\n",
    "push-v3,expert,8,0.1000,13.57\n",
    "push-v3,expert,9,0.2000,42.98\n",
    "reach-v3,expert,0,0.1000,590.71\n",
    "reach-v3,expert,1,0.3000,567.80\n",
    "reach-v3,expert,2,0.3000,595.98\n",
    "reach-v3,expert,3,0.2000,796.65\n",
    "reach-v3,expert,4,0.1500,758.75\n",
    "reach-v3,expert,5,0.3000,537.71\n",
    "reach-v3,expert,6,0.4500,592.13\n",
    "reach-v3,expert,7,0.2000,601.41\n",
    "reach-v3,expert,8,0.4000,512.87\n",
    "reach-v3,expert,9,0.2000,563.57\n",
    "window-close-v3,expert,0,1.0000,119.74\n",
    "window-close-v3,expert,1,1.0000,118.96\n",
    "window-close-v3,expert,2,1.0000,120.08\n",
    "window-close-v3,expert,3,1.0000,120.34\n",
    "window-close-v3,expert,4,1.0000,119.98\n",
    "window-close-v3,expert,5,1.0000,121.67\n",
    "window-close-v3,expert,6,1.0000,119.91\n",
    "window-close-v3,expert,7,1.0000,119.93\n",
    "window-close-v3,expert,8,1.0000,121.46\n",
    "window-close-v3,expert,9,1.0000,119.89\n",
    "window-open-v3,expert,0,1.0000,74.08\n",
    "window-open-v3,expert,1,1.0000,79.94\n",
    "window-open-v3,expert,2,1.0000,83.14\n",
    "window-open-v3,expert,3,1.0000,79.51\n",
    "window-open-v3,expert,4,1.0000,83.62\n",
    "window-open-v3,expert,5,1.0000,82.15\n",
    "window-open-v3,expert,6,1.0000,78.90\n",
    "window-open-v3,expert,7,1.0000,82.62\n",
    "window-open-v3,expert,8,1.0000,84.16\n",
    "window-open-v3,expert,9,1.0000,77.21\n",
    "\"\"\"\n",
    "\n",
    "data_no_ttt = \"\"\"env,reward,seed,success_rate,avg_return\n",
    "button-press-topdown-v3,no_ttt,0,0.9000,150.85\n",
    "button-press-topdown-v3,no_ttt,1,0.9000,158.34\n",
    "button-press-topdown-v3,no_ttt,2,1.0000,140.30\n",
    "button-press-topdown-v3,no_ttt,3,0.9000,148.59\n",
    "button-press-topdown-v3,no_ttt,4,1.0000,141.73\n",
    "button-press-topdown-v3,no_ttt,5,0.9000,156.52\n",
    "button-press-topdown-v3,no_ttt,6,1.0000,142.06\n",
    "button-press-topdown-v3,no_ttt,7,0.9000,165.51\n",
    "button-press-topdown-v3,no_ttt,8,1.0000,156.09\n",
    "button-press-topdown-v3,no_ttt,9,0.6000,217.16\n",
    "door-open-v3,no_ttt,0,1.0000,289.75\n",
    "door-open-v3,no_ttt,1,1.0000,293.84\n",
    "door-open-v3,no_ttt,2,1.0000,308.09\n",
    "door-open-v3,no_ttt,3,1.0000,274.73\n",
    "door-open-v3,no_ttt,4,1.0000,281.71\n",
    "door-open-v3,no_ttt,5,1.0000,298.12\n",
    "door-open-v3,no_ttt,6,1.0000,344.70\n",
    "door-open-v3,no_ttt,7,1.0000,334.09\n",
    "door-open-v3,no_ttt,8,1.0000,295.50\n",
    "door-open-v3,no_ttt,9,1.0000,362.80\n",
    "drawer-close-v3,no_ttt,0,1.0000,65.72\n",
    "drawer-close-v3,no_ttt,1,1.0000,42.05\n",
    "drawer-close-v3,no_ttt,2,1.0000,48.10\n",
    "drawer-close-v3,no_ttt,3,1.0000,31.69\n",
    "drawer-close-v3,no_ttt,4,1.0000,39.38\n",
    "drawer-close-v3,no_ttt,5,1.0000,39.52\n",
    "drawer-close-v3,no_ttt,6,1.0000,24.88\n",
    "drawer-close-v3,no_ttt,7,1.0000,25.59\n",
    "drawer-close-v3,no_ttt,8,1.0000,21.35\n",
    "drawer-close-v3,no_ttt,9,1.0000,37.99\n",
    "drawer-open-v3,no_ttt,0,1.0000,375.90\n",
    "drawer-open-v3,no_ttt,1,1.0000,353.16\n",
    "drawer-open-v3,no_ttt,2,1.0000,349.25\n",
    "drawer-open-v3,no_ttt,3,1.0000,331.36\n",
    "drawer-open-v3,no_ttt,4,1.0000,336.47\n",
    "drawer-open-v3,no_ttt,5,0.9500,397.01\n",
    "drawer-open-v3,no_ttt,6,1.0000,332.42\n",
    "drawer-open-v3,no_ttt,7,1.0000,363.87\n",
    "drawer-open-v3,no_ttt,8,1.0000,382.74\n",
    "drawer-open-v3,no_ttt,9,1.0000,323.51\n",
    "peg-insert-side-v3,no_ttt,0,0.2000,149.72\n",
    "peg-insert-side-v3,no_ttt,1,0.1000,60.52\n",
    "peg-insert-side-v3,no_ttt,2,0.3000,181.21\n",
    "peg-insert-side-v3,no_ttt,3,0.1000,183.75\n",
    "peg-insert-side-v3,no_ttt,4,0.6000,130.87\n",
    "peg-insert-side-v3,no_ttt,5,0.2500,126.91\n",
    "peg-insert-side-v3,no_ttt,6,0.1000,75.44\n",
    "peg-insert-side-v3,no_ttt,7,0.2000,75.07\n",
    "peg-insert-side-v3,no_ttt,8,0.3000,67.21\n",
    "peg-insert-side-v3,no_ttt,9,0.1500,165.82\n",
    "pick-place-v3,no_ttt,0,0.0000,2.15\n",
    "pick-place-v3,no_ttt,1,0.0000,2.11\n",
    "pick-place-v3,no_ttt,2,0.0000,2.27\n",
    "pick-place-v3,no_ttt,3,0.0000,2.33\n",
    "pick-place-v3,no_ttt,4,0.0000,1.84\n",
    "pick-place-v3,no_ttt,5,0.1000,9.10\n",
    "pick-place-v3,no_ttt,6,0.2500,9.45\n",
    "pick-place-v3,no_ttt,7,0.0500,4.11\n",
    "pick-place-v3,no_ttt,8,0.0500,4.40\n",
    "pick-place-v3,no_ttt,9,0.0000,3.65\n",
    "push-v3,no_ttt,0,0.3000,68.32\n",
    "push-v3,no_ttt,1,0.5500,91.34\n",
    "push-v3,no_ttt,2,0.2500,48.30\n",
    "push-v3,no_ttt,3,0.4500,90.83\n",
    "push-v3,no_ttt,4,0.1000,19.24\n",
    "push-v3,no_ttt,5,0.1500,44.47\n",
    "push-v3,no_ttt,6,0.3500,142.81\n",
    "push-v3,no_ttt,7,0.2500,51.65\n",
    "push-v3,no_ttt,8,0.2000,32.61\n",
    "push-v3,no_ttt,9,0.5000,83.46\n",
    "reach-v3,no_ttt,0,0.0500,525.81\n",
    "reach-v3,no_ttt,1,0.0500,547.59\n",
    "reach-v3,no_ttt,2,0.0500,586.55\n",
    "reach-v3,no_ttt,3,0.2000,419.20\n",
    "reach-v3,no_ttt,4,0.3500,412.46\n",
    "reach-v3,no_ttt,5,0.1000,348.23\n",
    "reach-v3,no_ttt,6,0.2500,461.81\n",
    "reach-v3,no_ttt,7,0.2500,395.31\n",
    "reach-v3,no_ttt,8,0.0500,507.88\n",
    "reach-v3,no_ttt,9,0.1000,364.76\n",
    "window-close-v3,no_ttt,0,1.0000,121.92\n",
    "window-close-v3,no_ttt,1,1.0000,121.86\n",
    "window-close-v3,no_ttt,2,1.0000,120.11\n",
    "window-close-v3,no_ttt,3,1.0000,120.45\n",
    "window-close-v3,no_ttt,4,1.0000,125.39\n",
    "window-close-v3,no_ttt,5,1.0000,123.85\n",
    "window-close-v3,no_ttt,6,1.0000,120.96\n",
    "window-close-v3,no_ttt,7,1.0000,122.23\n",
    "window-close-v3,no_ttt,8,1.0000,122.59\n",
    "window-close-v3,no_ttt,9,1.0000,118.79\n",
    "window-open-v3,no_ttt,0,1.0000,78.94\n",
    "window-open-v3,no_ttt,1,1.0000,80.32\n",
    "window-open-v3,no_ttt,2,1.0000,82.01\n",
    "window-open-v3,no_ttt,3,1.0000,81.99\n",
    "window-open-v3,no_ttt,4,1.0000,85.22\n",
    "window-open-v3,no_ttt,5,1.0000,81.47\n",
    "window-open-v3,no_ttt,6,1.0000,82.71\n",
    "window-open-v3,no_ttt,7,1.0000,81.52\n",
    "window-open-v3,no_ttt,8,1.0000,82.37\n",
    "window-open-v3,no_ttt,9,1.0000,80.85\n",
    "\"\"\"\n",
    "\n",
    "data_online = \"\"\"env,reward,seed,success_rate,avg_return\n",
    "button-press-topdown-v3,online,0,0.8000,170.86\n",
    "button-press-topdown-v3,online,1,0.8000,180.86\n",
    "button-press-topdown-v3,online,2,0.9000,164.74\n",
    "button-press-topdown-v3,online,3,0.9000,150.90\n",
    "button-press-topdown-v3,online,4,0.8500,173.45\n",
    "button-press-topdown-v3,online,5,0.9000,152.63\n",
    "button-press-topdown-v3,online,6,1.0000,134.20\n",
    "button-press-topdown-v3,online,7,0.9000,166.51\n",
    "button-press-topdown-v3,online,8,0.8000,179.53\n",
    "button-press-topdown-v3,online,9,1.0000,122.04\n",
    "door-open-v3,online,0,1.0000,315.40\n",
    "door-open-v3,online,1,1.0000,328.27\n",
    "door-open-v3,online,2,1.0000,294.98\n",
    "door-open-v3,online,3,1.0000,293.63\n",
    "door-open-v3,online,4,1.0000,322.91\n",
    "door-open-v3,online,5,1.0000,324.66\n",
    "door-open-v3,online,6,1.0000,299.30\n",
    "door-open-v3,online,7,1.0000,287.04\n",
    "door-open-v3,online,8,1.0000,269.97\n",
    "door-open-v3,online,9,1.0000,300.50\n",
    "drawer-close-v3,online,0,1.0000,34.15\n",
    "drawer-close-v3,online,1,1.0000,41.17\n",
    "drawer-close-v3,online,2,1.0000,37.81\n",
    "drawer-close-v3,online,3,1.0000,26.17\n",
    "drawer-close-v3,online,4,1.0000,28.09\n",
    "drawer-close-v3,online,5,1.0000,46.42\n",
    "drawer-close-v3,online,6,1.0000,24.47\n",
    "drawer-close-v3,online,7,1.0000,27.12\n",
    "drawer-close-v3,online,8,1.0000,23.38\n",
    "drawer-close-v3,online,9,1.0000,31.22\n",
    "drawer-open-v3,online,0,1.0000,289.19\n",
    "drawer-open-v3,online,1,1.0000,360.28\n",
    "drawer-open-v3,online,2,1.0000,360.95\n",
    "drawer-open-v3,online,3,1.0000,311.26\n",
    "drawer-open-v3,online,4,1.0000,347.67\n",
    "drawer-open-v3,online,5,0.9500,352.80\n",
    "drawer-open-v3,online,6,1.0000,342.04\n",
    "drawer-open-v3,online,7,1.0000,361.73\n",
    "drawer-open-v3,online,8,1.0000,320.71\n",
    "drawer-open-v3,online,9,1.0000,348.43\n",
    "peg-insert-side-v3,online,0,0.0500,80.53\n",
    "peg-insert-side-v3,online,1,0.0500,50.01\n",
    "peg-insert-side-v3,online,2,0.2500,111.61\n",
    "peg-insert-side-v3,online,3,0.1000,55.14\n",
    "peg-insert-side-v3,online,4,0.4500,169.84\n",
    "peg-insert-side-v3,online,5,0.0500,45.85\n",
    "peg-insert-side-v3,online,6,0.0500,60.59\n",
    "peg-insert-side-v3,online,7,0.2000,70.82\n",
    "peg-insert-side-v3,online,8,0.3500,124.43\n",
    "peg-insert-side-v3,online,9,0.2500,95.09\n",
    "pick-place-v3,online,0,0.1500,12.87\n",
    "pick-place-v3,online,1,0.2000,7.81\n",
    "pick-place-v3,online,2,0.4000,30.65\n",
    "pick-place-v3,online,3,0.2000,11.16\n",
    "pick-place-v3,online,4,0.2500,13.17\n",
    "pick-place-v3,online,5,0.2500,19.85\n",
    "pick-place-v3,online,6,0.4000,29.14\n",
    "pick-place-v3,online,7,0.1500,8.31\n",
    "pick-place-v3,online,8,0.0000,2.45\n",
    "pick-place-v3,online,9,0.5000,32.07\n",
    "push-v3,online,0,0.2000,61.49\n",
    "push-v3,online,1,0.5500,85.29\n",
    "push-v3,online,2,0.2500,103.07\n",
    "push-v3,online,3,0.4500,98.14\n",
    "push-v3,online,4,0.1000,44.06\n",
    "push-v3,online,5,0.3000,136.02\n",
    "push-v3,online,6,0.7500,142.68\n",
    "push-v3,online,7,0.3500,133.00\n",
    "push-v3,online,8,0.0500,61.86\n",
    "push-v3,online,9,0.6500,105.39\n",
    "reach-v3,online,0,0.2500,384.14\n",
    "reach-v3,online,1,0.2500,293.38\n",
    "reach-v3,online,2,0.5000,311.48\n",
    "reach-v3,online,3,0.2000,473.44\n",
    "reach-v3,online,4,0.2000,421.34\n",
    "reach-v3,online,5,0.3500,333.88\n",
    "reach-v3,online,6,0.4000,376.03\n",
    "reach-v3,online,7,0.2500,250.22\n",
    "reach-v3,online,8,0.0000,494.88\n",
    "reach-v3,online,9,0.5500,287.15\n",
    "window-close-v3,online,0,1.0000,120.67\n",
    "window-close-v3,online,1,1.0000,121.59\n",
    "window-close-v3,online,2,1.0000,121.76\n",
    "window-close-v3,online,3,1.0000,122.56\n",
    "window-close-v3,online,4,1.0000,122.44\n",
    "window-close-v3,online,5,1.0000,119.64\n",
    "window-close-v3,online,6,1.0000,123.96\n",
    "window-close-v3,online,7,1.0000,123.47\n",
    "window-close-v3,online,8,1.0000,121.94\n",
    "window-close-v3,online,9,1.0000,119.34\n",
    "window-open-v3,online,0,1.0000,79.82\n",
    "window-open-v3,online,1,1.0000,81.76\n",
    "window-open-v3,online,2,1.0000,82.35\n",
    "window-open-v3,online,3,1.0000,80.19\n",
    "window-open-v3,online,4,1.0000,86.94\n",
    "window-open-v3,online,5,1.0000,77.99\n",
    "window-open-v3,online,6,1.0000,82.49\n",
    "window-open-v3,online,7,1.0000,84.06\n",
    "window-open-v3,online,8,1.0000,80.09\n",
    "window-open-v3,online,9,1.0000,74.20\n",
    "\"\"\" \n",
    "\n",
    "data_clip = \"\"\"env,reward,seed,success_rate,avg_return\n",
    "button-press-topdown-v3,clip,0,1.0000,120.23\n",
    "button-press-topdown-v3,clip,1,1.0000,150.37\n",
    "button-press-topdown-v3,clip,2,1.0000,154.59\n",
    "button-press-topdown-v3,clip,3,1.0000,141.26\n",
    "button-press-topdown-v3,clip,4,1.0000,135.32\n",
    "button-press-topdown-v3,clip,5,1.0000,131.04\n",
    "button-press-topdown-v3,clip,6,1.0000,146.63\n",
    "button-press-topdown-v3,clip,7,0.7000,209.59\n",
    "button-press-topdown-v3,clip,8,0.6000,234.38\n",
    "button-press-topdown-v3,clip,9,0.7500,184.65\n",
    "door-open-v3,clip,0,1.0000,307.38\n",
    "door-open-v3,clip,1,1.0000,354.07\n",
    "door-open-v3,clip,2,1.0000,285.34\n",
    "door-open-v3,clip,3,1.0000,285.82\n",
    "door-open-v3,clip,4,1.0000,274.85\n",
    "door-open-v3,clip,5,1.0000,296.84\n",
    "door-open-v3,clip,6,1.0000,302.56\n",
    "door-open-v3,clip,7,1.0000,320.04\n",
    "door-open-v3,clip,8,1.0000,270.78\n",
    "door-open-v3,clip,9,1.0000,278.12\n",
    "drawer-close-v3,clip,0,1.0000,32.70\n",
    "drawer-close-v3,clip,1,1.0000,38.73\n",
    "drawer-close-v3,clip,2,1.0000,36.20\n",
    "drawer-close-v3,clip,3,1.0000,25.37\n",
    "drawer-close-v3,clip,4,1.0000,23.15\n",
    "drawer-close-v3,clip,5,1.0000,41.13\n",
    "drawer-close-v3,clip,6,1.0000,26.45\n",
    "drawer-close-v3,clip,7,1.0000,25.51\n",
    "drawer-close-v3,clip,8,1.0000,23.30\n",
    "drawer-close-v3,clip,9,1.0000,40.48\n",
    "drawer-open-v3,clip,0,1.0000,295.24\n",
    "drawer-open-v3,clip,1,1.0000,374.35\n",
    "drawer-open-v3,clip,2,1.0000,411.78\n",
    "drawer-open-v3,clip,3,0.4500,466.49\n",
    "drawer-open-v3,clip,4,1.0000,326.38\n",
    "drawer-open-v3,clip,5,1.0000,334.42\n",
    "drawer-open-v3,clip,6,1.0000,332.73\n",
    "drawer-open-v3,clip,7,1.0000,310.59\n",
    "drawer-open-v3,clip,8,1.0000,366.10\n",
    "drawer-open-v3,clip,9,1.0000,316.63\n",
    "peg-insert-side-v3,clip,0,0.3000,121.22\n",
    "peg-insert-side-v3,clip,1,0.0000,10.75\n",
    "peg-insert-side-v3,clip,2,0.0000,40.02\n",
    "peg-insert-side-v3,clip,3,0.1000,70.05\n",
    "peg-insert-side-v3,clip,4,0.5500,98.46\n",
    "peg-insert-side-v3,clip,5,0.1000,113.92\n",
    "peg-insert-side-v3,clip,6,0.0500,49.77\n",
    "peg-insert-side-v3,clip,7,0.0000,23.35\n",
    "peg-insert-side-v3,clip,8,0.2500,152.99\n",
    "peg-insert-side-v3,clip,9,0.0000,49.20\n",
    "pick-place-v3,clip,0,0.1000,9.39\n",
    "pick-place-v3,clip,1,0.0000,2.18\n",
    "pick-place-v3,clip,2,0.0000,1.81\n",
    "pick-place-v3,clip,3,0.2000,2.83\n",
    "pick-place-v3,clip,4,0.2000,6.06\n",
    "pick-place-v3,clip,5,0.0000,17.56\n",
    "pick-place-v3,clip,6,0.0000,1.97\n",
    "pick-place-v3,clip,7,0.0000,6.80\n",
    "pick-place-v3,clip,8,0.0000,2.19\n",
    "pick-place-v3,clip,9,0.1500,104.92\n",
    "push-v3,clip,0,0.3500,61.24\n",
    "push-v3,clip,1,0.1000,24.22\n",
    "push-v3,clip,2,0.1500,30.50\n",
    "push-v3,clip,3,0.1500,28.42\n",
    "push-v3,clip,4,0.4500,87.47\n",
    "push-v3,clip,5,0.3500,68.60\n",
    "push-v3,clip,6,0.2000,44.18\n",
    "push-v3,clip,7,0.1500,59.34\n",
    "push-v3,clip,8,0.0500,17.28\n",
    "push-v3,clip,9,0.1000,70.44\n",
    "reach-v3,clip,0,0.1000,593.98\n",
    "reach-v3,clip,1,0.0500,404.20\n",
    "reach-v3,clip,2,0.2000,503.89\n",
    "reach-v3,clip,3,0.3500,348.16\n",
    "reach-v3,clip,4,0.3500,405.24\n",
    "reach-v3,clip,5,0.0000,531.86\n",
    "reach-v3,clip,6,0.2000,516.44\n",
    "reach-v3,clip,7,0.0000,326.67\n",
    "reach-v3,clip,8,0.2500,391.92\n",
    "reach-v3,clip,9,0.3000,448.24\n",
    "window-close-v3,clip,0,1.0000,121.83\n",
    "window-close-v3,clip,1,1.0000,122.32\n",
    "window-close-v3,clip,2,1.0000,121.80\n",
    "window-close-v3,clip,3,1.0000,119.00\n",
    "window-close-v3,clip,4,1.0000,123.51\n",
    "window-close-v3,clip,5,1.0000,120.91\n",
    "window-close-v3,clip,6,1.0000,121.74\n",
    "window-close-v3,clip,7,1.0000,124.34\n",
    "window-close-v3,clip,8,1.0000,122.18\n",
    "window-close-v3,clip,9,1.0000,117.81\n",
    "window-open-v3,clip,0,1.0000,79.08\n",
    "window-open-v3,clip,1,1.0000,83.66\n",
    "window-open-v3,clip,2,1.0000,84.58\n",
    "window-open-v3,clip,3,1.0000,80.19\n",
    "window-open-v3,clip,4,1.0000,85.53\n",
    "window-open-v3,clip,5,1.0000,82.32\n",
    "window-open-v3,clip,6,1.0000,82.09\n",
    "window-open-v3,clip,7,1.0000,82.85\n",
    "window-open-v3,clip,8,1.0000,82.42\n",
    "window-open-v3,clip,9,1.0000,78.13\n",
    "\"\"\"\n",
    "\n",
    "data_clip_reg = \"\"\"env,reward,seed,success_rate,avg_return\n",
    "button-press-topdown-v3,clip_reg,0,1.0000,142.30\n",
    "button-press-topdown-v3,clip_reg,1,1.0000,135.71\n",
    "button-press-topdown-v3,clip_reg,2,0.9000,163.17\n",
    "button-press-topdown-v3,clip_reg,3,1.0000,124.03\n",
    "button-press-topdown-v3,clip_reg,4,0.8500,172.21\n",
    "button-press-topdown-v3,clip_reg,5,0.7500,191.53\n",
    "button-press-topdown-v3,clip_reg,6,0.9000,157.16\n",
    "button-press-topdown-v3,clip_reg,7,0.7000,208.37\n",
    "button-press-topdown-v3,clip_reg,8,0.7000,203.38\n",
    "button-press-topdown-v3,clip_reg,9,1.0000,118.77\n",
    "door-open-v3,clip_reg,0,1.0000,312.37\n",
    "door-open-v3,clip_reg,1,1.0000,382.16\n",
    "door-open-v3,clip_reg,2,1.0000,309.81\n",
    "door-open-v3,clip_reg,3,1.0000,313.98\n",
    "door-open-v3,clip_reg,4,1.0000,335.37\n",
    "door-open-v3,clip_reg,5,1.0000,329.93\n",
    "door-open-v3,clip_reg,6,1.0000,277.38\n",
    "door-open-v3,clip_reg,7,1.0000,303.25\n",
    "door-open-v3,clip_reg,8,1.0000,273.71\n",
    "door-open-v3,clip_reg,9,1.0000,311.53\n",
    "drawer-close-v3,clip_reg,0,1.0000,33.33\n",
    "drawer-close-v3,clip_reg,1,1.0000,41.47\n",
    "drawer-close-v3,clip_reg,2,1.0000,43.65\n",
    "drawer-close-v3,clip_reg,3,1.0000,25.95\n",
    "drawer-close-v3,clip_reg,4,1.0000,25.15\n",
    "drawer-close-v3,clip_reg,5,0.8500,51.46\n",
    "drawer-close-v3,clip_reg,6,1.0000,29.66\n",
    "drawer-close-v3,clip_reg,7,1.0000,44.17\n",
    "drawer-close-v3,clip_reg,8,1.0000,22.53\n",
    "drawer-close-v3,clip_reg,9,1.0000,36.62\n",
    "drawer-open-v3,clip_reg,0,0.8500,393.97\n",
    "drawer-open-v3,clip_reg,1,1.0000,343.46\n",
    "drawer-open-v3,clip_reg,2,1.0000,331.45\n",
    "drawer-open-v3,clip_reg,3,0.9000,350.71\n",
    "drawer-open-v3,clip_reg,4,1.0000,338.66\n",
    "drawer-open-v3,clip_reg,5,1.0000,364.09\n",
    "drawer-open-v3,clip_reg,6,1.0000,295.45\n",
    "drawer-open-v3,clip_reg,7,1.0000,377.82\n",
    "drawer-open-v3,clip_reg,8,1.0000,338.27\n",
    "drawer-open-v3,clip_reg,9,1.0000,312.33\n",
    "peg-insert-side-v3,clip_reg,0,0.2500,93.92\n",
    "peg-insert-side-v3,clip_reg,1,0.0000,23.95\n",
    "peg-insert-side-v3,clip_reg,2,0.0500,100.06\n",
    "peg-insert-side-v3,clip_reg,3,0.1000,55.39\n",
    "peg-insert-side-v3,clip_reg,4,0.0000,77.88\n",
    "peg-insert-side-v3,clip_reg,5,0.0000,19.67\n",
    "peg-insert-side-v3,clip_reg,6,0.0500,37.42\n",
    "peg-insert-side-v3,clip_reg,7,0.1000,63.30\n",
    "peg-insert-side-v3,clip_reg,8,0.2000,132.03\n",
    "peg-insert-side-v3,clip_reg,9,0.1000,92.68\n",
    "pick-place-v3,clip_reg,0,0.0000,2.41\n",
    "pick-place-v3,clip_reg,1,0.0000,2.24\n",
    "pick-place-v3,clip_reg,2,0.0000,2.49\n",
    "pick-place-v3,clip_reg,3,0.1000,21.75\n",
    "pick-place-v3,clip_reg,4,0.1500,8.57\n",
    "pick-place-v3,clip_reg,5,0.0000,2.67\n",
    "pick-place-v3,clip_reg,6,0.0000,2.36\n",
    "pick-place-v3,clip_reg,7,0.0000,1.70\n",
    "pick-place-v3,clip_reg,8,0.0500,5.50\n",
    "pick-place-v3,clip_reg,9,0.1000,54.01\n",
    "push-v3,clip_reg,0,0.2500,178.91\n",
    "push-v3,clip_reg,1,0.4000,73.47\n",
    "push-v3,clip_reg,2,0.2500,58.04\n",
    "push-v3,clip_reg,3,0.4000,90.12\n",
    "push-v3,clip_reg,4,0.0500,22.81\n",
    "push-v3,clip_reg,5,0.1000,46.58\n",
    "push-v3,clip_reg,6,0.2000,71.59\n",
    "push-v3,clip_reg,7,0.3500,61.39\n",
    "push-v3,clip_reg,8,0.0000,19.92\n",
    "push-v3,clip_reg,9,0.2000,102.48\n",
    "reach-v3,clip_reg,0,0.0500,392.96\n",
    "reach-v3,clip_reg,1,0.0000,452.93\n",
    "reach-v3,clip_reg,2,0.0000,342.28\n",
    "reach-v3,clip_reg,3,0.4500,501.50\n",
    "reach-v3,clip_reg,4,0.2000,509.98\n",
    "reach-v3,clip_reg,5,0.0500,568.94\n",
    "reach-v3,clip_reg,6,0.3500,634.59\n",
    "reach-v3,clip_reg,7,0.0500,381.02\n",
    "reach-v3,clip_reg,8,0.1000,473.22\n",
    "reach-v3,clip_reg,9,0.1500,435.77\n",
    "window-close-v3,clip_reg,0,1.0000,121.90\n",
    "window-close-v3,clip_reg,1,1.0000,121.03\n",
    "window-close-v3,clip_reg,2,1.0000,123.18\n",
    "window-close-v3,clip_reg,3,1.0000,121.79\n",
    "window-close-v3,clip_reg,4,1.0000,122.06\n",
    "window-close-v3,clip_reg,5,1.0000,122.31\n",
    "window-close-v3,clip_reg,6,1.0000,121.83\n",
    "window-close-v3,clip_reg,7,1.0000,121.37\n",
    "window-close-v3,clip_reg,8,1.0000,122.89\n",
    "window-close-v3,clip_reg,9,1.0000,119.86\n",
    "window-open-v3,clip_reg,0,1.0000,76.17\n",
    "window-open-v3,clip_reg,1,1.0000,82.77\n",
    "window-open-v3,clip_reg,2,1.0000,84.01\n",
    "window-open-v3,clip_reg,3,1.0000,81.89\n",
    "window-open-v3,clip_reg,4,1.0000,83.03\n",
    "window-open-v3,clip_reg,5,1.0000,81.56\n",
    "window-open-v3,clip_reg,6,1.0000,84.76\n",
    "window-open-v3,clip_reg,7,1.0000,83.94\n",
    "window-open-v3,clip_reg,8,1.0000,82.46\n",
    "window-open-v3,clip_reg,9,1.0000,74.70\n",
    "\"\"\"\n",
    "\n",
    "# Load into DataFrame\n",
    "df_exp = pd.read_csv(StringIO(data_exp))\n",
    "df_online = pd.read_csv(StringIO(data_online))\n",
    "df_no_ttt = pd.read_csv(StringIO(data_no_ttt))\n",
    "df_clip = pd.read_csv(StringIO(data_clip))\n",
    "df_clip_reg = pd.read_csv(StringIO(data_clip_reg))\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "4f0ddafb",
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "# --- 1) Core IQM on a 1D array of scores -----------------\n",
    "def iqm_from_array(x: np.ndarray) -> float:\n",
    "    x = np.asarray(x, dtype=float)\n",
    "    x_sorted = np.sort(x)\n",
    "    k = len(x_sorted)\n",
    "    lo = int(np.floor(0.25 * k))\n",
    "    hi = int(np.ceil(0.75 * k))\n",
    "    # middle 50% (handles small k gracefully)\n",
    "    middle = x_sorted[lo:hi]\n",
    "    return float(middle.mean()) if len(middle) else float(x_sorted.mean())\n",
    "\n",
    "# --- 2) IQM on a DF: flatten across tasks×seeds -----------\n",
    "def iqm_from_df(df: pd.DataFrame, score_col: str) -> float:\n",
    "    return iqm_from_array(df[score_col].to_numpy())\n",
    "\n",
    "# --- 3) Stratified bootstrap CI (percentile), stratify by env/task ----\n",
    "def iqm_stratified_boot_ci(\n",
    "    df: pd.DataFrame,\n",
    "    group_col: str,     # e.g., \"env\"\n",
    "    score_col: str,     # e.g., \"success_rate\" or \"normalized_score\"\n",
    "    B: int = 10_000,\n",
    "    ci: float = 0.95,\n",
    "    rng: np.random.Generator | None = None\n",
    "):\n",
    "    if rng is None:\n",
    "        rng = np.random.default_rng(0)\n",
    "\n",
    "    # Pre-split groups to speed up resampling\n",
    "    groups = [g[score_col].to_numpy() for _, g in df.groupby(group_col, sort=False)]\n",
    "    n_per_group = [len(g) for g in groups]\n",
    "\n",
    "    samples = np.empty(B, dtype=float)\n",
    "    for b in range(B):\n",
    "        # resample within each group independently (same size, with replacement)\n",
    "        resampled = []\n",
    "        for g, n in zip(groups, n_per_group):\n",
    "            idx = rng.integers(0, n, size=n)  # bootstrap indices\n",
    "            resampled.append(g[idx])\n",
    "        x = np.concatenate(resampled, axis=0)\n",
    "        samples[b] = iqm_from_array(x)\n",
    "\n",
    "    alpha = (1 - ci) / 2\n",
    "    lo, hi = np.quantile(samples, [alpha, 1 - alpha])\n",
    "    point = iqm_from_array(df[score_col].to_numpy())\n",
    "    return point, float(lo), float(hi)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "f57b5f9e",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "IQM(success) = 0.7790  (95% CI: [0.7500, 0.8040])\n"
     ]
    }
   ],
   "source": [
    "point, lo, hi = iqm_stratified_boot_ci(df_exp, group_col=\"env\", score_col=\"success_rate\", B=10_000)\n",
    "print(f\"IQM(success) = {point:.4f}  (95% CI: [{lo:.4f}, {hi:.4f}])\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "eaafc4c5",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "IQM(success) = 0.8150  (95% CI: [0.7850, 0.8380])\n"
     ]
    }
   ],
   "source": [
    "point, lo, hi = iqm_stratified_boot_ci(df_online, group_col=\"env\", score_col=\"success_rate\", B=10_000)\n",
    "print(f\"IQM(success) = {point:.4f}  (95% CI: [{lo:.4f}, {hi:.4f}])\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "59f1ce71",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "IQM(success) = 0.7850  (95% CI: [0.7590, 0.8090])\n"
     ]
    }
   ],
   "source": [
    "point, lo, hi = iqm_stratified_boot_ci(df_no_ttt, group_col=\"env\", score_col=\"success_rate\", B=10_000)\n",
    "print(f\"IQM(success) = {point:.4f}  (95% CI: [{lo:.4f}, {hi:.4f}])\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "id": "72123f56",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "IQM(success) = 0.7600  (95% CI: [0.7220, 0.7910])\n"
     ]
    }
   ],
   "source": [
    "point, lo, hi = iqm_stratified_boot_ci(df_clip, group_col=\"env\", score_col=\"success_rate\", B=10_000)\n",
    "print(f\"IQM(success) = {point:.4f}  (95% CI: [{lo:.4f}, {hi:.4f}])\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "id": "ef5c3e9c",
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "IQM(success) = 0.7460  (95% CI: [0.7180, 0.7710])\n"
     ]
    }
   ],
   "source": [
    "point, lo, hi = iqm_stratified_boot_ci(df_clip_reg, group_col=\"env\", score_col=\"success_rate\", B=10_000)\n",
    "print(f\"IQM(success) = {point:.4f}  (95% CI: [{lo:.4f}, {hi:.4f}])\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "67588939",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "mw311",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.13"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
