{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# !pip install zeno_client"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd\n",
    "import json\n",
    "import os\n",
    "from dotenv import load_dotenv\n",
    "\n",
    "import zeno_client"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%load_ext dotenv\n",
    "%dotenv"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "RESULT_JSONS = [\n",
    "    \"cllamaINST_zeno.jsonl\",\n",
    "    ]\n",
    "RESULT_NAMES = [\"cllamaINST\"]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "max_records = 1000\n",
    "data = []\n",
    "\n",
    "raw_json_pd = pd.read_json(path_or_buf=RESULT_JSONS[0], lines=True)\n",
    "raw_json_pd[\"id\"] = raw_json_pd.index\n",
    "raw_json_pd = raw_json_pd.drop('observation', axis=1)\n",
    "\n",
    "\n",
    "with open(RESULT_JSONS[0], 'r') as f:\n",
    "    for line in f:\n",
    "        data.append(json.loads(line))\n",
    "        if len(data) == max_records:\n",
    "            break\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# define the data\n",
    "data_df = pd.DataFrame(\n",
    "    {\n",
    "        \"id\": list(range(len(data))),\n",
    "        \"site\": [x[\"website\"] for x in data],\n",
    "        \"objective\": [x[\"objective\"] for x in data],\n",
    "        \"observation\": [\n",
    "            f\"{x['observation']}\\n```python\\n{x['past_actions'] if x['past_actions'] else 'Empty'}```\\nobjective: {x['objective']}\\nprediction: {x['prediction']}\".replace('+==+==+','🚀')\n",
    "        for x in data],\n",
    "        \"ground_truth\": [x[\"ground_truth\"] for x in data]\n",
    "})\n",
    "obs_df = pd.DataFrame(\n",
    "    {\n",
    "        \"id\": list(range(len(data))),\n",
    "        \"observation\": [\n",
    "            f\"{x['observation']}\\n```python\\n{x['past_actions'] if x['past_actions'] else 'Empty'}```\\nobjective: {x['objective']}\\nprediction: {x['prediction']}\".replace('+==+==+','🚀')\n",
    "        for x in data]\n",
    "    })\n",
    "\n",
    "df = pd.merge(obs_df, raw_json_pd, on='id', how='inner')\n",
    "# data_df = df.drop('prediction',axis=1)\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# read ZENO_API_KEY from .env file\n",
    "load_dotenv(override=True)\n",
    "\n",
    "# client = zeno_client.ZenoClient(os.getenv(\"ZENO_API_KEY\"))\n",
    "client = zeno_client.ZenoClient('zen_V_CDGaABIxH-D8YbqfPGoY6K2RN9iHkp-YPrbopvDjc')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "project = client.create_project(\n",
    "    name=\"agent_test_0\",\n",
    "    view={\n",
    "        \"data\": {\"type\": \"markdown\"},\n",
    "        \"label\": {\"type\": \"text\"},\n",
    "        \"output\": {\"type\": \"text\"},\n",
    "    },\n",
    "    metrics=[\n",
    "        zeno_client.ZenoMetric(name=\"accuracy\", type=\"mean\", columns=[\"exact_match\",\"action_match\"]),\n",
    "    ],\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "project.upload_dataset(\n",
    "    df, \n",
    "    id_column=\"id\", \n",
    "    data_column=\"observation\", \n",
    "    label_column=\"ground_truth\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# upload system\n",
    "# code_llama = pd.DataFrame(\n",
    "#     {\n",
    "#         \"example_id\": list(range(len(data))),\n",
    "#         \"prediction\": [x[\"prediction\"] for x in data],\n",
    "#         \"correct\": [x[\"ground_truth\"] == x[\"prediction\"] for x in data],\n",
    "#         \"label_line\": [x[\"label_line\"] for x in data],\n",
    "#         \"pred_line\": [x[\"pred_line\"] for x in data],\n",
    "#         \"total_line\": [x[\"total_line\"] for x in data],\n",
    "#         \"label_pos\": [x[\"label_pos\"] for x in data],\n",
    "#         \"pred_pos\": [x[\"pred_pos\"] for x in data],\n",
    "#     }\n",
    "# )\n",
    "code_llama = df.drop('ground_truth', axis=1).drop('observation', axis=1).drop('objective', axis=1).drop('website', axis=1)\n",
    "code_llama = df[['prediction','id']]\n",
    "code_llama\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "project.upload_system(code_llama, name=\"codellama-7b\", id_column=\"id\", output_column=\"prediction\")"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "agent",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.13"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
