{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "601e2920",
   "metadata": {},
   "outputs": [],
   "source": [
    "import csv\n",
    "import pandas as pd"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "id": "827a47b0",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Absolute path of the Excel workbook that the next cell loads with pd.read_excel.\n",
    "file_path = \"/fs-computility/ai4phys/shared/caipengxiang/variables.xlsx\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "id": "53662788",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Index(['碱', '溶剂', '钯', 'Ligand'], dtype='object')"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Read the workbook at file_path into a DataFrame.\n",
    "df = pd.read_excel(file_path)\n",
    "# Display the column labels; the saved output shows four columns whose Chinese\n",
    "# headers translate to base (碱), solvent (溶剂) and palladium (钯), plus 'Ligand'.\n",
    "df.columns\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "dc456da8",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Map each column label to a plain Python list of that column's values.\n",
    "# NOTE(review): data_dict is not referenced by any later cell visible in this notebook.\n",
    "data_dict = df.to_dict(orient='list')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "d317fd2e",
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "\n",
    "# Path of the JSON file to load.\n",
    "json_path = \"/fs-computility/ai4phys/shared/caipengxiang/suzuki_partition.json\"\n",
    "\n",
    "# Open inside a context manager so the handle is closed as soon as parsing\n",
    "# finishes instead of lingering until garbage collection. JSON text is UTF-8\n",
    "# per RFC 8259, so decode explicitly rather than with the locale default.\n",
    "# `json_file` holds the parsed object (not a file handle); the next cell\n",
    "# iterates over it with .items().\n",
    "with open(json_path, \"r\", encoding=\"utf-8\") as fh:\n",
    "    json_file = json.load(fh)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "id": "d193daad",
   "metadata": {},
   "outputs": [],
   "source": [
    "import random\n",
    "\n",
    "# For every key in json_file, flatten its groups into a single list and\n",
    "# shuffle that list. No seed is set in this cell, so the resulting order\n",
    "# differs from run to run.\n",
    "output = {}\n",
    "for name, groups in json_file.items():\n",
    "    merged = [entry for group in groups for entry in group]\n",
    "    # Shuffle once after all groups are merged; reshuffling after every\n",
    "    # extend() repeats work without changing the distribution of the result.\n",
    "    random.shuffle(merged)\n",
    "    output[name] = merged"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "id": "e6395abb",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'ligand': ['Xantphos',\n",
       "  'dtbpf',\n",
       "  'P(Ph)3',\n",
       "  'XPhos',\n",
       "  'P(tBu)3',\n",
       "  'CataCXium A',\n",
       "  'P(Cy)3',\n",
       "  'dppf',\n",
       "  'nothing',\n",
       "  'AmPhos',\n",
       "  'SPhos',\n",
       "  'P(o-Tol)3'],\n",
       " 'base': ['KOH',\n",
       "  'nothing',\n",
       "  'Et3N',\n",
       "  'K3PO4',\n",
       "  'LiOtBu',\n",
       "  'CsF',\n",
       "  'NaOH',\n",
       "  'NaHCO3'],\n",
       " 'solvent': ['MeOH', 'DMF', 'MeOH/H2O_V2 9:1', 'THF', 'THF_V2', 'MeCN']}"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "output"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "id": "e49984e8",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Write the shuffled lists to disk. The context manager guarantees the file is\n",
    "# flushed and closed when the block exits; ensure_ascii=False keeps non-ASCII\n",
    "# characters unescaped in the UTF-8 output.\n",
    "with open(\"./dry_sum_suzuki.json\", \"w\", encoding='utf-8') as fh:\n",
    "    json.dump(output, fh, indent=2, ensure_ascii=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "d7e95d8e",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "vllm082",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.12"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
