{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# Run experiments"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "# releaese; stable\n",
    "import json\n",
    "import os\n",
    "import argparse\n",
    "import subprocess\n",
    "import numpy as np\n",
    "from src.utils import myrepr\n",
    "\n",
    "# Function to create and submit SLURM job scripts\n",
    "def submit_slurm_job(script_path, args, folder, job_name, submit):\n",
    "    outs_folder = os.path.join(folder, \"slurm_outs\")\n",
    "    sh_folder = os.path.join(folder, \"slurm_sh\")\n",
    "    os.makedirs(outs_folder, exist_ok=True)\n",
    "    os.makedirs(sh_folder, exist_ok=True)\n",
    "    slurm_script = os.path.join(sh_folder, f\"{job_name}.sh\")\n",
    "    \n",
    "    # Create SLURM job script\n",
    "    with open(slurm_script, \"w\") as f:\n",
    "        f.write(\"#!/bin/bash\\n\")\n",
    "        f.write(f\"#SBATCH --job-name={job_name}\\n\")\n",
    "        f.write(\"#SBATCH --cpus-per-task=1\\n\")\n",
    "        #f.write('#SBATCH --constraint=\"intel&cascadelake\"\\n')\n",
    "        f.write(\"#SBATCH -N 1\\n\")\n",
    "        f.write(\"#SBATCH --partition=batch\\n\")\n",
    "        f.write(\"#SBATCH --mem=64GB\\n\")\n",
    "        f.write(\"#SBATCH --time=19:00:00\\n\")\n",
    "        f.write(f\"#SBATCH --output={outs_folder}/{job_name}.out\\n\")\n",
    "        f.write(f\"python {script_path} \")\n",
    "        # for arg in args:\n",
    "        #     f.write(f\"{arg} \")\n",
    "        \n",
    "        for arg, value in zip(args[0::2], args[1::2]):\n",
    "            if value != \"\":\n",
    "                f.write(f\"    {arg} {value} \\\\\\n\")    \n",
    "        \n",
    "        f.write(\"\\n\")\n",
    "    if submit:\n",
    "        # Submit the job using sbatch and capture the output\n",
    "        result = subprocess.run([\"sbatch\", slurm_script], capture_output=True, text=True)\n",
    "        \n",
    "        # Print the result of the job submission\n",
    "        if result.returncode == 0:\n",
    "            #print(f\"Job {job_name} submitted successfully: {result.stdout.strip()}\")\n",
    "            print(f\"{job_name}\")\n",
    "        else:\n",
    "            print(f\"Job {job_name} submission failed: {result.stderr.strip()}\")\n",
    "\n",
    "# Function to properly format list arguments\n",
    "def format_list_args(args):\n",
    "\n",
    "    list_args = [\n",
    "        \"--stop_criteruim_params\",\n",
    "        \"--collectable_metrics\",\n",
    "        \"--computable_params\",\n",
    "        \"--loadable_params\",\n",
    "        \"--loadable_datasets\"\n",
    "    ]\n",
    "    for i in range(len(args)):\n",
    "        if args[i] in list_args:\n",
    "            args[i + 1] = f'\"{args[i + 1]}\"'\n",
    "    return args\n",
    "\n",
    "def process_job_submissions(arrays_dict, submit, exps_to_launch, json_config):\n",
    "    config = json.loads(json_config)\n",
    "    base_args = config[\"base_config\"][\"args\"]\n",
    "    base_args = format_list_args(base_args)\n",
    "    parser = argparse.ArgumentParser(description=\"Submit SLURM jobs with JSON configuration\")\n",
    "    parser.add_argument(\"--folder\", type=str, help=\"Custom folder path to use as the working directory\", default=\"\")\n",
    "    args_namespace = parser.parse_args()\n",
    "    working_directory = os.getcwd()\n",
    "\n",
    "    for conf in config[\"configurations\"]:\n",
    "        if conf[\"name\"] not in exps_to_launch:\n",
    "            continue\n",
    "        exp_conf_args = format_list_args(conf[\"args\"])\n",
    "        \n",
    "        for factor_value in arrays_dict[\"factor_ar\"]:\n",
    "            for num_workers in arrays_dict[\"num_workers_ar\"]:\n",
    "                prob = 1/num_workers\n",
    "                for noise_scale in arrays_dict[\"noise_scale_ar\"]:\n",
    "                    all_conf_args = base_args + exp_conf_args + [\"--factor\", str(factor_value)] + [\"--num_workers\", str(num_workers)] + [\"--noise_scale\", str(noise_scale)] + [\"--prob\", str(prob)]\n",
    "                    loss_func = base_args[base_args.index(\"--loss_func\") + 1]\n",
    "                    step_size = base_args[base_args.index(\"--step_size\") + 1]\n",
    "                    #exp_name = exp_conf_args[exp_conf_args.index(\"--exp_name\") + 1]\n",
    "                    exp_name = conf[\"name\"]\n",
    "                    job_name = f\"{loss_func}_{exp_name}_s{step_size}_nw{num_workers}_nsc{myrepr(noise_scale)}_f{myrepr(factor_value)}\"\n",
    "                    submit_slurm_job(conf[\"program\"], all_conf_args, working_directory, job_name, submit)\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## l1-norm loss"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "\n",
    "# releaese; stable\n",
    "json_config = '''\n",
    "{\n",
    "    \"version\": \"0.2.0\",\n",
    "    \"base_config\": {\n",
    "        \"type\": \"debugpy\",\n",
    "        \"request\": \"launch\",\n",
    "        \"console\": \"integratedTerminal\",\n",
    "        \"justMyCode\": true,\n",
    "        \"args\": [\n",
    "            \"--dataset\", \"synthetic_sparse_zero\",\n",
    "            \"--loss_func\", \"l1_norm\",\n",
    "            \"--regularizer_type\", \"str-cvx\",\n",
    "            \"--sampling\", \"full\",\n",
    "            \"--num_samples\", \"1\",\n",
    "            \"--tol\", \"1e-7\",\n",
    "            \"--la\", \"0\",\n",
    "            \"--dim\", \"1000\",\n",
    "            \"--batchsize\", \"1\",\n",
    "            \n",
    "            \"--use_ray\", \"0\",\n",
    "            \"--is_sparse_dataset\", \"1\",\n",
    "            \"--print_status\", \"1\",\n",
    "            \"--is_grad_comp_init\", \"0\",\n",
    "            \"--PRINT_EVERY\", \"10000\",\n",
    "            \"--SAVE_EVERY\", \"10000000\",\n",
    "            \"--NUM_LAUNCHES\", \"1\",\n",
    "            \"--seeds\", \"1\",\n",
    "            \n",
    "            \"--max_iters\", \"60000\",\n",
    "            \"--step_size\", \"polyak\",\n",
    "            \n",
    "            \"--stop_criteruim_params\", \"['iters', 'func_diff']\",\n",
    "            \"--loadable_datasets\", \"['X', 'y']\",\n",
    "            \"--computable_params\", \"[]\"\n",
    "        ]\n",
    "    },\n",
    "    \"configurations\": [\n",
    "        {\n",
    "            \"name\": \"EF21-P\",\n",
    "            \"program\": \"EF21-P.py\",\n",
    "            \"args\": [\n",
    "                \"--alg_name\", \"EF21-P\",\n",
    "                \"--exp_name\", \"EF21-P\",\n",
    "                \"--compressor\", \"TopK\",\n",
    "                \"--loadable_params\", \"['L_0', 'f_star', 'x_star']\",\n",
    "                \"--collectable_metrics\", \"['iters', 'bits', 'func_diff', 'r-L_0']\"\n",
    "            ]\n",
    "        },\n",
    "        {\n",
    "            \"name\": \"MARINA-P_sameRandK\",\n",
    "            \"program\": \"MARINA-P.py\",\n",
    "            \"args\": [\n",
    "                \"--alg_name\", \"MARINA-P\",\n",
    "                \"--exp_name\", \"MARINA-P\",\n",
    "                \"--compressor\", \"sameRandK\",\n",
    "                \"--loadable_params\", \"['L_0', 'wtL_0', 'f_star', 'x_star']\",\n",
    "                \"--collectable_metrics\", \"['iters', 'bits', 'func_diff','r-L_0,pm', 'r-L_0', 'r-wtL_0', 'r-L_hat', 'r-L_0+r-L_0,pm']\"\n",
    "            ]\n",
    "        },\n",
    "        {\n",
    "            \"name\": \"MARINA-P_indRandK\",\n",
    "            \"program\": \"MARINA-P.py\",\n",
    "            \"args\": [\n",
    "                \"--alg_name\", \"MARINA-P\",\n",
    "                \"--exp_name\", \"MARINA-P\",\n",
    "                \"--compressor\", \"indRandK\",\n",
    "                \"--loadable_params\", \"['L_0', 'wtL_0', 'f_star', 'x_star']\",\n",
    "                \"--collectable_metrics\", \"['iters', 'bits', 'func_diff','r-L_0,pm', 'r-L_0', 'r-wtL_0', 'r-L_hat', 'r-L_0+r-L_0,pm']\"\n",
    "            ]\n",
    "        },\n",
    "        {\n",
    "            \"name\": \"MARINA-P_PermK\",\n",
    "            \"program\": \"MARINA-P.py\",\n",
    "            \"args\": [\n",
    "                \"--alg_name\", \"MARINA-P\",\n",
    "                \"--exp_name\", \"MARINA-P\",\n",
    "                \"--compressor\", \"PermK\",\n",
    "                \"--loadable_params\", \"['L_0', 'wtL_0', 'f_star', 'x_star']\",\n",
    "                \"--collectable_metrics\", \"['iters', 'bits', 'func_diff','r-L_0,pm', 'r-L_0', 'r-wtL_0', 'r-L_hat', 'r-L_0+r-L_0,pm']\"\n",
    "            ]\n",
    "        },\n",
    "        {\n",
    "            \"name\": \"3PCv2-P_sameRandK-TopK\",\n",
    "            \"program\": \"3PCv2-P.py\",\n",
    "            \"args\": [\n",
    "                \"--alg_name\", \"3PCv2-P\",\n",
    "                \"--exp_name\", \"3PCv2-P\",\n",
    "                \"--compressor\", \"sameRandK\",\n",
    "                \"--loadable_params\", \"['L_0', 'wtL_0', 'f_star', 'x_star']\",\n",
    "                \"--collectable_metrics\", \"['iters', 'bits', 'func_diff','r-L_0,pm', 'r-L_0', 'r-wtL_0', 'r-L_hat', 'r-L_0+r-L_0,pm']\"\n",
    "            ]\n",
    "        },\n",
    "        {\n",
    "            \"name\": \"3PCv2-P_indRandK-TopK\",\n",
    "            \"program\": \"3PCv2-P.py\",\n",
    "            \"args\": [\n",
    "                \"--alg_name\", \"3PCv2-P\",\n",
    "                \"--exp_name\", \"3PCv2-P\",\n",
    "                \"--compressor\", \"indRandK\",\n",
    "                \"--loadable_params\", \"['L_0', 'wtL_0', 'f_star', 'x_star']\",\n",
    "                \"--collectable_metrics\", \"['iters', 'bits', 'func_diff','r-L_0,pm', 'r-L_0', 'r-wtL_0', 'r-L_hat', 'r-L_0+r-L_0,pm']\"\n",
    "            ]\n",
    "        } \n",
    "    ]\n",
    "}\n",
    "'''\n",
    "\n",
    "submit = 1\n",
    "\n",
    "exps_to_launch = [\"MARINA-P_sameRandK\", \"MARINA-P_indRandK\", \"MARINA-P_PermK\"]\n",
    "\n",
    "\n",
    "#exps_to_launch = [\"3PCv2-P_sameRandK-TopK\", \"3PCv2-P_indRandK-TopK\"]\n",
    "#exps_to_launch = [\"MARINA-P_indRandK\"]\n",
    "#exps_to_launch = [\"MARINA-P_sameRandK\"]\n",
    "\n",
    "exps_to_launch = [\"EF21-P\"]\n",
    "\n",
    "arrays_dict = { \n",
    "    #\"factor_ar\": [1.0],\n",
    "    #\"noise_scale_ar\": np.array([0.1], dtype=float),\n",
    "    #\"num_workers_ar\": np.array([10], dtype=int),\n",
    "    \n",
    "    \"factor_ar\": 2**np.arange(-6, 6).astype(float),\n",
    "    \"noise_scale_ar\": np.array([0.1, 1, 10], dtype=float),\n",
    "    #\"noise_scale_ar\": np.array([0.01, 100], dtype=float),\n",
    "    \"num_workers_ar\": np.array([10, 100], dtype=int),\n",
    "    #\"factor_ar\":4**np.arange(-3,-2).astype(float),\n",
    "    #\"noise_scale_ar\": np.array([0.1, 1], dtype=float),\n",
    "    #\"num_workers_ar\": np.array([100], dtype=int)\n",
    "}\n",
    "\n",
    "process_job_submissions(arrays_dict, submit, exps_to_launch, json_config)\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "!rm -r slurm_sh/*EF21-P*.sh"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "!rm -r slurm_outs/*.out\n",
    "!rm -r slurm_sh/*.sh"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%%bash\n",
    "squeue -u <username> --format=\"%10i %9P %85j %8u %1t %4M %.6D  %10M %10l %8Q %7m\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%%bash\n",
    "scancel -u <username>"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "%%bash\n",
    "sacct --starttime=2024-10-02 --endtime=2024-10-03 --format=JobID,JobName%50,Start,End,Elapsed,State"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "!tail -n 20 slurm_outs/*_EF21-P*.out"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "!tail -n 20 slurm_outs/*_MARINA-P_sameRandK*.out\n"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "pyten",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.13"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
