{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 流水线生成"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "\"\"\" 引入root目录 \"\"\"\n",
    "\n",
    "from pathlib import Path\n",
    "\n",
    "# 获取当前工作目录\n",
    "current_dir = Path.cwd()\n",
    "root_dir = Path(\"/home/john/svc/muer-svc-whisper-sovits-svc\")\n",
    "# root_dir = current_dir.parent.parent\n",
    "print(f\"Root dir: {root_dir}\")\n",
    "import sys\n",
    "\n",
    "sys.path.append(str(root_dir))\n",
    "\"\"\"\"\"\" \"\"\"\"\"\" \"\"\"\"\"\" \"\"\"\"\"\" \"\"\"\"\"\"\n",
    "import os\n",
    "import datetime\n",
    "import subprocess\n",
    "\n",
    "\n",
    "def generate_test(\n",
    "    model_name=\"whisper_vits_svc_spk_change\",\n",
    "    speaker_dir=\"seen\",\n",
    "    content_dir=\"h_m_l\",\n",
    "    ckpt_name=\"sovits_from_pretrained_origin\",\n",
    "    ckpt_epoch=None,\n",
    "):\n",
    "    model_dir = root_dir / \"models\" / model_name\n",
    "    os.chdir(model_dir)\n",
    "\n",
    "    now_time = datetime.datetime.now().strftime(\"%m-%d_%H\")\n",
    "\n",
    "    # speaker数据目录为data/test_data\n",
    "    spk_data_dir = root_dir.parent / \"data/test_data/speaker\" / speaker_dir\n",
    "    content_data_dir = root_dir.parent / \"data/test_data/content\" / content_dir\n",
    "    out_data_dir = (\n",
    "        root_dir.parent\n",
    "        / \"data/test_data/output\"\n",
    "        / f\"{model_name}_{speaker_dir}_{content_dir}_{ckpt_name}_{ckpt_epoch}\"\n",
    "    )\n",
    "    out_data_dir.mkdir(exist_ok=True)\n",
    "    wav_dir = out_data_dir\n",
    "    tmp_dir = content_data_dir / \"tmp\"\n",
    "    wav_dir.mkdir(exist_ok=True)\n",
    "    tmp_dir.mkdir(exist_ok=True)\n",
    "    ckpt_dir = model_dir / \"chkpt\" / ckpt_name\n",
    "    # print(f\"Model dir: {model_dir} Ckpt dir: {ckpt_dir}\")\n",
    "    for model_path in ckpt_dir.glob(\"*.pt\"):\n",
    "        if ckpt_epoch and ckpt_epoch not in model_path.stem:\n",
    "            # print(f\"Skip {model_path}\")\n",
    "            continue\n",
    "        print(f\"Infering {model_path}\")\n",
    "        model_path = model_path.relative_to(model_dir)\n",
    "        for spk_file in spk_data_dir.glob(\"*.wav\"):\n",
    "            for content_file in content_data_dir.glob(\"*.wav\"):\n",
    "                command = [\n",
    "                    \"python\",\n",
    "                    \"svc_inference.py\",\n",
    "                    \"--config\",\n",
    "                    f\"configs/{ckpt_name}.yaml\",\n",
    "                    \"--model\",\n",
    "                    str(model_path),\n",
    "                    \"--spk\",\n",
    "                    str(spk_file),\n",
    "                    \"--wave\",\n",
    "                    str(content_file),\n",
    "                    \"--out\",\n",
    "                    str(wav_dir),\n",
    "                    \"--shift\",\n",
    "                    \"0\",\n",
    "                    \"--ppg\",\n",
    "                    str(tmp_dir / f\"{content_file.stem}.ppg.npy\"),\n",
    "                    \"--vec\",\n",
    "                    str(tmp_dir / f\"{content_file.stem}.vec.npy\"),\n",
    "                    \"--pit\",\n",
    "                    str(tmp_dir / f\"{content_file.stem}.pit.csv\"),\n",
    "                ]\n",
    "                subprocess.run(command)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "test_list = [\n",
    "    # model_name, speaker_dir, content_dir, ckpt_name, ckpt_epoch\n",
    "    (\"whisper_vits_svc\", \"seen\", \"h_m_l\", \"sovits_from_pretrained_origin\", \"100\"),\n",
    "    (\n",
    "        \"whisper_vits_svc\",\n",
    "        \"seen\",\n",
    "        \"h_m_l\",\n",
    "        \"sovits_from_pretrained_origin_decoder_only\",\n",
    "        \"100\",\n",
    "    ),\n",
    "    (\n",
    "        \"whisper_vits_svc\",\n",
    "        \"seen\",\n",
    "        \"h_m_l\",\n",
    "        \"sovits_test2\",\n",
    "        \"175\",\n",
    "    ),\n",
    "    (\n",
    "        \"whisper_vits_svc_spk_change\",\n",
    "        \"seen\",\n",
    "        \"h_m_l\",\n",
    "        \"sovits5.0\",\n",
    "        \"110\",\n",
    "    ),\n",
    "    (\n",
    "        \"whisper_vits_svc_without_ppg\",\n",
    "        \"seen\",\n",
    "        \"h_m_l\",\n",
    "        \"sovits_withoutppg\",\n",
    "        \"100\",\n",
    "    ),\n",
    "]\n",
    "\n",
    "for test in test_list:\n",
    "    generate_test(*test)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "test_list = [\n",
    "    # model_name, speaker_dir, content_dir, ckpt_name, ckpt_epoch\n",
    "    (\n",
    "        \"whisper_vits_svc_without_ppg\",\n",
    "        \"unseen\",\n",
    "        \"h_m_l\",\n",
    "        \"sovits_withoutppg\",\n",
    "        \"100\",\n",
    "    ),\n",
    "    (\"whisper_vits_svc\", \"unseen\", \"h_m_l\", \"sovits_from_pretrained_origin\", \"100\"),\n",
    "    (\n",
    "        \"whisper_vits_svc_spk_change\",\n",
    "        \"unseen\",\n",
    "        \"h_m_l\",\n",
    "        \"sovits5.0\",\n",
    "        \"110\",\n",
    "    ),\n",
    "]\n",
    "\n",
    "for test in test_list:\n",
    "    generate_test(*test)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "test_list = [\n",
    "    # model_name, speaker_dir, content_dir, ckpt_name, ckpt_epoch\n",
    "    (\"whisper_vits_svc_kmeans\", \"seen\", \"h_m_l\", \"sovits_kmeans900_tokenize\", \"250\"),\n",
    "    (\"whisper_vits_svc_kmeans\", \"unseen\", \"h_m_l\", \"sovits_kmeans900_tokenize\", \"250\"),\n",
    "]\n",
    "\n",
    "for test in test_list:\n",
    "    generate_test(*test)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "test_list = [\n",
    "    # model_name, speaker_dir, content_dir, ckpt_name, ckpt_epoch\n",
    "    (\n",
    "        \"whisper_vits_svc_without_ppg\",\n",
    "        \"seen\",\n",
    "        \"h_m_l\",\n",
    "        \"sovits_without_hubert\",\n",
    "        \"100\",\n",
    "    ),\n",
    "    (\n",
    "        \"whisper_vits_svc_without_ppg\",\n",
    "        \"unseen\",\n",
    "        \"h_m_l\",\n",
    "        \"sovits_without_hubert\",\n",
    "        \"100\",\n",
    "    ),\n",
    "]\n",
    "\n",
    "for test in test_list:\n",
    "    generate_test(*test)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "test_list = [\n",
    "    # model_name, speaker_dir, content_dir, ckpt_name, ckpt_epoch\n",
    "    (\n",
    "        \"whisper_vits_svc_without_classifier\",\n",
    "        \"seen\",\n",
    "        \"h_m_l\",\n",
    "        \"sovits_without_classifier\",\n",
    "        \"50\",\n",
    "    ),\n",
    "    (\n",
    "        \"whisper_vits_svc_without_classifier\",\n",
    "        \"unseen\",\n",
    "        \"h_m_l\",\n",
    "        \"sovits_without_classifier\",\n",
    "        \"50\",\n",
    "    ),\n",
    "]\n",
    "\n",
    "for test in test_list:\n",
    "    generate_test(*test)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "test_list = [\n",
    "    # model_name, speaker_dir, content_dir, ckpt_name, ckpt_epoch\n",
    "    (\n",
    "        \"whisper_vits_svc_kmeans\",\n",
    "        \"seen\",\n",
    "        \"h_m_l\",\n",
    "        \"sovits_kmeans900_tokenize_without_ppg\",\n",
    "        \"575\",\n",
    "    ),\n",
    "    (\n",
    "        \"whisper_vits_svc_kmeans\",\n",
    "        \"unseen\",\n",
    "        \"h_m_l\",\n",
    "        \"sovits_kmeans900_tokenize_without_ppg\",\n",
    "        \"575\",\n",
    "    ),\n",
    "]\n",
    "\n",
    "for test in test_list:\n",
    "    generate_test(*test)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "test_list = [\n",
    "    # model_name, speaker_dir, content_dir, ckpt_name, ckpt_epoch\n",
    "    (\n",
    "        \"whisper_vits_svc_without_ppg\",\n",
    "        \"seen\",\n",
    "        \"h_m_l\",\n",
    "        \"sovits_contentvec_256\",\n",
    "        \"350\",\n",
    "    ),\n",
    "    (\n",
    "        \"whisper_vits_svc_without_ppg\",\n",
    "        \"unseen\",\n",
    "        \"h_m_l\",\n",
    "        \"sovits_contentvec_256\",\n",
    "        \"350\",\n",
    "    ),\n",
    "    (\n",
    "        \"whisper_vits_svc_without_ppg\",\n",
    "        \"seen\",\n",
    "        \"h_m_l\",\n",
    "        \"sovits_contentvec_768\",\n",
    "        \"875\",\n",
    "    ),\n",
    "    (\n",
    "        \"whisper_vits_svc_without_ppg\",\n",
    "        \"unseen\",\n",
    "        \"h_m_l\",\n",
    "        \"sovits_contentvec_768\",\n",
    "        \"875\",\n",
    "    ),\n",
    "]\n",
    "\n",
    "for test in test_list:\n",
    "    generate_test(*test)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "test_list = [\n",
    "    # model_name, speaker_dir, content_dir, ckpt_name, ckpt_epoch\n",
    "    (\"whisper_vits_svc\", \"farest\", \"zjl\", \"sovits_from_pretrained_origin\", \"100\"),\n",
    "    (\n",
    "        \"whisper_vits_svc_spk_change\",\n",
    "        \"farest\",\n",
    "        \"zjl\",\n",
    "        \"sovits_spk\",\n",
    "        \"25\",\n",
    "    ),\n",
    "    (\n",
    "        \"whisper_vits_svc_spk_change\",\n",
    "        \"farest\",\n",
    "        \"zjl\",\n",
    "        \"sovits_spk\",\n",
    "        \"190\",\n",
    "    ),\n",
    "]\n",
    "\n",
    "for test in test_list:\n",
    "    generate_test(*test)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "test_list = [\n",
    "    # model_name, speaker_dir, content_dir, ckpt_name, ckpt_epoch\n",
    "    # (\"whisper_vits_svc\", \"farest\", \"h_m_l\", \"sovits_1700h\", \"80\"),\n",
    "    # (\"whisper_vits_svc\", \"seen\", \"h_m_l\", \"sovits_1700h\", \"80\"),\n",
    "    # (\"whisper_vits_svc\", \"unseen\", \"test_content_data_one\", \"sovits_1700h\", \"80\"),\n",
    "    # (\"whisper_vits_svc\", \"ly\", \"h_m_l\", \"sovits_1700h\", \"80\"),\n",
    "]\n",
    "\n",
    "for test in test_list:\n",
    "    generate_test(*test)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "test_list = [\n",
    "    # model_name, speaker_dir, content_dir, ckpt_name, ckpt_epoch\n",
    "    # (\"whisper_vits_svc_spk_change\", \"farest\", \"h_m_l\", \"sovits_spk_1700h\", \"8\"),\n",
    "    # (\"whisper_vits_svc_spk_change\", \"seen\", \"h_m_l\", \"sovits_spk_1700h\", \"8\"),\n",
    "    # (\"whisper_vits_svc_spk_change\", \"unseen\", \"h_m_l\", \"sovits_spk_1700h\", \"8\"),\n",
    "    # (\n",
    "    #     \"whisper_vits_svc_spk_change\",\n",
    "    #     \"unseen\",\n",
    "    #     \"test_content_data_one\",\n",
    "    #     \"sovits_spk_1700h\",\n",
    "    #     \"8\",\n",
    "    # ),\n",
    "    # (\"whisper_vits_svc_spk_change\", \"ly\", \"h_m_l\", \"sovits_spk_1700h\", \"8\"),\n",
    "    # (\n",
    "    #     \"whisper_vits_svc_spk_change\",\n",
    "    #     \"zj\",\n",
    "    #     \"h_m_l\",\n",
    "    #     \"sovits_spk_1700h_finetune_sing\",\n",
    "    #     \"19\",\n",
    "    # ),\n",
    "    # (\n",
    "    #     \"whisper_vits_svc_spk_change\",\n",
    "    #     \"zj\",\n",
    "    #     \"h_m_l\",\n",
    "    #     \"sovits_spk_1700h_finetune_read\",\n",
    "    #     \"19\",\n",
    "    # ),\n",
    "    (\n",
    "        \"whisper_vits_svc_spk_change\",\n",
    "        \"zj\",\n",
    "        \"test_content_data_one\",\n",
    "        \"sovits_spk_1700h_finetune_sing\",\n",
    "        \"19\",\n",
    "    ),\n",
    "    (\n",
    "        \"whisper_vits_svc_spk_change\",\n",
    "        \"zj\",\n",
    "        \"test_content_data_one\",\n",
    "        \"sovits_spk_1700h_finetune_read\",\n",
    "        \"19\",\n",
    "    ),\n",
    "]\n",
    "\n",
    "for test in test_list:\n",
    "    generate_test(*test)"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "diffsinger",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.14"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
