{"cells":[{"cell_type":"code","execution_count":null,"metadata":{"id":"T4SKN9pxCYdr"},"outputs":[],"source":["!pip install -q -U google-generativeai"]},{"cell_type":"code","execution_count":null,"metadata":{"id":"lCwqaG-xn0Z6"},"outputs":[],"source":["import pathlib\n","import textwrap\n","import os\n","import csv\n","import pandas as pd\n","import time\n","import google.generativeai as genai\n","\n","GOOGLE_API_KEY= '<<ENTER YOUT API KEY>>'\n","\n","genai.configure(api_key=GOOGLE_API_KEY)"]},{"cell_type":"code","execution_count":null,"metadata":{"id":"hlOvw_W1n8d1"},"outputs":[],"source":["df = pd.read_csv('./result_ASR.csv')\n","original = df['transcription']\n","beam_result1 = df['whisper_base_predSE'] # The 1st candidate for ASR, which contains an error\n","beam_result2 = df['whisper_small_predSE'] # The 2nd candidate for ASR, which contains an error"]},{"cell_type":"code","execution_count":null,"metadata":{"colab":{"base_uri":"https://localhost:8080/","height":1000},"executionInfo":{"elapsed":3983907,"status":"ok","timestamp":1723389748872,"user":{"displayName":"현시은","userId":"00296812091026401646"},"user_tz":-540},"id":"0-N6x08in-FV","outputId":"1ea25ae6-1bd6-4a3f-cf97-0027fb2c25ed"},"outputs":[],"source":["from requests.exceptions import ConnectionError\n","\n","gemini_result = []\n","max_retries = 3\n","\n","for i in range(0, len(original)):\n","    instruction = \"You are an AI model that corrects Automatic Speech Recognition results and converts them into LaTeX. Let's think step by step. I will give you two candidates from the Automatic Speech Recognition results. Based on these two ASR results, make the necessary corrections and then output the corresponding LaTeX code for the formula. I will show you one example, so refer to it and convert it into LaTeX. You just have to tell me the answer. Don't tell me anything else, just tell me the LaTeX code.\"\n","    prompt = f\"\"\"\n","    Input : a plus seven y plus ten z equals z || a plus 7y plus f z equals 0\n","    Output : $ a + 7y + 10z = 0 $\n","    Input : {beam_result1[i]} || {beam_result2[i]}\n","    Output : (Tell me Your answer.)\n","    \"\"\"\n","    model = genai.GenerativeModel('gemini-pro')\n","    full_prompt = f\"{instruction}\\n{prompt}\"\n","    # model call\n","    for attempt in range(max_retries):\n","        try:\n","            response = model.generate_content(full_prompt)\n","            result = response.text\n","            gemini_result.append(result)\n","            print(f\"{result}\")\n","            break  # If successful, stop iterating.\n","        except ConnectionError as e:\n","            print(f\"ConnectionError occurred on attempt {attempt + 1}: {e}\")\n","            if attempt < max_retries - 1:\n","                time.sleep(5)  # Retry in 5 seconds\n","            else:\n","                print(f\"Failed after {max_retries} attempts.\")\n","                gemini_result.append(\"<ERROR>\")  # If error occurs, add <ERROR> to the result.\n","        except Exception as e:\n","            print(f\"An unexpected error occurred: {e}\")\n","            if attempt < max_retries - 1:\n","                time.sleep(5)  # Retry in 5 seconds\n","            else:\n","                print(f\"Failed after {max_retries} attempts.\")\n","                gemini_result.append(\"<ERROR>\")  # If error occurs, add <ERROR> to the result.\n","    time.sleep(1)"]},{"cell_type":"code","execution_count":null,"metadata":{},"outputs":[],"source":["df[\"gemini_LaTeX_result\"] = gemini_result\n","df.to_csv('gemini_LaTeX_result.csv', index=False)"]}],"metadata":{"colab":{"provenance":[]},"kernelspec":{"display_name":"Python 3","name":"python3"},"language_info":{"codemirror_mode":{"name":"ipython","version":3},"file_extension":".py","mimetype":"text/x-python","name":"python","nbconvert_exporter":"python","pygments_lexer":"ipython3","version":"3.10.13"}},"nbformat":4,"nbformat_minor":0}
