{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [],
   "source": [
    "from datasets import load_dataset, Dataset\n",
    "import pandas as pd\n",
    "ds = load_dataset(\"HuggingFaceH4/ultrafeedback_binarized\", split=\"train_prefs\")\n",
    "def get_instruct_response(item):\n",
    "    # item[\"instruction\"] = item['chosen'][0][\"content\"]\n",
    "    item[\"response\"] = item['chosen'][1][\"content\"]\n",
    "    return item\n",
    "ds = ds.map(get_instruct_response, batch_size=1024, num_proc=8)\n",
    "export_data = ds.select_columns([\"prompt\", \"response\"])\n",
    "# export_data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from gpt4o import Openai, API_INFOS\n",
    "oai_clients = Openai(\n",
    "    apis=API_INFOS\n",
    ")\n",
    "res = oai_clients.get_response(\"对于LLM生成的文本，将其以markdown的格式进行渲染，从文本美学观感的角度看，对于文本美学观感比较重要的因素有哪些？\")\n",
    "from text2img import text_to_image\n",
    "text_to_image(text=res, output_image=\"gpt4o.png\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "response_1 = export_data['response'][0]\n",
    "response_10 = export_data['response'][9]\n",
    "# print(response_10)\n",
    "# response_10_html = markdown_to_html(response_10)\n",
    "# with open(\"response_10_2.html\", 'w') as f:\n",
    "#     # f.write(\"\\n\")\n",
    "#     f.write(response_10_html)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "<!-- pandoc -f markdown -t html5 response10.md -o output.html -c github-pandoc.css\n",
    "pandoc response10.md -o output.html -c style.css\n",
    "pandoc -f markdown response10.md -o output.html -c github-pandoc.css\n",
    "pandoc -s -c github-pandoc.css response10.md -o output2.html --self-contained\n",
    "pandoc -s -c style2.css response10.md -o output10.html --self-contained\n",
    "pandoc -s -c style.css response10.md -o output10.html --self-contained -->"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from text2img import text_to_image\n",
    "for i in range(10):\n",
    "    output_path = f\"output_{i}.png\"\n",
    "    text = export_data[\"response\"][i]\n",
    "    text_to_image(text, output_path, size=(700, 1020))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from text2img import text_to_image\n",
    "output_path = \"output.png\"\n",
    "text = response_10\n",
    "text_to_image(text, output_path)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_data():\n",
    "    ds = load_dataset(\"HuggingFaceH4/ultrafeedback_binarized\", split=\"train_prefs\")\n",
    "    def get_instruct_response(item):\n",
    "        # item[\"instruction\"] = item['chosen'][0][\"content\"]\n",
    "        item[\"response\"] = item['chosen'][1][\"content\"]\n",
    "        return item\n",
    "    ds = ds.map(get_instruct_response, batch_size=1024, num_proc=8)\n",
    "    export_data = ds.select_columns([\"prompt\", \"response\"])\n",
    "    return export_data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# [{for item in ds['rejected'][0][1]['content']]\n",
    "temp_data = data\n",
    "# temp_ds = ds.select(range(10))\n",
    "for i, item in enumerate(ds):\n",
    "    # print(item['rejected'])\n",
    "    # index=item['index']\n",
    "    temp_data[i]['rejected'] = item['rejected'][1]['content']\n",
    "    temp_data[i]['instruct'] = item['prompt']\n",
    "temp_data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from utils import read_jsonl\n",
    "import json\n",
    "data = read_jsonl(\"revised_data/output_sorted.jsonl\")\n",
    "not_revised = [item['index'] for item in data if item['revised_text'] == '']\n",
    "# datalen\n",
    "data\n",
    "indices = set([item['index'] for item in data])\n",
    "original_indices = set(range(export_data.shape[0]))\n",
    "print(f\"index complete: {original_indices - indices}\")\n",
    "null_response_indices = [item['index'] for item in data if item['gpt_answer'].strip() == '']\n",
    "null_revised_indices = [item['index'] for item in data if item['revised_text'].strip() == '']\n",
    "noneed_revised_indices = [item['index'] for item in data if item['does_it_need_modification'].strip() == 'N']\n",
    "same_revised_text_indices = [item['index'] for item in data if item['response'].strip() == item['revised_text'].strip()]\n",
    "# print(len(null_response))\n",
    "# print(len(not_revised))\n",
    "print(f\"null_response_indices:{len(null_response_indices)}\")\n",
    "print(f\"null_revised_indices:{len(null_revised_indices)}\")\n",
    "print(f\"noneed_revised_indices:{len(noneed_revised_indices)}\")\n",
    "print(f\"same_revised_text_indices:{len(same_revised_text_indices)}\")\n",
    "# 使用集合的交集操作  \n",
    "indices_to_discard  = set(null_response_indices) | set(null_revised_indices) | set(noneed_revised_indices) | set(same_revised_text_indices)    \n",
    "indices_to_discard = list(indices_to_discard)\n",
    "print(f\"indices_to_discard: {len(indices_to_discard)}\")\n",
    "temp_data = data\n",
    "# temp_ds = ds.select(range(10))\n",
    "for i, item in enumerate(ds):\n",
    "    # print(item['rejected'])\n",
    "    # index=item['index']\n",
    "    temp_data[i]['rejected'] = item['rejected'][1]['content']\n",
    "    temp_data[i]['instruct'] = item['prompt']\n",
    "    temp_data[i]['chosen'] = item['chosen']\n",
    "revised_data = [item for item in temp_data if item[\"index\"] not in indices_to_discard]\n",
    "print(f\"length of revised data: {len(revised_data)}\")\n",
    "textual_aesthetics_chosen = [{\"prompt\": item[\"prompt\"], \"chosen\": item[\"revised_text\"], \"rejected\": item[\"response\"]} for item in revised_data]\n",
    "with open(\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_chosen.json\", 'w') as f:\n",
    "    json.dump(textual_aesthetics_chosen, f, indent=4)\n",
    "textual_aesthetics_rejected = [{\"prompt\": item[\"prompt\"], \"chosen\": item[\"revised_text\"], \"rejected\": item[\"rejected\"]} for item in revised_data]\n",
    "with open(\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_rejected.json\", 'w') as f:\n",
    "    json.dump(textual_aesthetics_rejected, f, indent=4)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "print(textual_aesthetics_chosen[:3])\n",
    "print(textual_aesthetics_rejected[:3])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "temp_data = data\n",
    "# temp_ds = ds.select(range(10))\n",
    "for i, item in enumerate(ds):\n",
    "    # print(item['rejected'])\n",
    "    # index=item['index']\n",
    "    temp_data[i]['rejected'] = item['rejected'][1]['content']\n",
    "    temp_data[i]['instruct'] = item['prompt']\n",
    "    temp_data[i]['chosen'] = item['chosen']\n",
    "# temp_data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "revised_data = [item for item in temp_data if item[\"index\"] not in indices_to_discard]\n",
    "revised_data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "revised_data = [item for item in data if item[\"index\"] not in indices_to_discard]\n",
    "revised_data_indices = [item['index'] for item in data if item[\"index\"] not in indices_to_discard]\n",
    "len(revised_data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "textual_aesthetics_chosen = [{\"prompt\": item[\"prompt\"], \"chosen\": item[\"revised_text\"], \"rejected\": item[\"response\"]} for item in revised_data]\n",
    "import json\n",
    "with open(\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_chosen.json\", 'w') as f:\n",
    "    json.dump(textual_aesthetics_chosen, f, indent=4)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "with open(\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_chosen.json\", 'w') as f:\n",
    "    json.dump(textual_aesthetics_chosen, f, indent=4)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "same_revised_text_indices = [item['index'] for item in data if item['response'].strip() == item['revised_text'].strip()]\n",
    "same_revised_text_indices"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "data = read_jsonl(\"revised_data/output_retry.jsonl\")\n",
    "null_response = [item['index'] for item in data if item['gpt_answer'] == '']\n",
    "not_revised = [item['revised_text'] for item in data if item['revised_text'] == '']\n",
    "print(len(null_response))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "data = read_jsonl(\"revised_data/output_retry.jsonl\")\n",
    "null_response = [item['index'] for item in data if item['gpt_answer'] == '']\n",
    "not_revised = [item['revised_text'] for item in data if item['revised_text'] == '']\n",
    "print(len(null_response))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_instruct_response(item):\n",
    "    # item[\"instruction\"] = item['chosen'][0][\"content\"]\n",
    "    item[\"response\"] = item['chosen'][1][\"content\"]\n",
    "    return item\n",
    "ds = ds.map(get_instruct_response, batch_size=1024, num_proc=8)\n",
    "export_data = ds.select_columns([\"prompt\", \"response\"])\n",
    "export_data"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from gpt4o import Openai, API_INFOS\n",
    "client = Openai(apis=API_INFOS)\n",
    "ans = client.get_response(\"你是gpt几？\", system=\"you are gpt2.5, a helpful chat assisstant\")\n",
    "print(ans)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "我需要写一个prompt，让gpt帮我将LLM对于给定instruction生成的文本在文本美学方面进行修改的prompt，以下是我写的一个中文的system_template，对于这个template，如何让gpt更好的完成我的任务，给出修改意见和修改后的英语的system_template\n",
    "system_template = \\\n",
    "\"\"\"请扮演一个文本改写者来改写LLM(Large Language Model)生成的文本，使其更具有文本美学。你的任务是对于提供的用户instruction和一个LLM生成的答案，你从文本美学的角度去思考这个答案是否合理，是否需要修改,然后给出修改的文本。\n",
    "*Format*\n",
    "文本美学分析:\n",
    "[文本美学分析]\n",
    "是否需要修改:[Y/N]\n",
    "修改后的文本：\n",
    "[修改后的文本]\n",
    "\"\"\""
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": []
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "我需要写一个prompt，让gpt帮我将LLM对于给定instruction生成的文本在文本美学方面进行修改的prompt,主要从文本的排版和布局上对文本美观程度进行优化，例如段落长短、缩进、标题、列表、markdown形式的加粗、斜体、代码块，这些需要根据文本类型的需要来适当的修改，也可以添加一些其他方面的对文本美学的要求。帮我给出一些在观感上文本美学的构成要素，融入到prompt中。以下是我写的一个system template 和user template，对于这个template，如何让gpt更好的完成我的任务，给出修改意见和修改后的英语的template\n",
    "system_template = \\\n",
    "\"\"\"You are tasked with acting as a text rewriter to enhance the aesthetic quality of text generated by a Large Language Model (LLM). Your job is to evaluate the provided user instruction and the LLM-generated response from an aesthetic perspective, determine whether the text needs modification, and then provide the revised text if necessary.   \n",
    "    \n",
    "*Format*  \n",
    "Textual Aesthetic Analysis: [Your analysis]  \n",
    "Does it need modification: [Y/N]  \n",
    "Revised Text: [Your revised text, if applicable]  \n",
    "\"\"\"  \n",
    "user_template = \\\n",
    "\"\"\"### User Instruction:\n",
    "{instruction}\n",
    "\n",
    "### Answer\n",
    "{completition}\n",
    "\n",
    "Your task is to:  \n",
    "1. Analyze the LLM-generated response from a textual aesthetic perspective.  \n",
    "2. Determine whether the text needs modification.  \n",
    "3. Provide a revised version of the text if necessary.  \n",
    "   \n",
    "*Format*  \n",
    "Textual Aesthetic Analysis: [Your analysis]  \n",
    "Does it need modification: [Y/N]  \n",
    "Revised Text: [Your revised text, if applicable] \n",
    "\"\"\""
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "system_template = \\\n",
    "\"\"\"You are tasked with acting as a text rewriter to enhance the aesthetic quality of text generated by a Large Language Model (LLM). Your job is to evaluate the provided user instruction and the LLM-generated response from an aesthetic perspective, determine whether the text needs modification, and then provide the revised text if necessary.   \n",
    "  \n",
    "Consider the following aspects of textual aesthetics:  \n",
    "- **Fluency**: Is the text smooth and easy to read?  \n",
    "- **Vocabulary**: Are the words used varied and appropriate?  \n",
    "- **Sentence Structure**: Are the sentences well-constructed and rhythmically balanced?  \n",
    "- **Imagery and Tone**: Does the text evoke vivid images and maintain a consistent tone?  \n",
    "  \n",
    "*Format*  \n",
    "Textual Aesthetic Analysis: [Your analysis]  \n",
    "Does it need modification: [Y/N]  \n",
    "Revised Text: [Your revised text, if applicable]  \n",
    "\"\"\"  "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from text2img import text_to_image\n",
    "from utils import read_jsonl\n",
    "revised_data = read_jsonl(\"revised_data/output_sorted.jsonl\")\n",
    "revised_data\n",
    "for item in revised_data:\n",
    "    index = item[\"index\"]\n",
    "    output_img_original = f\"output_original_{index}.png\"\n",
    "    text_to_image(item[\"response\"], output_img_original, save_dir=\"original_response\", temp_dir=\"original_temp\")\n",
    "    output_img = f\"output_{index}.png\"\n",
    "    text_to_image(item[\"gpt_answer\"], output_img, save_dir=\"revised_response\", temp_dir=\"revised_temp\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from text2img import text_to_image  \n",
    "from utils import read_jsonl  \n",
    "import concurrent.futures  \n",
    "  \n",
    "def process_item(item):  \n",
    "    index = item[\"index\"]  \n",
    "    output_img_original = f\"output_original_{index}.png\"  \n",
    "    text_to_image(item[\"response\"], output_img_original, save_dir=\"original_response\", temp_dir=\"original_temp\")  \n",
    "    output_img = f\"output_{index}.png\"  \n",
    "    text_to_image(item[\"gpt_answer\"], output_img, save_dir=\"revised_response\", temp_dir=\"revised_temp\")  \n",
    "  \n",
    "revised_data = read_jsonl(\"revised_data/output_sorted.jsonl\")  \n",
    "  \n",
    "# 指定线程数，例如 4  \n",
    "max_workers = 10  \n",
    "  \n",
    "with concurrent.futures.ThreadPoolExecutor(max_workers=max_workers) as executor:  \n",
    "    futures = [executor.submit(process_item, item) for item in revised_data]  \n",
    "    for future in concurrent.futures.as_completed(futures):  \n",
    "        try:  \n",
    "            future.result()  \n",
    "        except Exception as exc:  \n",
    "            print(f'Generated an exception: {exc}')  \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from text2img import text_to_image\n",
    "from utils import read_jsonl\n",
    "revised_data = read_jsonl(\"revised_data/output_sorted.jsonl\")\n",
    "revised_data\n",
    "for item in revised_data:\n",
    "    index = item[\"index\"]\n",
    "    output_img = f\"output_{index}.png\"\n",
    "    text_to_image(item[\"gpt_answer\"], output_img)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "import json\n",
    "from concurrent.futures import ThreadPoolExecutor, as_completed  \n",
    "import os\n",
    "import pandas as pd\n",
    "from gpt4o import Openai, API_INFOS\n",
    "def get_revised_text(client, instruction, completion, user_template, system_template, max_tokens=2048):  \n",
    "    content = user_template.format(instruction=instruction, completion=completion)  \n",
    "    # print(f\"content: {content}\")\n",
    "    gpt_answer = client.get_response(content=content, system=system_template, max_tokens=max_tokens)  \n",
    "    gpt_answer = gpt_answer.strip()  \n",
    "    need_modification = \"Y\" if \"Does it need modification: Y\" in gpt_answer else \"N\"  \n",
    "    revised_text_start = gpt_answer.find(\"Revised Text:\") + len(\"Revised Text:\")  \n",
    "    revised_text = gpt_answer[revised_text_start:].strip()  \n",
    "    return need_modification, revised_text, gpt_answer  \n",
    "  \n",
    "def process_row(index, client, row, user_template, system_template, max_tokens=2048, output_file=\"output.jsonl\"):  \n",
    "    prompt = row['prompt']  \n",
    "    response = row['response']  \n",
    "    need_modification, revised_text, gpt_answer = get_revised_text(client, prompt, response, user_template, system_template, max_tokens=max_tokens)  \n",
    "    # print(f\"index {index}\")\n",
    "    result = {  \n",
    "        'index': index,  \n",
    "        'prompt': prompt,  \n",
    "        'response': response,  \n",
    "        'does_it_need_modification': need_modification,  \n",
    "        'revised_text': revised_text,  \n",
    "        'gpt_answer': gpt_answer  \n",
    "    }  \n",
    "    # Write the result to a JSONL file  \n",
    "    with open(output_file, 'a') as f:  \n",
    "        f.write(json.dumps(result) + \"\\n\")  \n",
    "    return result  \n",
    "def main():  \n",
    "    # Initialize multiple clients  \n",
    "    clients = [Openai(apis=[API_INFOS[i]]) for i in range(6)]  \n",
    "  \n",
    "    sample_data = export_data.select(range(100))\n",
    "    # user_template = \"User: {instruction}\\nCompletion: {completion}\"  \n",
    "    # system_template = \"You are a helpful assistant.\"  \n",
    "    max_tokens = 2048  \n",
    "    output_file = \"./revised_data/output.jsonl\"  \n",
    "  \n",
    "    # Clear the output file before starting  \n",
    "    if os.path.exists(output_file):  \n",
    "        os.remove(output_file)  \n",
    "  \n",
    "    revised_data = []  \n",
    "  \n",
    "    with ThreadPoolExecutor(max_workers=6) as executor:  \n",
    "        # Create a future for each row in the dataset  \n",
    "        futures = [executor.submit(process_row, i, clients[i % len(clients)], row, user_template, system_template, max_tokens, output_file) for i, row in enumerate(sample_data)]  \n",
    "  \n",
    "        # Collect the results as they complete  \n",
    "        # for future in tqdm(as_completed(futures), total=len(futures)):  \n",
    "        #     revised_data.append(future.result())  \n",
    "        with tqdm(total=len(futures)) as pbar:  \n",
    "            # Collect the results as they complete  \n",
    "            for future in as_completed(futures):  \n",
    "                result = future.result()  \n",
    "                revised_data.append(result)  \n",
    "                pbar.update(1)  # Update the progress bar\n",
    "  \n",
    "    # Load results from JSONL file and ensure the order is preserved  \n",
    "    with open(output_file, 'r') as f:  \n",
    "        revised_data = [json.loads(line) for line in f]  \n",
    "  \n",
    "    # Sort by the original index  \n",
    "    revised_dataset = revised_data.sort(key=lambda x: x['index'])  \n",
    "  \n",
    "    # Create a new Dataset  \n",
    "    revised_dataset = Dataset.from_pandas(pd.DataFrame(revised_data))  \n",
    "    revised_dataset.to_json(\"./revised_data/output_sorted.jsonl\") \n",
    "main()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 49,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[{'index': 0,\n",
       "  'prompt': 'how can i develop a habit of drawing daily',\n",
       "  'response': \"Developing a daily habit of drawing can be challenging but with consistent practice and a few tips, it can become an enjoyable and rewarding part of your daily routine. Here are some strategies to help you develop the habit of drawing daily:\\n\\n1. Set a specific time: Allocate a specific time of the day to draw. It could be in the morning, afternoon, or evening. Make drawing a part of your daily routine.\\n2. Set a specific duration: Determine the amount of time you want to spend on drawing each day. It can be as little as 10 minutes or as long as an hour. Be consistent with the duration to help build the habit.\\n3. Start small and simple: Don't try to create a masterpiece every day, start with simple and easy-to-do sketches. Focus on improving your skills gradually.\\n4. Use a variety of tools and mediums: Experiment with different tools like pencils, pens, markers, and different mediums like paper, canvas, or digital apps to keep your drawing practice interesting and engaging.\\n5. Take breaks and rest: Taking breaks and resting after some time of drawing can help you avoid burnout and stay motivated.\\n6. Challenge yourself: Set challenges like drawing objects from memory or a specific subject to improve your skills and keep your drawing practice interesting.\\n7. Track your progress: Keep a record of your daily drawing practice and track your progress. This can be a source of motivation and help you see how far you've come.\\n\\nRemember, developing a habit takes time and patience. Stay consistent with your drawing practice, be flexible and open to trying new things, and with time, you'll develop a habit of daily drawing that brings you joy and satisfaction.\",\n",
       "  'does_it_need_modification': 'Y',\n",
       "  'revised_text': \"Developing a daily habit of drawing can be challenging, but with consistent practice and a few tips, it can become an enjoyable and rewarding part of your daily routine. Here are some strategies to help you develop the habit of drawing daily:\\n\\n1. **Set a specific time**: Allocate a specific time of the day to draw. It could be in the morning, afternoon, or evening. Make drawing a part of your daily routine.\\n\\n2. **Set a specific duration**: Determine the amount of time you want to spend on drawing each day. It can be as little as 10 minutes or as long as an hour. Be consistent with the duration to help build the habit.\\n\\n3. **Start small and simple**: Don't try to create a masterpiece every day. Start with simple and easy-to-do sketches. Focus on improving your skills gradually.\\n\\n4. **Use a variety of tools and mediums**: Experiment with different tools like pencils, pens, markers, and different mediums like paper, canvas, or digital apps to keep your drawing practice interesting and engaging.\\n\\n5. **Take breaks and rest**: Taking breaks and resting after some time of drawing can help you avoid burnout and stay motivated.\\n\\n6. **Challenge yourself**: Set challenges like drawing objects from memory or a specific subject to improve your skills and keep your drawing practice interesting.\\n\\n7. **Track your progress**: Keep a record of your daily drawing practice and track your progress. This can be a source of motivation and help you see how far you've come.\\n\\nRemember, developing a habit takes time and patience. Stay consistent with your drawing practice, be flexible and open to trying new things, and with time, you'll develop a habit of daily drawing that brings you joy and satisfaction.\",\n",
       "  'gpt_answer': \"**Textual Aesthetic Analysis**:  \\nThe text is generally clear and well-organized, but it could benefit from some formatting improvements to enhance readability. Specifically, using bullet points for the list of strategies and adding some emphasis on key points would make the text more engaging and easier to follow.\\n\\n**Does it need modification**: [[Y]]\\n\\n**Revised Text**:  \\n<|Revised Content Start|>  \\nDeveloping a daily habit of drawing can be challenging, but with consistent practice and a few tips, it can become an enjoyable and rewarding part of your daily routine. Here are some strategies to help you develop the habit of drawing daily:\\n\\n1. **Set a specific time**: Allocate a specific time of the day to draw. It could be in the morning, afternoon, or evening. Make drawing a part of your daily routine.\\n\\n2. **Set a specific duration**: Determine the amount of time you want to spend on drawing each day. It can be as little as 10 minutes or as long as an hour. Be consistent with the duration to help build the habit.\\n\\n3. **Start small and simple**: Don't try to create a masterpiece every day. Start with simple and easy-to-do sketches. Focus on improving your skills gradually.\\n\\n4. **Use a variety of tools and mediums**: Experiment with different tools like pencils, pens, markers, and different mediums like paper, canvas, or digital apps to keep your drawing practice interesting and engaging.\\n\\n5. **Take breaks and rest**: Taking breaks and resting after some time of drawing can help you avoid burnout and stay motivated.\\n\\n6. **Challenge yourself**: Set challenges like drawing objects from memory or a specific subject to improve your skills and keep your drawing practice interesting.\\n\\n7. **Track your progress**: Keep a record of your daily drawing practice and track your progress. This can be a source of motivation and help you see how far you've come.\\n\\nRemember, developing a habit takes time and patience. Stay consistent with your drawing practice, be flexible and open to trying new things, and with time, you'll develop a habit of daily drawing that brings you joy and satisfaction.  \\n<|Revised Content End|>\"},\n",
       " {'index': 1,\n",
       "  'prompt': \"how can I transform the getPosition method of antv/g's group in zrender?\",\n",
       "  'response': \"It is not recommended to modify built-in methods as it can lead to unexpected results and potential bugs. You may consider developing a new method or exploring other methods to achieve your desired outcome. Alternatively, you can search for other libraries or modules that offer similar functionalities or reach out to the library's support team for assistance.\",\n",
       "  'does_it_need_modification': 'Y',\n",
       "  'revised_text': \"Modifying built-in methods is generally not recommended as it can lead to unexpected results and potential bugs. Instead, consider the following alternatives:\\n\\n1. **Develop a New Method**: Create a new method that achieves your desired outcome without altering the existing built-in methods.\\n2. **Explore Other Methods**: Look into other methods provided by the library that might offer the functionality you need.\\n3. **Use Other Libraries**: Search for other libraries or modules that provide similar functionalities.\\n4. **Seek Support**: Reach out to the library's support team or community for assistance and guidance.\\n\\nBy following these alternatives, you can achieve your goals while maintaining the stability and reliability of your code.\",\n",
       "  'gpt_answer': \"**Textual Aesthetic Analysis**:  \\nThe text provides a clear and concise recommendation against modifying built-in methods, suggesting alternative approaches. However, it could benefit from improved structure and formatting to enhance readability and comprehension.\\n\\n**Does it need modification**: [[Y]]\\n\\n**Revised Text**:  \\n<|Revised Content Start|>  \\nModifying built-in methods is generally not recommended as it can lead to unexpected results and potential bugs. Instead, consider the following alternatives:\\n\\n1. **Develop a New Method**: Create a new method that achieves your desired outcome without altering the existing built-in methods.\\n2. **Explore Other Methods**: Look into other methods provided by the library that might offer the functionality you need.\\n3. **Use Other Libraries**: Search for other libraries or modules that provide similar functionalities.\\n4. **Seek Support**: Reach out to the library's support team or community for assistance and guidance.\\n\\nBy following these alternatives, you can achieve your goals while maintaining the stability and reliability of your code.\\n<|Revised Content End|>\"}]"
      ]
     },
     "execution_count": 49,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from utils import read_jsonl\n",
    "revised_data = read_jsonl('revised_data/output_sorted.jsonl')\n",
    "revised_data[:2]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from utils import read_jsonl\n",
    "import json\n",
    "data = read_jsonl(\"revised_data/output_sorted.jsonl\")\n",
    "not_revised = [item['index'] for item in data if item['revised_text'] == '']\n",
    "# datalen\n",
    "# data\n",
    "indices = set([item['index'] for item in data])\n",
    "original_indices = set(range(export_data.shape[0]))\n",
    "print(f\"index complete: {original_indices - indices}\")\n",
    "null_response_indices = [item['index'] for item in data if item['gpt_answer'].strip() == '']\n",
    "null_revised_indices = [item['index'] for item in data if item['revised_text'].strip() == '']\n",
    "noneed_revised_indices = [item['index'] for item in data if item['does_it_need_modification'].strip() == 'N']\n",
    "same_revised_text_indices = [item['index'] for item in data if item['response'].strip() == item['revised_text'].strip()]\n",
    "# print(len(null_response))\n",
    "# print(len(not_revised))\n",
    "print(f\"null_response_indices:{len(null_response_indices)}\")\n",
    "print(f\"null_revised_indices:{len(null_revised_indices)}\")\n",
    "print(f\"noneed_revised_indices:{len(noneed_revised_indices)}\")\n",
    "print(f\"same_revised_text_indices:{len(same_revised_text_indices)}\")\n",
    "# 使用集合的交集操作  \n",
    "indices_to_discard  = set(null_response_indices) | set(null_revised_indices) | set(noneed_revised_indices) | set(same_revised_text_indices)    \n",
    "indices_to_discard = list(indices_to_discard)\n",
    "print(f\"indices_to_discard: {len(indices_to_discard)}\")\n",
    "temp_data = data\n",
    "# temp_ds = ds.select(range(10))\n",
    "for i, item in enumerate(ds):\n",
    "    # print(item['rejected'])\n",
    "    # index=item['index']\n",
    "    temp_data[i]['rejected'] = item['rejected'][1]['content']\n",
    "    temp_data[i]['instruct'] = item['prompt']\n",
    "    temp_data[i]['chosen'] = item['chosen']\n",
    "revised_data = [item for item in temp_data if item[\"index\"] not in indices_to_discard]\n",
    "print(f\"length of revised data: {len(revised_data)}\")\n",
    "textual_aesthetics_chosen = [{\"prompt\": item[\"prompt\"], \"chosen\": item[\"revised_text\"], \"rejected\": item[\"response\"]} for item in revised_data]\n",
    "with open(\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_chosen.json\", 'w') as f:\n",
    "    json.dump(textual_aesthetics_chosen, f, indent=4)\n",
    "textual_aesthetics_rejected = [{\"prompt\": item[\"prompt\"], \"chosen\": item[\"revised_text\"], \"rejected\": item[\"rejected\"]} for item in revised_data]\n",
    "with open(\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_rejected.json\", 'w') as f:\n",
    "    json.dump(textual_aesthetics_rejected, f, indent=4)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Counter({0: 1566, -1: 1316, 1: 1107, 2: 995, 3: 858, 4: 784, -2: 764, 5: 697, 6: 676, -6: 650, 7: 634, -3: 631, 10: 625, 9: 616, 8: 613, 12: 605, 11: 576, 13: 559, -7: 558, 18: 550, -4: 543, 15: 537, 20: 537, -5: 533, 14: 530, 16: 507, 19: 499, 21: 494, -8: 482, 17: 482, 23: 482, 24: 477, 22: 440, 29: 417, -10: 415, 25: 415, 27: 414, -9: 414, 30: 413, 26: 408, 31: 403, 28: 400, 34: 378, 33: 375, 32: 373, 39: 364, -12: 362, 35: 359, -13: 348, 36: 345, -11: 345, -15: 334, 37: 329, 42: 324, 38: 318, 40: 313, 43: 313, -14: 307, 44: 305, -16: 303, -17: 291, -18: 284, 48: 281, 41: 281, 46: 275, 45: 266, -20: 254, 50: 251, -19: 244, 47: 243, 56: 241, 51: 241, -21: 238, -22: 229, 54: 226, -24: 224, 49: 224, -23: 215, 53: 212, -25: 207, -26: 202, 55: 201, 52: 201, -30: 191, -29: 189, 60: 189, -33: 184, -27: 184, -28: 183, 57: 182, 62: 181, -32: 181, 58: 176, -31: 175, 63: 167, 59: 165, 61: 165, -35: 162, 70: 160, -36: 158, 67: 158, -34: 157, 69: 153, 68: 152, 65: 149, 64: 148, 66: 148, 71: 145, -39: 145, -42: 139, -38: 137, -37: 133, -40: 132, 74: 130, -49: 126, 73: 125, -41: 125, 77: 124, 87: 123, -46: 122, 78: 119, -43: 118, -47: 117, 72: 117, 81: 117, 79: 113, -48: 113, 76: 112, 75: 112, -44: 109, -45: 109, 83: 104, -53: 100, 84: 100, 85: 97, -50: 96, -52: 96, 82: 94, 80: 94, 89: 94, -55: 93, 96: 92, -51: 91, 92: 90, -59: 90, -61: 89, -56: 89, -54: 88, -60: 87, 88: 86, -62: 85, 95: 84, -66: 84, -58: 84, 94: 83, 86: 82, -57: 80, 93: 79, 105: 79, -63: 78, 100: 77, -67: 75, 90: 75, -65: 74, 91: 73, 117: 73, -74: 72, -69: 72, 99: 72, 111: 71, -64: 70, -68: 67, 104: 67, 107: 67, 98: 66, 103: 66, 136: 65, 114: 64, 102: 64, 106: 63, 108: 63, 101: 63, -76: 62, -78: 62, -73: 61, 116: 61, -80: 60, 123: 60, -89: 59, -79: 59, 97: 59, 125: 58, 121: 57, 118: 57, -84: 57, 115: 56, 109: 56, 110: 56, -70: 56, -71: 56, 135: 56, -75: 55, -83: 55, 122: 54, 112: 54, -72: 53, 113: 53, -77: 53, -91: 52, -86: 51, 128: 51, -82: 50, 137: 50, 126: 50, 130: 50, 124: 49, 119: 49, 134: 48, 139: 48, 157: 48, -85: 47, -88: 47, 127: 47, 169: 46, -90: 46, 129: 46, 145: 46, 120: 46, 138: 45, 133: 44, 155: 44, 140: 43, 146: 43, -81: 43, 156: 42, 164: 42, -97: 42, 177: 42, 175: 41, 158: 41, 149: 41, -95: 40, 154: 40, -102: 39, 165: 39, 143: 39, -87: 38, 160: 38, 131: 38, -103: 38, -94: 38, 163: 37, 152: 37, 132: 37, 144: 37, -96: 36, -100: 36, 228: 36, 161: 36, 142: 35, 141: 35, 166: 35, 153: 35, -92: 34, -118: 34, 184: 34, 147: 34, 159: 34, 213: 34, -98: 33, -99: 33, 174: 33, -123: 32, -115: 32, 172: 31, 197: 31, 182: 31, 193: 31, 200: 31, 170: 31, -113: 31, 148: 31, 190: 30, -106: 30, -107: 30, 201: 29, 212: 29, -111: 29, 189: 29, 180: 29, -93: 29, 203: 28, 192: 28, -105: 28, 225: 28, 183: 28, -121: 27, -101: 27, 202: 27, -117: 27, 167: 26, 214: 26, -104: 26, -116: 26, 151: 26, 218: 26, 195: 26, -110: 25, -133: 25, 186: 25, 427: 25, 247: 25, 181: 25, 248: 25, 426: 25, 168: 25, -122: 24, -114: 24, 204: 24, 150: 24, 179: 24, 272: 24, 244: 24, -109: 24, 185: 24, -128: 24, 215: 24, 237: 24, 231: 24, 171: 23, -143: 23, 178: 23, -120: 23, 198: 23, -132: 23, 216: 23, 187: 23, 173: 23, 233: 23, -135: 23, -125: 23, 176: 23, 262: 23, 229: 23, 280: 23, -126: 22, -150: 22, -131: 22, 256: 22, 252: 22, 162: 22, -112: 22, 199: 22, 255: 22, 191: 22, 251: 22, 220: 22, 227: 22, -127: 22, 240: 22, -142: 22, 230: 21, 223: 21, 226: 21, 234: 21, 296: 21, 194: 21, 270: 21, -124: 21, -138: 21, 221: 21, 206: 21, -119: 21, 219: 21, -129: 20, -145: 20, 242: 20, 245: 20, 205: 20, -149: 20, 236: 20, 217: 20, 269: 20, -108: 20, 207: 20, 263: 19, 259: 19, 428: 19, -137: 19, 224: 19, 273: 19, -136: 19, 243: 19, 208: 19, 196: 18, 267: 18, 447: 18, 258: 18, 289: 18, 283: 18, 239: 18, -157: 18, 264: 17, -139: 17, -140: 17, -153: 17, 361: 17, 222: 17, 275: 17, 389: 17, -151: 17, 355: 17, 339: 17, 241: 17, 235: 17, 238: 17, 421: 16, 358: 16, 284: 16, -197: 16, 310: 16, 249: 16, 188: 16, 305: 16, 444: 16, 370: 16, 276: 16, 303: 16, 425: 16, -163: 16, 295: 16, 271: 16, 253: 16, 306: 16, 291: 16, 408: 16, 342: 15, 329: 15, 246: 15, -155: 15, 422: 15, 286: 15, -148: 15, 312: 15, 423: 15, 211: 15, -165: 15, 210: 15, -144: 15, 363: 15, 410: 15, -147: 15, 265: 15, 300: 15, 294: 15, 457: 15, 372: 14, 288: 14, 316: 14, 344: 14, 397: 14, 268: 14, 330: 14, 519: 14, 446: 14, 261: 14, 418: 14, 336: 14, 331: 14, 449: 14, 257: 14, 277: 14, 287: 14, 420: 14, 250: 14, -161: 14, -173: 14, 311: 14, 327: 13, -168: 13, 254: 13, 320: 13, 337: 13, 297: 13, 232: 13, -169: 13, 274: 13, -158: 13, -170: 13, 324: 13, 285: 13, 455: 13, 385: 13, -159: 13, -130: 13, -141: 12, 409: 12, -166: 12, 266: 12, -201: 12, 282: 12, 260: 12, 412: 12, 347: 12, 381: 12, 442: 12, -156: 12, 354: 12, 278: 12, 400: 12, 299: 12, -152: 12, -146: 12, 293: 12, -176: 12, -199: 11, 432: 11, -177: 11, 319: 11, 430: 11, -167: 11, 341: 11, 419: 11, 441: 11, 333: 11, 518: 11, -164: 11, 209: 11, 368: 11, 417: 11, 393: 11, 328: 11, -213: 11, 450: 11, 405: 11, 488: 11, 462: 11, 480: 11, 390: 11, 302: 11, 388: 11, 346: 11, -162: 11, 481: 11, 335: 11, 378: 11, 487: 10, 639: 10, 435: 10, 440: 10, -225: 10, 402: 10, 406: 10, 401: 10, 505: 10, 359: 10, 464: 10, -182: 10, -134: 10, 290: 10, 377: 10, 415: 10, 511: 10, 314: 10, 298: 10, -179: 10, -154: 10, -191: 10, 467: 10, 323: 10, -160: 10, -190: 10, 334: 10, 436: 10, 383: 10, 544: 10, 308: 10, -186: 10, 313: 10, 315: 10, 349: 9, -207: 9, 497: 9, 460: 9, 529: 9, 474: 9, 382: 9, 403: 9, 394: 9, 326: 9, -184: 9, 490: 9, 516: 9, -212: 9, -180: 9, 340: 9, 484: 9, 416: 9, 500: 9, 392: 9, 453: 9, 614: 9, 371: 9, 530: 9, 404: 9, 592: 9, 279: 9, 367: 9, 281: 9, 424: 9, -194: 9, 304: 9, 445: 9, 380: 9, 387: 9, 413: 9, 332: 9, -221: 8, -238: 8, 501: 8, 658: 8, 362: 8, -206: 8, 506: 8, 461: 8, 307: 8, 451: 8, 338: 8, 443: 8, -231: 8, -178: 8, -211: 8, 521: 8, 348: 8, 465: 8, 486: 8, 523: 8, -289: 8, 478: 8, 485: 8, -222: 8, 532: 8, -257: 8, -195: 8, -202: 8, 398: 8, 321: 8, 434: 8, 429: 8, 384: 8, 492: 8, -254: 8, 475: 8, 493: 8, 366: 8, 301: 8, -227: 7, 578: 7, 468: 7, 350: 7, 536: 7, 520: 7, 508: 7, 351: 7, -240: 7, 433: 7, 439: 7, 375: 7, 601: 7, -217: 7, 743: 7, -242: 7, -200: 7, 513: 7, 593: 7, 634: 7, 524: 7, 526: 7, 509: 7, 489: 7, -188: 7, 527: 7, 559: 7, 352: 7, 680: 7, 356: 7, 407: 7, 373: 7, 557: 7, 343: 7, 564: 7, 596: 7, 399: 7, -185: 7, 396: 7, 494: 7, 589: 7, 504: 7, -214: 7, 345: 6, 317: 6, 587: 6, 638: 6, 552: 6, -196: 6, 379: 6, -205: 6, -193: 6, 459: 6, 633: 6, 566: 6, 577: 6, -204: 6, -311: 6, 476: 6, 612: 6, 318: 6, 551: 6, 364: 6, -174: 6, 623: 6, 651: 6, 562: 6, 507: 6, 555: 6, 470: 6, 661: 6, 322: 6, 437: 6, 620: 6, -250: 6, 687: 6, 617: 6, 528: 6, -220: 6, 448: 6, -209: 6, -298: 6, -233: 6, 753: 6, -224: 6, 431: 6, -183: 6, 556: 6, 579: 6, 1894: 6, 554: 5, 292: 5, 411: 5, 667: 5, 365: 5, -317: 5, -187: 5, -232: 5, 649: 5, 681: 5, -241: 5, -234: 5, -236: 5, -226: 5, 510: 5, -356: 5, 696: 5, 540: 5, 357: 5, 622: 5, 482: 5, 595: 5, 840: 5, 376: 5, -228: 5, -215: 5, -237: 5, -246: 5, 496: 5, 701: 5, 515: 5, -256: 5, 792: 5, -181: 5, -329: 5, 537: 5, -175: 5, -270: 5, 581: 5, 784: 5, -294: 5, -218: 5, -371: 5, 640: 5, 503: 5, 477: 5, 636: 5, -292: 5, 534: 5, -244: 5, 624: 5, 325: 5, 627: 5, 353: 5, 533: 5, 631: 5, 662: 5, -210: 5, 369: 5, 591: 5, 483: 5, 386: 5, 856: 5, 576: 5, 414: 5, 664: 5, 770: 5, 514: 5, -266: 5, 642: 5, -198: 5, 547: 5, 309: 5, 934: 4, 580: 4, -309: 4, 517: 4, 647: 4, -297: 4, 473: 4, -229: 4, 697: 4, 588: 4, -324: 4, -343: 4, 573: 4, -269: 4, 778: 4, 898: 4, 395: 4, 914: 4, 599: 4, 616: 4, -284: 4, -203: 4, 761: 4, 654: 4, 391: 4, 684: 4, 825: 4, -251: 4, 648: 4, 539: 4, 602: 4, 796: 4, 575: 4, 605: 4, 615: 4, 463: 4, 668: 4, -272: 4, -403: 4, 719: 4, 643: 4, 674: 4, 600: 4, 626: 4, 495: 4, 653: 4, -391: 4, -346: 4, 666: 4, -480: 4, 454: 4, 472: 4, 565: 4, 438: 4, -333: 4, 619: 4, -381: 4, 670: 4, 1892: 4, 754: 4, -219: 4, -245: 4, 810: 4, 645: 4, 590: 4, 553: 4, 924: 4, 689: 4, 561: 4, 734: 4, -192: 4, 584: 4, -189: 4, -249: 4, 558: 4, 675: 4, 360: 4, 621: 4, -223: 4, -344: 4, 717: 4, 548: 4, 609: 4, 669: 4, 512: 4, -263: 4, -258: 4, -267: 4, -369: 4, -172: 4, -208: 4, 560: 4, 374: 4, 706: 4, 586: 4, -340: 4, 797: 3, -463: 3, 782: 3, -296: 3, -216: 3, 499: 3, -394: 3, 629: 3, -436: 3, 572: 3, 765: 3, -306: 3, -373: 3, 452: 3, 604: 3, 789: 3, -271: 3, -230: 3, 571: 3, -268: 3, -477: 3, 1106: 3, 979: 3, 663: 3, 1008: 3, -457: 3, 828: 3, 693: 3, 694: 3, 545: 3, -363: 3, 456: 3, -303: 3, -318: 3, 727: 3, 699: 3, 613: 3, 635: 3, -302: 3, -338: 3, 568: 3, 745: 3, 714: 3, 865: 3, -487: 3, 723: 3, 884: 3, 665: 3, -247: 3, 672: 3, -262: 3, 646: 3, -239: 3, -280: 3, 764: 3, 543: 3, -434: 3, -482: 3, 921: 3, 741: 3, 709: 3, -379: 3, -366: 3, -275: 3, 970: 3, -314: 3, -253: 3, 931: 3, 630: 3, -326: 3, 531: 3, 650: 3, 958: 3, -500: 3, 574: 3, 900: 3, -287: 3, 597: 3, -288: 3, 585: 3, 703: 3, 685: 3, 917: 3, 827: 3, -305: 3, 628: 3, -445: 3, 471: 3, -171: 3, 777: 3, 1171: 3, -410: 3, 829: 3, -417: 3, -525: 3, -374: 3, 611: 3, 546: 3, 756: 3, -323: 3, 563: 3, -291: 3, 1098: 3, 538: 3, 843: 3, -476: 3, 469: 3, -370: 3, 853: 3, 632: 3, -252: 3, 1891: 3, 861: 3, 660: 3, 491: 3, -437: 3, -327: 3, 838: 3, 973: 3, -386: 3, 732: 3, 1004: 3, 657: 3, 845: 3, 677: 3, 805: 2, 695: 2, -415: 2, 1844: 2, -768: 2, 794: 2, 820: 2, -397: 2, 1099: 2, 760: 2, 907: 2, 1026: 2, -337: 2, -646: 2, -462: 2, -281: 2, -248: 2, 1540: 2, -447: 2, 1027: 2, -438: 2, 725: 2, -635: 2, 918: 2, 1189: 2, -365: 2, 740: 2, 1508: 2, 804: 2, -712: 2, 749: 2, 1082: 2, 1897: 2, 1116: 2, 594: 2, 618: 2, 1172: 2, 679: 2, -428: 2, 729: 2, 567: 2, -355: 2, 1144: 2, -310: 2, -279: 2, 690: 2, -282: 2, -357: 2, 881: 2, 971: 2, 834: 2, 479: 2, 1181: 2, 673: 2, 877: 2, 1170: 2, 844: 2, 569: 2, 852: 2, 625: 2, 954: 2, -652: 2, 752: 2, 1137: 2, 466: 2, -259: 2, 1233: 2, -651: 2, -607: 2, 987: 2, 813: 2, 911: 2, 980: 2, 826: 2, -472: 2, 823: 2, 1282: 2, 716: 2, 1043: 2, 535: 2, 1201: 2, 1979: 2, 1359: 2, -364: 2, -425: 2, 644: 2, 498: 2, -458: 2, 1101: 2, -569: 2, 920: 2, -553: 2, -315: 2, 686: 2, 726: 2, -573: 2, -405: 2, 522: 2, 570: 2, 1006: 2, 678: 2, -662: 2, 606: 2, 806: 2, 969: 2, -402: 2, -339: 2, -362: 2, 835: 2, 637: 2, -243: 2, -515: 2, -426: 2, -429: 2, 983: 2, -299: 2, -312: 2, -490: 2, 1092: 2, 1033: 2, 988: 2, 938: 2, -235: 2, 659: 2, 972: 2, -603: 2, 869: 2, -261: 2, -335: 2, -393: 2, 790: 2, 883: 2, -265: 2, 525: 2, 793: 2, -375: 2, 715: 2, -432: 2, 747: 2, 705: 2, 1097: 2, -554: 2, -548: 2, -295: 2, 854: 2, -330: 2, 1210: 2, 458: 2, 1042: 2, 550: 2, 700: 2, 762: 2, 1696: 2, 711: 2, -570: 2, 788: 2, -277: 2, 641: 2, 816: 2, 1014: 2, 1110: 2, 656: 2, 948: 2, 910: 2, 1155: 2, 1331: 2, 603: 2, 799: 2, 682: 2, 1076: 2, 1297: 2, 1893: 2, -409: 2, 766: 2, 1016: 2, -528: 2, -322: 2, 1241: 2, -413: 2, -421: 2, -334: 2, -290: 2, -461: 2, 1399: 2, 893: 2, -320: 2, 779: 2, -551: 2, 894: 2, 772: 2, 798: 2, 811: 2, 964: 2, -382: 2, 758: 2, 702: 2, 691: 2, 1075: 2, 1059: 2, -341: 2, 1052: 2, 724: 2, 943: 2, 759: 2, 1187: 2, 776: 2, 1183: 2, 610: 2, -450: 2, 876: 2, -467: 2, 1003: 2, 757: 2, 733: 2, 542: 2, 598: 2, 1220: 1, 1134: 1, -508: 1, 1455: 1, 1289: 1, 1009: 1, -780: 1, 975: 1, -714: 1, -762: 1, 1093: 1, 1280: 1, 1064: 1, 998: 1, -449: 1, -398: 1, 1211: 1, 1466: 1, -647: 1, 960: 1, 863: 1, -513: 1, -633: 1, 867: 1, 1196: 1, 1272: 1, -558: 1, 1242: 1, 1215: 1, -826: 1, 704: 1, 707: 1, -274: 1, -691: 1, -590: 1, 1878: 1, 1045: 1, 1192: 1, 864: 1, 1452: 1, -754: 1, 1332: 1, -486: 1, 1614: 1, 976: 1, 1010: 1, -724: 1, -475: 1, -383: 1, -1024: 1, -577: 1, -580: 1, 1635: 1, 502: 1, 850: 1, 1925: 1, -501: 1, -368: 1, 815: 1, 871: 1, -454: 1, 846: 1, 737: 1, -597: 1, -934: 1, 1227: 1, 1987: 1, 787: 1, 791: 1, -692: 1, -709: 1, 978: 1, 1238: 1, -519: 1, -285: 1, -406: 1, 1350: 1, 1372: 1, 1234: 1, 1136: 1, 795: 1, 1096: 1, -536: 1, 912: 1, 803: 1, 1060: 1, 1401: 1, 897: 1, 722: 1, 1646: 1, 951: 1, 1057: 1, 1340: 1, -850: 1, -495: 1, 990: 1, -680: 1, 731: 1, 925: 1, 860: 1, -392: 1, 858: 1, 1692: 1, 1747: 1, 1330: 1, 895: 1, -687: 1, 1362: 1, 1776: 1, -681: 1, 942: 1, -468: 1, -489: 1, -332: 1, 1469: 1, 721: 1, -331: 1, -336: 1, 771: 1, -512: 1, 688: 1, 773: 1, -441: 1, 968: 1, 1904: 1, 1145: 1, 1287: 1, 944: 1, 671: 1, -833: 1, 1118: 1, -442: 1, -811: 1, 906: 1, 1114: 1, -630: 1, 1065: 1, -757: 1, -378: 1, 1163: 1, -499: 1, 780: 1, -260: 1, 887: 1, 1885: 1, -698: 1, -643: 1, -328: 1, 953: 1, 995: 1, 807: 1, -424: 1, -308: 1, 1184: 1, -423: 1, -563: 1, -469: 1, 1047: 1, 1439: 1, 1195: 1, 961: 1, 1333: 1, 728: 1, -792: 1, -443: 1, -1018: 1, 1129: 1, 901: 1, 1051: 1, 698: 1, -860: 1, 833: 1, -439: 1, -719: 1, 1120: 1, -361: 1, -479: 1, -638: 1, 1838: 1, -407: 1, -430: 1, -676: 1, -616: 1, -708: 1, 1159: 1, 1257: 1, -560: 1, 1040: 1, -761: 1, 841: 1, -478: 1, 1547: 1, 1094: 1, 1966: 1, 1274: 1, 1219: 1, 583: 1, 582: 1, -867: 1, 1090: 1, -399: 1, 1266: 1, 755: 1, 1022: 1, 1044: 1, 1367: 1, -283: 1, 1062: 1, 655: 1, 1235: 1, -529: 1, -605: 1, -716: 1, 909: 1, 1028: 1, 1927: 1, 956: 1, 1049: 1, 785: 1, -538: 1, 1150: 1, -388: 1, 1292: 1, 1458: 1, -659: 1, 1440: 1, 713: 1, -506: 1, -385: 1, -503: 1, 720: 1, 930: 1, -316: 1, 872: 1, 1154: 1, -670: 1, 1437: 1, 1907: 1, -255: 1, 549: 1, -669: 1, 992: 1, 974: 1, 1911: 1, -556: 1, -654: 1, 809: 1, 880: 1, -944: 1, -583: 1, -631: 1, 708: 1, 1237: 1, -494: 1, 1041: 1, 1286: 1, -622: 1, 1336: 1, -533: 1, 652: 1, 1666: 1, 1179: 1, 1537: 1, 905: 1, 1250: 1, 812: 1, 1442: 1, -701: 1, -304: 1, -505: 1, 1111: 1, -293: 1, 1025: 1, -787: 1, 1858: 1, 1125: 1, -592: 1, 1541: 1, -313: 1, -637: 1, -608: 1, -739: 1, -540: 1, 710: 1, -456: 1, 922: 1, -593: 1, 2673: 1, 1035: 1, 1279: 1, 1133: 1, -562: 1, 1410: 1, -459: 1, 1078: 1, 1029: 1, -527: 1, 739: 1, -596: 1, 1777: 1, 1071: 1, 746: 1, 874: 1, 786: 1, -422: 1, -606: 1, -783: 1, 836: 1, 1586: 1, 1216: 1, 945: 1, 903: 1, -614: 1, 1928: 1, 541: 1, -485: 1, -618: 1, 847: 1, -752: 1, 1072: 1, 750: 1, 1084: 1, -347: 1, 1131: 1, 1138: 1, -359: 1, -619: 1, 1063: 1, -629: 1, -440: 1, 1853: 1, 1124: 1, 1074: 1, 1182: 1, 927: 1, -433: 1, -286: 1, 774: 1, 886: 1, -737: 1, 1206: 1, 676: 1, 1229: 1, 1146: 1, -273: 1, 991: 1, -301: 1, -674: 1, 941: 1, 932: 1, 937: 1, -796: 1, 848: 1, 1814: 1, 1254: 1, -350: 1, -352: 1, -404: 1, 1304: 1, -523: 1, 1326: 1, 890: 1, 904: 1, -321: 1, 1772: 1, 947: 1, 608: 1, 1638: 1, 959: 1, 873: 1, -325: 1, -763: 1, 977: 1, -648: 1, 1392: 1, 1347: 1, 928: 1, -587: 1, 718: 1, -474: 1, -389: 1, -966: 1, 1148: 1, 1856: 1, 1481: 1, -522: 1, 1800: 1, -568: 1, 892: 1, -264: 1, 1577: 1, 1953: 1, -541: 1, 1916: 1, 955: 1, 1636: 1, -853: 1, 1863: 1, 751: 1, 1066: 1, 683: 1, -547: 1, 1387: 1, 889: 1, -897: 1, 1117: 1, 1598: 1, 1839: 1, 822: 1, -342: 1, -451: 1, 814: 1, -484: 1, 1823: 1, 775: 1, 1901: 1, -376: 1, -588: 1, 999: 1, -628: 1, -679: 1, 896: 1, -657: 1, 1077: 1, 1446: 1, 1103: 1, -420: 1, -604: 1, -411: 1, 1212: 1, 1295: 1, 1785: 1, -731: 1, -470: 1, -412: 1, 963: 1, 936: 1, 1152: 1, 1988: 1, 859: 1, 744: 1, 1247: 1, 1903: 1, 837: 1, -642: 1, 1861: 1, 1165: 1, 730: 1, 800: 1, 1329: 1, 1156: 1, 1625: 1, 1132: 1, 1299: 1, 1180: 1, 1603: 1, 1036: 1, -481: 1, 1361: 1, 1811: 1, 1365: 1, 1569: 1, -349: 1, 1015: 1, 1149: 1, 1020: 1, -520: 1, 817: 1, -634: 1, 1889: 1, -380: 1})\n",
      "Mean: 49.15065020037622, Median: 13.0, Standard Deviation: 169.45465111600666\n",
      "Max length difference: 2673, Min length difference: -1024\n"
     ]
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAA1sAAAIjCAYAAAD1OgEdAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjkuMSwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/TGe4hAAAACXBIWXMAAA9hAAAPYQGoP6dpAABy5UlEQVR4nO3dd3hUddrG8XvSEyCEmhClZBEQEERBMSsova5rYUUEBRXBAopi5VURsCCoiCCCuAK6goUVG4tIpIgC0iRSpRmIAimQ3iczv/ePmJEhAULI5CTk+7kurnDO+Z0zz3kymcydU8ZmjDECAAAAAJQpL6sLAAAAAIALEWELAAAAADyAsAUAAAAAHkDYAgAAAAAPIGwBAAAAgAcQtgAAAADAAwhbAAAAAOABhC0AAAAA8ADCFgAAAAB4AGELAKqwLl266LLLLivXx7TZbJowYYLbvM2bN+vvf/+7qlWrJpvNpujoaEnS8uXL1a5dOwUEBMhmsyklJaVca63s7rrrLjVp0qRcHqtJkya66667XNMLFiyQzWbTli1byuXxu3Tpoi5dupTLYwFASRG2AOA8lfebynN19OhRTZgwwRVgylKTJk1ks9lks9nk5eWlkJAQtWnTRiNHjtTGjRtLtA273a5bb71VSUlJeuONN/Sf//xHjRs31okTJzRw4EAFBgZq1qxZ+s9//qNq1aqV+T5UFhMmTHD12mazKSgoSI0aNdINN9yg+fPnKzc3t0weZ/fu3ZowYYIOHTpUJtsrSxW5NgAojo/VBQAAPOvo0aOaOHGimjRponbt2pX59tu1a6fHHntMkpSenq49e/Zo8eLFevfdd/Xoo49q2rRpbuOzs7Pl4/PXr5+DBw/q8OHDevfdd3Xvvfe65i9fvlzp6el64YUX1KNHjzKvu7KaPXu2qlevrtzcXB05ckTffvut7rnnHk2fPl1Lly5Vw4YNXWPfffddOZ3Oc9r+7t27NXHiRHXp0uWcjort3btXXl6e/RvumWpbsWKFRx8bAEqDsAUAOC8XXXSR7rjjDrd5U6ZM0eDBg/XGG2+oWbNmeuCBB1zLAgIC3MYmJCRIkkJCQko0/3xkZmZW+qNj//rXv1S3bl3X9Pjx47Vw4UINHTpUt956q3766SfXMl9fX4/WYoxRTk6OAgMD5e/v79HHOhs/Pz9LHx8AisNphABQTo4cOaJ77rlHoaGh8vf3V+vWrTVv3jy3MWvWrJHNZtOnn36ql156SRdffLECAgLUvXt3HThwoMg2Z82apb/97W8KDAzU1VdfrR9++MHt2pU1a9boqquukiTdfffdrlPQFixY4Lad3bt3q2vXrgoKCtJFF12kqVOnnte+BgYG6j//+Y9q166tl156ScYY17KTr9m66667dP3110uSbr31VtlsNlf9w4YNkyRdddVVstlsbtcDbdy4UX369FHNmjUVFBSk66+/XuvWrXOrofC0u927d2vw4MGqVauWOnXq5Fr+4Ycfqn379goMDFTt2rU1aNAg/f77727bKLymrST9ycnJ0YQJE9S8eXMFBASoQYMGuuWWW3Tw4EHXGKfTqenTp6t169YKCAhQaGio7rvvPiUnJ5eu0X8aMmSI7r33Xm3cuFFRUVGu+cVds/Xxxx+rffv2qlGjhoKDg9WmTRu9+eabkgpOib311lslSV27dnU9X9asWSOp4LTRf/zjH/r222/VoUMHBQYG6p133nEtO/l7VCgrK0v33Xef6tSpo+DgYA0dOrTI/hZ3Hd+p2zxbbcVds5WQkKDhw4crNDRUAQEBuvzyy/X++++7jTl06JBsNptee+01zZ07V02bNpW/v7+uuuoqbd68udh+A0BJcWQLAMpBfHy8rrnmGtlsNo0ePVr16tXTN998o+HDhystLU2PPPKI2/hXXnlFXl5eevzxx5WamqqpU6dqyJAhbtdBzZ49W6NHj1bnzp316KOP6tChQ7rppptUq1YtXXzxxZKkli1batKkSRo/frxGjhypzp07S5L+/ve/u7aTnJysPn366JZbbtHAgQP13//+V0899ZTatGmjvn37lnqfq1evrptvvlnvvfeedu/erdatWxcZc9999+miiy7Syy+/rIcfflhXXXWVQkNDJUktWrTQ3LlzNWnSJEVERKhp06aSpFWrVqlv375q3769nn/+eXl5eWn+/Pnq1q2bfvjhB1199dVuj3HrrbeqWbNmevnll12h76WXXtJzzz2ngQMH6t5771ViYqJmzpyp6667Ttu2bXM7mlaS/jgcDv3jH//QypUrNWjQII0ZM0bp6emKiorSzp07XbXfd999WrBgge6++249/PDDiomJ0VtvvaVt27Zp3bp153Uk6s4779TcuXO1YsUK9ezZs9gxUVFRuv3229W9e3dNmTJFkrRnzx6tW7dOY8aM0XXXXaeHH35YM2bM0P/93/+pZcuWkuT6KhWcLnj77bfrvvvu04gRI9SiRYsz1jV69GiFhIRowoQJ2rt3r2bPnq3Dhw+7/rBQUiWp7WTZ2dnq0qWLDhw4oNGjRysiIkKLFy/WXXfdpZSUFI0ZM8Zt/KJFi5Senq777rtPNptNU6dO1S233KLffvvN40cIAVzADADgvMyfP99IMps3bz7tmOHDh5sGDRqY48ePu80fNGiQqVmzpsnKyjLGGLN69WojybRs2dLk5ua6xr355ptGktmxY4cxxpjc3FxTp04dc9VVVxm73e4at2DBAiPJXH/99a55mzdvNpLM/Pnzi9R1/fXXG0nmgw8+cM3Lzc01YWFhZsCAAWfd98aNG5v+/fufdvkbb7xhJJkvv/zSNU+Sef75513Thfu8ePFit3WL66vT6TTNmjUzvXv3Nk6n0zU/KyvLREREmJ49e7rmPf/880aSuf322922e+jQIePt7W1eeuklt/k7duwwPj4+bvNL2p958+YZSWbatGlFelBY5w8//GAkmYULF7otX758ebHzT1W4P4mJicUuT05ONpLMzTff7Jo3bNgw07hxY9f0mDFjTHBwsMnPzz/t4yxevNhIMqtXry6yrHHjxkaSWb58ebHLhg0b5pou/P61b9/e5OXlueZPnTr1rM+J023zTLVdf/31bs/76dOnG0nmww8/dM3Ly8szkZGRpnr16iYtLc0YY0xMTIyRZOrUqWOSkpJcY7/88ksjyXz99ddFHgsASorTCAHAw4wx+uyzz3TDDTfIGKPjx4+7/vXu3Vupqan6+eef3da5++673a5BKTwi9dtvv0mStmzZohMnTmjEiBFuN5sYMmSIatWqdU71Va9e3e2aKz8/P1199dWuxzof1atXl1Rw44yyEB0drf3792vw4ME6ceKEq4+ZmZnq3r271q5dW+SGEPfff7/b9JIlS+R0OjVw4EC370VYWJiaNWum1atXF9mHs/Xns88+U926dfXQQw8Vqbnw6M3ixYtVs2ZN9ezZ0+1x27dvr+rVqxd53HNVkl6HhIQoMzPT7VTDcxUREaHevXuXePzIkSPdjgw98MAD8vHx0bJly0pdQ0ksW7ZMYWFhuv32213zfH199fDDDysjI0Pff/+92/jbbrvN7Wfn1J85ACgNTiMEAA9LTExUSkqK5s6dq7lz5xY7pvBmEIUaNWrkNl34JrDwWpfDhw9Lki655BK3cT4+Puf8uUoXX3xxkdO5atWqpe3bt5/TdoqTkZEhSapRo8Z5b0uS9u/fL0mu67mKk5qa6vamOSIiosg2jDFq1qxZseufespYSfpz8OBBtWjRwi34Fld7amqq6tevX+zyU58D56okvX7wwQf16aefqm/fvrrooovUq1cvDRw4UH369Cnx45zaz7M5tc/Vq1dXgwYNPH779sOHD6tZs2ZF7pBYeNph4c9QobP9zAFAaRC2AMDDCo+03HHHHacNCW3btnWb9vb2LnacOelGE2XFk4+1c+dOSUVDYWkV9vLVV1897W3sC4/wFAoMDCyyDZvNpm+++abYfT91/bLqj9PpVP369bVw4cJil9erV++ctneqkvS6fv36io6O1rfffqtvvvlG33zzjebPn6+hQ4cWuXHE6ZzaT09yOBzl9ljl+TMHoOogbAGAh9WrV081atSQw+Eos8+Laty4sSTpwIED6tq1q2t+fn6+Dh065BbezuUmBGUpIyNDn3/+uRo2bHjamxicq8IbTQQHB5e6l02bNpUxRhEREWrevHmZ1bVx40bZ7fbT3kyhadOm+u6773Tttdd6JLD85z//kaSznuLn5+enG264QTfccIOcTqcefPBBvfPOO3ruued0ySWXlPnzZf/+/W7P0YyMDB07dkz9+vVzzatVq5ZSUlLc1svLy9OxY8fc5p1LbY0bN9b27dvldDrdjm79+uuvruUA4GlcswUAHubt7a0BAwbos88+cx19OFliYuI5b7NDhw6qU6eO3n33XeXn57vmL1y4sMhpT4WfK3Xqm1lPys7O1p133qmkpCQ988wzZfYGvn379mratKlee+0112lzJytJL2+55RZ5e3tr4sSJRY5aGGN04sSJc65rwIABOn78uN56660iywofY+DAgXI4HHrhhReKjMnPzz+v78+iRYv073//W5GRkerevftpx526b15eXq5gnpubK6nsny9z586V3W53Tc+ePVv5+flud7ps2rSp1q5dW2S9U49snUtt/fr1U1xcnD755BPXvPz8fM2cOVPVq1d3feQAAHgSR7YAoIzMmzdPy5cvLzJ/zJgxeuWVV7R69Wp17NhRI0aMUKtWrZSUlKSff/5Z3333nZKSks7psfz8/DRhwgQ99NBD6tatmwYOHKhDhw5pwYIFatq0qVu4adq0qUJCQjRnzhzVqFFD1apVU8eOHc/52pvTOXLkiD788ENJBUctdu/ercWLFysuLk6PPfaY7rvvvjJ5HKkgHPz73/9W37591bp1a91999266KKLdOTIEa1evVrBwcH6+uuvz7iNpk2b6sUXX9S4ceNct8uvUaOGYmJi9Pnnn2vkyJF6/PHHz6muoUOH6oMPPtDYsWO1adMmde7cWZmZmfruu+/04IMP6sYbb9T111+v++67T5MnT1Z0dLR69eolX19f7d+/X4sXL9abb76pf/3rX2d9rP/+97+qXr268vLydOTIEX377bdat26dLr/8ci1evPiM6957771KSkpSt27ddPHFF+vw4cOaOXOm2rVr5zr62K5dO3l7e2vKlClKTU2Vv7+/unXrdtprzc4mLy9P3bt318CBA7V37169/fbb6tSpk/75z3+61XX//fdrwIAB6tmzp3755Rd9++23bh/efK61jRw5Uu+8847uuusubd26VU2aNNF///tfrVu3TtOnTy+z6wgB4EwIWwBQRmbPnl3s/LvuuksXX3yxNm3apEmTJmnJkiV6++23VadOHbVu3dr1eUfnavTo0TLG6PXXX9fjjz+uyy+/XF999ZUefvhhBQQEuMb5+vrq/fff17hx43T//fcrPz9f8+fPL7OwFR0drTvvvFM2m001atRQw4YNdcMNN+jee+8t8plXZaFLly7asGGDXnjhBb311lvKyMhQWFiYOnbsWOJg9/TTT6t58+Z64403NHHiRElSw4YN1atXL7cQUFLe3t5atmyZXnrpJS1atEifffaZ6tSpo06dOqlNmzaucXPmzFH79u31zjvv6P/+7/9cNzS54447dO2115bosR544AFJUkBAgOrWrat27dpp3rx5Gjx4sPz9/c+47h133KG5c+fq7bffVkpKisLCwnTbbbdpwoQJrlPtwsLCNGfOHE2ePFnDhw+Xw+HQ6tWrSx223nrrLS1cuFDjx4+X3W7X7bffrhkzZrj9QWDEiBGKiYnRe++9p+XLl6tz586KiooqcpTuXGoLDAzUmjVr9PTTT+v9999XWlqaWrRoofnz5xf74csA4Ak2w5WfAHDBcDqdqlevnm655Ra9++67VpcDAECVxjVbAFBJ5eTkFLnm6IMPPlBSUpK6dOliTVEAAMCFI1sAUEmtWbNGjz76qG699VbVqVNHP//8s9577z21bNlSW7dudftQZAAAUP64ZgsAKqkmTZqoYcOGmjFjhpKSklS7dm0NHTpUr7zyCkELAIAKgCNbAAAAAOABXLMFAAAAAB5A2AIAAAAAD+CarRJyOp06evSoatSo4fbZIAAAAACqFmOM0tPTFR4e7vqcwuIQtkro6NGjatiwodVlAAAAAKggfv/9d1188cWnXU7YKqEaNWpIKmhocHCwxdW4s9vtWrFihXr16iVfX1+ry6ly6L916L116L116L216L916L116H1RaWlpatiwoSsjnA5hq4QKTx0MDg6ukGErKChIwcHB/ABYgP5bh95bh95bh95bi/5bh95bh96f3tkuL+IGGQAAAADgAYQtAAAAAPAAwhYAAAAAeABhCwAAAAA8gLAFAAAAAB5gadhau3atbrjhBoWHh8tms+mLL74oMmbPnj365z//qZo1a6patWq66qqrFBsb61qek5OjUaNGqU6dOqpevboGDBig+Ph4t23Exsaqf//+CgoKUv369fXEE08oPz/f07sHAAAAoAqzNGxlZmbq8ssv16xZs4pdfvDgQXXq1EmXXnqp1qxZo+3bt+u5555TQECAa8yjjz6qr7/+WosXL9b333+vo0eP6pZbbnEtdzgc6t+/v/Ly8rR+/Xq9//77WrBggcaPH+/x/QMAAABQdVn6OVt9+/ZV3759T7v8mWeeUb9+/TR16lTXvKZNm7r+n5qaqvfee0+LFi1St27dJEnz589Xy5Yt9dNPP+maa67RihUrtHv3bn333XcKDQ1Vu3bt9MILL+ipp57ShAkT5Ofn57kdBAAAAFBlVdgPNXY6nfrf//6nJ598Ur1799a2bdsUERGhcePG6aabbpIkbd26VXa7XT169HCtd+mll6pRo0basGGDrrnmGm3YsEFt2rRRaGioa0zv3r31wAMPaNeuXbriiiuKffzc3Fzl5ua6ptPS0iQVfKib3W73wB6XXmE9Fa2uqoL+W4feW4feW4feW4v+W4feW4feF1XSXlTYsJWQkKCMjAy98sorevHFFzVlyhQtX75ct9xyi1avXq3rr79ecXFx8vPzU0hIiNu6oaGhiouLkyTFxcW5Ba3C5YXLTmfy5MmaOHFikfkrVqxQUFDQee6dZ0RFRVldQpVG/61D761D761D761F/61D761D7/+SlZVVonEVNmw5nU5J0o033qhHH31UktSuXTutX79ec+bM0fXXX+/Rxx83bpzGjh3rmk5LS1PDhg3Vq1cvBQcHe/Sxz5XdbldUVJR69uwpX19fq8upcui/dei9dei9dei9tei/dei9deh9UYVnvZ1NhQ1bdevWlY+Pj1q1auU2v2XLlvrxxx8lSWFhYcrLy1NKSorb0a34+HiFhYW5xmzatMltG4V3KywcUxx/f3/5+/sXme/r61thn2QVubaqgP5bh95bh95bh95bi/5bh95bh97/paR9qLCfs+Xn56errrpKe/fudZu/b98+NW7cWJLUvn17+fr6auXKla7le/fuVWxsrCIjIyVJkZGR2rFjhxISElxjoqKiFBwcXCTIAQAAAEBZsfTIVkZGhg4cOOCajomJUXR0tGrXrq1GjRrpiSee0G233abrrrtOXbt21fLly/X1119rzZo1kqSaNWtq+PDhGjt2rGrXrq3g4GA99NBDioyM1DXXXCNJ6tWrl1q1aqU777xTU6dOVVxcnJ599lmNGjWq2CNXAAAAAFAWLA1bW7ZsUdeuXV3ThddIDRs2TAsWLNDNN9+sOXPmaPLkyXr44YfVokULffbZZ+rUqZNrnTfeeENeXl4aMGCAcnNz1bt3b7399tuu5d7e3lq6dKkeeOABRUZGqlq1aho2bJgmTZpUfjsKAAAAoMqxNGx16dJFxpgzjrnnnnt0zz33nHZ5QECAZs2addoPRpakxo0ba9myZaWuEwAAAADOVYW9ZgsAAAAAKjPCFgAAAAB4AGELAAAAADyAsAWg0kpOTnb7CgAAUJEQtgBUWikpKW5fAQAAKhLCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYAgAAAAAPIGwBAAAAgAcQtgAAAADAAwhbAAAAAOABhC0AAAAA8ADCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYAgAAAAAPIGwBAAAAgAcQtgAAAADAAwhbAAAAAOABhC0AAAAA8ADCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYAgAAAAAPIGwBAAAAgAcQtgAAAADAAwhbAAAAAOABhC0AAAAA8ADCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYAgAAAAAPIGwBAAAAgAcQtgAAAADAAwhbAAAAAOABhC0AAAAA8ADCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYAgAAAAAPIGwBAAAAgAcQtgAAAADAAwhbAAAAAOABhC0AAAAA8ABLw9batWt1ww03KDw8XDabTV988cVpx95///2y2WyaPn262/ykpCQNGTJEwcHBCgkJ0fDhw5WRkeE2Zvv27ercubMCAgLUsGFDTZ061QN7AwAAAAB/sTRsZWZm6vLLL9esWbPOOO7zzz/XTz/9pPDw8CLLhgwZol27dikqKkpLly7V2rVrNXLkSNfytLQ09erVS40bN9bWrVv16quvasKECZo7d26Z7w8AAAAAFPKx8sH79u2rvn37nnHMkSNH9NBDD+nbb79V//793Zbt2bNHy5cv1+bNm9WhQwdJ0syZM9WvXz+99tprCg8P18KFC5WXl6d58+bJz89PrVu3VnR0tKZNm+YWygAAAACgLFkats7G6XTqzjvv1BNPPKHWrVsXWb5hwwaFhIS4gpYk9ejRQ15eXtq4caNuvvlmbdiwQdddd538/PxcY3r37q0pU6YoOTlZtWrVKvaxc3NzlZub65pOS0uTJNntdtnt9rLaxTJRWE9Fq6uqoP/WcTgcrq/0v3zxvLcOvbcW/bcOvbcOvS+qpL2o0GFrypQp8vHx0cMPP1zs8ri4ONWvX99tno+Pj2rXrq24uDjXmIiICLcxoaGhrmWnC1uTJ0/WxIkTi8xfsWKFgoKCznlfykNUVJTVJVRp9N86+/bt0759+6wuo0rieW8dem8t+m8dem8dev+XrKysEo2rsGFr69atevPNN/Xzzz/LZrOV++OPGzdOY8eOdU2npaWpYcOG6tWrl4KDg8u9njOx2+2KiopSz5495evra3U5VQ79t86BAwe0b98+NW/eXJdcconV5VQpPO+tQ++tRf+tQ++tQ++LKjzr7WwqbNj64YcflJCQoEaNGrnmORwOPfbYY5o+fboOHTqksLAwJSQkuK2Xn5+vpKQkhYWFSZLCwsIUHx/vNqZwunBMcfz9/eXv719kvq+vb4V9klXk2qoC+l/+vL29XV/pvTV43luH3luL/luH3luH3v+lpH2osJ+zdeedd2r79u2Kjo52/QsPD9cTTzyhb7/9VpIUGRmplJQUbd261bXeqlWr5HQ61bFjR9eYtWvXup1XGRUVpRYtWpz2FEIAAAAAOF+WHtnKyMjQgQMHXNMxMTGKjo5W7dq11ahRI9WpU8dtvK+vr8LCwtSiRQtJUsuWLdWnTx+NGDFCc+bMkd1u1+jRozVo0CDXbeIHDx6siRMnavjw4Xrqqae0c+dOvfnmm3rjjTfKb0cBAAAAVDmWhq0tW7aoa9eurunCa6SGDRumBQsWlGgbCxcu1OjRo9W9e3d5eXlpwIABmjFjhmt5zZo1tWLFCo0aNUrt27dX3bp1NX78eG77DgAAAMCjLA1bXbp0kTGmxOMPHTpUZF7t2rW1aNGiM67Xtm1b/fDDD+daHgAAAACUWoW9ZgsAAAAAKjPCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYAgAAAAAPIGwBAAAAgAcQtgAAAADAAwhbAAAAAOABhC0AAAAA8ADCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYAgAAAAAPIGwBAAAAgAcQtgAAAADAAwhbAAAAAOABhC0AAAAA8ADCFoBKKzU11e0rAABARULYAlBppaWluX0FAACoSAhbAAAAAOABhC0AAAAA8ADCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYAgAAAAAPIGwBAAAAgAcQtgAAAADAAwhbAAAAAOABhC0AAAAA8ADCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYAgAAAAAPIGwBAAAAgAcQtgAAAADAAwhbAAAAAOABhC0AAAAA8ADCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYAgAAAAAPIGwBAAAAgAcQtgAAAADAAwhbAAAAAOABhC0AAAAA8ADCFgAAAAB4gKVha+3atbrhhhsUHh4um82mL774wrXMbrfrqaeeUps2bVStWjWFh4dr6NChOnr0qNs2kpKSNGTIEAUHByskJETDhw9XRkaG25jt27erc+fOCggIUMOGDTV16tTy2D0AAAAAVZilYSszM1OXX365Zs2aVWRZVlaWfv75Zz333HP6+eeftWTJEu3du1f//Oc/3cYNGTJEu3btUlRUlJYuXaq1a9dq5MiRruVpaWnq1auXGjdurK1bt+rVV1/VhAkTNHfuXI/vHwAAAICqy8fKB+/bt6/69u1b7LKaNWsqKirKbd5bb72lq6++WrGxsWrUqJH27Nmj5cuXa/PmzerQoYMkaebMmerXr59ee+01hYeHa+HChcrLy9O8efPk5+en1q1bKzo6WtOmTXMLZQAAAABQliwNW+cqNTVVNptNISEhkqQNGzYoJCTEFbQkqUePHvLy8tLGjRt18803a8OGDbruuuvk5+fnGtO7d29NmTJFycnJqlWrVrGPlZubq9zcXNd0WlqapILTG+12uwf2rvQK66lodVUV9N86xhjXV/pfvnjeW4feW4v+W4feW4feF1XSXlSasJWTk6OnnnpKt99+u4KDgyVJcXFxql+/vts4Hx8f1a5dW3Fxca4xERERbmNCQ0Ndy04XtiZPnqyJEycWmb9ixQoFBQWd9/54wqlHAlG+6L91MjMztWzZMqvLqJJ43luH3luL/luH3luH3v8lKyurROMqRdiy2+0aOHCgjDGaPXt2uTzmuHHjNHbsWNd0WlqaGjZsqF69ernCXkVht9sVFRWlnj17ytfX1+pyqhz6b53vv/9emZmZqlatmq6//nqry6lSeN5bh95bi/5bh95bh94XVXjW29lU+LBVGLQOHz6sVatWuQWdsLAwJSQkuI3Pz89XUlKSwsLCXGPi4+PdxhROF44pjr+/v/z9/YvM9/X1rbBPsopcW1VA/8ufzWZzfaX31uB5bx16by36bx16bx16/5eS9qFCf85WYdDav3+/vvvuO9WpU8dteWRkpFJSUrR161bXvFWrVsnpdKpjx46uMWvXrnU7rzIqKkotWrQ47SmEAAAAAHC+LA1bGRkZio6OVnR0tCQpJiZG0dHRio2Nld1u17/+9S9t2bJFCxculMPhUFxcnOLi4pSXlydJatmypfr06aMRI0Zo06ZNWrdunUaPHq1BgwYpPDxckjR48GD5+flp+PDh2rVrlz755BO9+eabbqcIAgAAAEBZs/Q0wi1btqhr166u6cIANGzYME2YMEFfffWVJKldu3Zu661evVpdunSRJC1cuFCjR49W9+7d5eXlpQEDBmjGjBmusTVr1tSKFSs0atQotW/fXnXr1tX48eO57TsAAAAAj7I0bHXp0sV16+binGlZodq1a2vRokVnHNO2bVv98MMP51wfAAAAAJRWhb5mCwAAAAAqK8IWAAAAAHgAYQsAAAAAPICwBQAAAAAeQNgCAAAAAA8gbAEAAACABxC2AAAAAMADCFsAAAAA4AGELQAAAADwAMIWAAAAAHgAYQsAAAAAPICwBQAAAAAeQNgCAAAAAA8gbAEAAACABxC2AAAAAMADCFsAAAAA4AGELQAAAADwAMIWAAAAAHgAYQsAAAAAPICwBaDSSk9Pd/sKAABQkRC2AFRaGRkZbl8BAAAqEsIWAAAAAHgAYQsAAAAAPICwBQAAAAAeQNgCAAAAAA8gbAEAAACABxC2AAAAAMADCFsAAAAA4AGELQAAAADwAMIWAAAAAHgAYQsAAAAAPICwBQAAAAAeQNgCAAAAAA8gbAEAAACABxC2AAAAAMADCFsAAAAA4AGELQAAAADwAMIWAAAAAHgAYQsAAAAAPICwBQAAAAAeQNgCAAAAAA8gbAEAAACABxC2AAAAAMADCFsAAAAA4AGELQAAAADwAEvD1tq1a3XDDTcoPDxcNptNX3zxhdtyY4zGjx+vBg0aKDAwUD169ND+/fvdxiQlJWnIkCEKDg5WSEiIhg8froyMDLcx27dvV+fOnRUQEKCGDRtq6tSpnt41AAAAAFWcpWErMzNTl19+uWbNmlXs8qlTp2rGjBmaM2eONm7cqGrVqql3797KyclxjRkyZIh27dqlqKgoLV26VGvXrtXIkSNdy9PS0tSrVy81btxYW7du1auvvqoJEyZo7ty5Ht8/AAAAAFWXj5UP3rdvX/Xt27fYZcYYTZ8+Xc8++6xuvPFGSdIHH3yg0NBQffHFFxo0aJD27Nmj5cuXa/PmzerQoYMkaebMmerXr59ee+01hYeHa+HChcrLy9O8efPk5+en1q1bKzo6WtOmTXMLZQAAAABQliwNW2cSExOjuLg49ejRwzWvZs2a6tixozZs2KBBgwZpw4YNCgkJcQUtSerRo4e8vLy0ceNG3XzzzdqwYYOuu+46+fn5ucb07t1bU6ZMUXJysmrVqlXs4+fm5io3N9c1nZaWJkmy2+2y2+1lvbvnpbCeilZXVUH/Kwb6X7543luH3luL/luH3luH3hdV0l5U2LAVFxcnSQoNDXWbHxoa6loWFxen+vXruy338fFR7dq13cZEREQU2UbhstOFrcmTJ2vixIlF5q9YsUJBQUGl2CPPi4qKsrqEKo3+l78aNWq4vi5btsziaqomnvfWoffWov/WoffWofd/ycrKKtG4Chu2rDZu3DiNHTvWNZ2WlqaGDRuqV69eCg4OtrCyoux2u6KiotSzZ0/5+vpaXU6VQ/+tM3/+fIWGhio+Pl5333231eVUKTzvrUPvrUX/rUPvrUPviyo86+1sKmzYCgsLkyTFx8erQYMGrvnx8fFq166da0xCQoLbevn5+UpKSnKtHxYWpvj4eLcxhdOFY4rj7+8vf3//IvN9fX0r7JOsItdWFdD/8peRkaHQ0FBlZGTQe4vwvLcOvbcW/bcOvbcOvf9LSftQYT9nKyIiQmFhYVq5cqVrXlpamjZu3KjIyEhJUmRkpFJSUrR161bXmFWrVsnpdKpjx46uMWvXrnU7rzIqKkotWrQ47SmEAAAAAHC+LA1bGRkZio6OVnR0tKSCm2JER0crNjZWNptNjzzyiF588UV99dVX2rFjh4YOHarw8HDddNNNkqSWLVuqT58+GjFihDZt2qR169Zp9OjRGjRokMLDwyVJgwcPlp+fn4YPH65du3bpk08+0Ztvvul2iiAAAAAAlDVLTyPcsmWLunbt6pouDEDDhg3TggUL9OSTTyozM1MjR45USkqKOnXqpOXLlysgIMC1zsKFCzV69Gh1795dXl5eGjBggGbMmOFaXrNmTa1YsUKjRo1S+/btVbduXY0fP57bvgMAAADwKEvDVpcuXWSMOe1ym82mSZMmadKkSacdU7t2bS1atOiMj9O2bVv98MMPpa4TAAAAAM5Vhb1mCwAAAAAqM8IWAAAAAHgAYQsAAAAAPICwBQAAAAAeQNgCAAAAAA8gbAEAAACABxC2AAAAAMADCFsAAAAA4AGELQAAAADwAMIWAAAAAHhAqcLWb7/9VtZ1AAAAAMAFpVRh65JLLlHXrl314YcfKicnp6xrAgAAAIBKr1Rh6+eff1bbtm01duxYhYWF6b777tOmTZvKujYAAAAAqLRKFbbatWunN998U0ePHtW8efN07NgxderUSZdddpmmTZumxMTEsq4TAAAAACqV87pBho+Pj2655RYtXrxYU6ZM0YEDB/T444+rYcOGGjp0qI4dO1ZWdQIAAABApXJeYWvLli168MEH1aBBA02bNk2PP/64Dh48qKioKB09elQ33nhjWdUJAAAAAJWKT2lWmjZtmubPn6+9e/eqX79++uCDD9SvXz95eRVkt4iICC1YsEBNmjQpy1oBAAAAoNIoVdiaPXu27rnnHt11111q0KBBsWPq16+v995777yKAwAAAIDKqlRha//+/Wcd4+fnp2HDhpVm8wAAAABQ6ZXqmq358+dr8eLFReYvXrxY77///nkXBQAAAACVXanC1uTJk1W3bt0i8+vXr6+XX375vIsCAAAAgMquVGErNjZWERERReY3btxYsbGx510UAAAAAFR2pQpb9evX1/bt24vM/+WXX1SnTp3zLgoAAAAAKrtSha3bb79dDz/8sFavXi2HwyGHw6FVq1ZpzJgxGjRoUFnXCAAAAACVTqnuRvjCCy/o0KFD6t69u3x8CjbhdDo1dOhQrtkCAAAAAJUybPn5+emTTz7RCy+8oF9++UWBgYFq06aNGjduXNb1AQAAAEClVKqwVah58+Zq3rx5WdUCAAAAABeMUoUth8OhBQsWaOXKlUpISJDT6XRbvmrVqjIpDgAAAAAqq1KFrTFjxmjBggXq37+/LrvsMtlstrKuCwAAAAAqtVKFrY8//liffvqp+vXrV9b1AAAAAMAFoVS3fvfz89Mll1xS1rUAAAAAwAWjVGHrscce05tvviljTFnXAwAAAAAXhFKdRvjjjz9q9erV+uabb9S6dWv5+vq6LV+yZEmZFAcAJZGZmWl1CQAAAEWUKmyFhITo5ptvLutaAOCcFIas/375P91///2qV6+exRUBAAD8pVRha/78+WVdBwCcs9zcXElSjt2ptLQ0whYAAKhQSnXNliTl5+fru+++0zvvvKP09HRJ0tGjR5WRkVFmxQEAAABAZVWqI1uHDx9Wnz59FBsbq9zcXPXs2VM1atTQlClTlJubqzlz5pR1nQAAAABQqZTqyNaYMWPUoUMHJScnKzAw0DX/5ptv1sqVK8usOAAAAACorEp1ZOuHH37Q+vXr5efn5za/SZMmOnLkSJkUBgAAAACVWamObDmdTjkcjiLz//jjD9WoUeO8iwIAAACAyq5UYatXr16aPn26a9pmsykjI0PPP/+8+vXrV1a1AQAAAEClVarTCF9//XX17t1brVq1Uk5OjgYPHqz9+/erbt26+uijj8q6RgAAAACodEoVti6++GL98ssv+vjjj7V9+3ZlZGRo+PDhGjJkiNsNMwAAAACgqipV2JIkHx8f3XHHHWVZCwAAAABcMEoVtj744IMzLh86dGipigEAAACAC0WpwtaYMWPcpu12u7KysuTn56egoKAyC1sOh0MTJkzQhx9+qLi4OIWHh+uuu+7Ss88+K5vNJkkyxuj555/Xu+++q5SUFF177bWaPXu2mjVr5tpOUlKSHnroIX399dfy8vLSgAED9Oabb6p69eplUicAAAAAnKpUdyNMTk52+5eRkaG9e/eqU6dOZXqDjClTpmj27Nl66623tGfPHk2ZMkVTp07VzJkzXWOmTp2qGTNmaM6cOdq4caOqVaum3r17KycnxzVmyJAh2rVrl6KiorR06VKtXbtWI0eOLLM6AQAAAOBUpb5m61TNmjXTK6+8ojvuuEO//vprmWxz/fr1uvHGG9W/f39JBR+a/NFHH2nTpk2SCo5qTZ8+Xc8++6xuvPFGSQWnOIaGhuqLL77QoEGDtGfPHi1fvlybN29Whw4dJEkzZ85Uv3799Nprryk8PLxMagUAAACAk5VZ2JIKbppx9OjRMtve3//+d82dO1f79u1T8+bN9csvv+jHH3/UtGnTJEkxMTGKi4tTjx49XOvUrFlTHTt21IYNGzRo0CBt2LBBISEhrqAlST169JCXl5c2btyom2++udjHzs3NVW5urms6LS1NUsEpk3a7vcz2sSwU1lPR6qoq6L91vLwKDs77+/vJ4XDwPShHPO+tQ++tRf+tQ++tQ++LKmkvShW2vvrqK7dpY4yOHTumt956S9dee21pNlmsp59+Wmlpabr00kvl7e0th8Ohl156SUOGDJEkxcXFSZJCQ0Pd1gsNDXUti4uLU/369d2W+/j4qHbt2q4xxZk8ebImTpxYZP6KFSsUFBR0XvvlKVFRUVaXUKXR//LXvn17SdILzzyhPXv2aM+ePRZXVPXwvLcOvbcW/bcOvbcOvf9LVlZWicaVKmzddNNNbtM2m0316tVTt27d9Prrr5dmk8X69NNPtXDhQi1atEitW7dWdHS0HnnkEYWHh2vYsGFl9jjFGTdunMaOHeuaTktLU8OGDdWrVy8FBwd79LHPld1uV1RUlHr27ClfX1+ry6ly6L91XnjhBbVv317PvfSq/vvhPEVERFhdUpXB89469N5a9N869N469L6owrPezqZUYcvpdJZmtXP2xBNP6Omnn9agQYMkSW3atNHhw4c1efJkDRs2TGFhYZKk+Ph4NWjQwLVefHy82rVrJ0kKCwtTQkKC23bz8/OVlJTkWr84/v7+8vf3LzLf19e3wj7JKnJtVQH9L3+Fr0W5uXny9vam/xbgeW8dem8t+m8dem8dev+XkvahVHcjLC9ZWVmuazIKeXt7u95gRUREKCwsTCtXrnQtT0tL08aNGxUZGSlJioyMVEpKirZu3eoas2rVKjmdTnXs2LEc9gIAAABAVVSqI1snn153NoU3syiNG264QS+99JIaNWqk1q1ba9u2bZo2bZruueceSQWnLz7yyCN68cUX1axZM0VEROi5555TeHi461THli1bqk+fPhoxYoTmzJkju92u0aNHa9CgQdyJELhAZKanKCUlxeoyAAAA3JQqbG3btk3btm2T3W5XixYtJEn79u2Tt7e3rrzySte4wg8eLq2ZM2fqueee04MPPqiEhASFh4frvvvu0/jx411jnnzySWVmZmrkyJFKSUlRp06dtHz5cgUEBLjGLFy4UKNHj1b37t1dH2o8Y8aM86oNQMWRlZ6i1NRUq8sAAABwU6qwdcMNN6hGjRp6//33VatWLUkFH3R89913q3PnznrsscfKpLgaNWpo+vTpmj59+mnH2Gw2TZo0SZMmTTrtmNq1a2vRokVlUhMAAAAAlESprtl6/fXXNXnyZFfQkqRatWrpxRdfLNO7EQIAAABAZVWqsJWWlqbExMQi8xMTE5Wenn7eRQEAAABAZVeqsHXzzTfr7rvv1pIlS/THH3/ojz/+0Geffabhw4frlltuKesaAaBYJf1AQQAAACuUKmzNmTNHffv21eDBg9W4cWM1btxYgwcPVp8+ffT222+XdY0AUERiYqL+t3yF1WUAAACcVqlukBEUFKS3335br776qg4ePChJatq0qapVq1amxQHA6aSlpSknzy5JMsbiYgAAAIpxXh9qfOzYMR07dkzNmjVTtWrVZHjHAwAAAACSShm2Tpw4oe7du6t58+bq16+fjh07JkkaPnx4md32HQAAAAAqs1KFrUcffVS+vr6KjY1VUFCQa/5tt92m5cuXl1lxAAAAAFBZleqarRUrVujbb7/VxRdf7Da/WbNmOnz4cJkUBgAAAACVWamObGVmZrod0SqUlJQkf3//8y4KAAAAACq7UoWtzp0764MPPnBN22w2OZ1OTZ06VV27di2z4gAAAACgsirVaYRTp05V9+7dtWXLFuXl5enJJ5/Url27lJSUpHXr1pV1jQAAAABQ6ZTqyNZll12mffv2qVOnTrrxxhuVmZmpW265Rdu2bVPTpk3LukYAAAAAqHTO+ciW3W5Xnz59NGfOHD3zzDOeqAkAAAAAKr1zPrLl6+ur7du3e6IWAAAAALhglOo0wjvuuEPvvfdeWdcCAAAAABeMUt0gIz8/X/PmzdN3332n9u3bq1q1am7Lp02bVibFAQAAAEBldU5h67ffflOTJk20c+dOXXnllZKkffv2uY2x2WxlVx0AAAAAVFLnFLaaNWumY8eOafXq1ZKk2267TTNmzFBoaKhHigMAAACAyuqcrtkyxrhNf/PNN8rMzCzTggAAAADgQlCqG2QUOjV8AQAAAAAKnFPYstlsRa7J4hotAAAAACjqnK7ZMsborrvukr+/vyQpJydH999/f5G7ES5ZsqTsKgSAs3Dk25WWlmZ1GQAAAG7OKWwNGzbMbfqOO+4o02IAoDSc+fnKyMiwugwAAAA35xS25s+f76k6AAAAAOCCcl43yAAAAAAAFI+wBQAAAAAeQNgCAAAAAA8gbAGo9IxxcoMMAABQ4RC2AFR6xhhlZmZaXQYAAIAbwhYAAAAAeABhCwAAAAA8gLAFAAAAAB5A2AIAAAAADyBsAQAAAIAHELYAVEopKSnKzc6xugwAAIDTImwBqJRSU1OVk0fYAgAAFRdhCwAAAAA8gLAFAAAAAB5A2AIAAAAADyBsAaiU0tPT5XQY13RWVpaF1QAAABRF2AJQKaWnp8vpdLimCVsAAKCiIWwBuCDs2rVLSUlJVpcBAADgQtgCcEHYvXu3kpOTrS4DAADAhbAF4ILgcDjOPggAAKAcVfiwdeTIEd1xxx2qU6eOAgMD1aZNG23ZssW13Bij8ePHq0GDBgoMDFSPHj20f/9+t20kJSVpyJAhCg4OVkhIiIYPH66MjIzy3hUAnuLjr6PH4hQTE2N1JQAAAC4VOmwlJyfr2muvla+vr7755hvt3r1br7/+umrVquUaM3XqVM2YMUNz5szRxo0bVa1aNfXu3Vs5OTmuMUOGDNGuXbsUFRWlpUuXau3atRo5cqQVuwTAE3x8lW+3Ky4uzupKAAAAXHysLuBMpkyZooYNG2r+/PmueREREa7/G2M0ffp0Pfvss7rxxhslSR988IFCQ0P1xRdfaNCgQdqzZ4+WL1+uzZs3q0OHDpKkmTNnql+/fnrttdcUHh5evjsFAAAAoEqo0GHrq6++Uu/evXXrrbfq+++/10UXXaQHH3xQI0aMkCTFxMQoLi5OPXr0cK1Ts2ZNdezYURs2bNCgQYO0YcMGhYSEuIKWJPXo0UNeXl7auHGjbr755mIfOzc3V7m5ua7ptLQ0SZLdbpfdbvfE7pZaYT0Vra6qgv5bJzAgoOCrv79sAf7KzMzk+1BOeN5bh95bi/5bh95bh94XVdJe2Iwx5uzDrBHw5xupsWPH6tZbb9XmzZs1ZswYzZkzR8OGDdP69et17bXX6ujRo2rQoIFrvYEDB8pms+mTTz7Ryy+/rPfff1979+5123b9+vU1ceJEPfDAA8U+9oQJEzRx4sQi8xctWqSgoKAy3EsAAAAAlUlWVpYGDx6s1NRUBQcHn3ZchT6y5XQ61aFDB7388suSpCuuuEI7d+50hS1PGjdunMaOHeuaTktLU8OGDdWrV68zNtQKdrtdUVFR6tmzp3x9fa0up8qh/9b45JNP9OjjT+nf77yte+4bpey0JL344ot66KGHrC6tSuB5bx16by36bx16bx16X1ThWW9nU6HDVoMGDdSqVSu3eS1bttRnn30mSQoLC5MkxcfHux3Zio+PV7t27VxjEhIS3LaRn5+vpKQk1/rF8ff3l7+/f5H5vr6+FfZJVpFrqwrof/nL/vNGONk5OcrOzpYxhu9BOeN5bx16by36bx16bx16/5eS9qFC343w2muvLXL63759+9S4cWNJBTfLCAsL08qVK13L09LStHHjRkVGRkqSIiMjlZKSoq1bt7rGrFq1Sk6nUx07diyHvQAAAABQFVXoI1uPPvqo/v73v+vll1/WwIEDtWnTJs2dO1dz586VJNlsNj3yyCN68cUX1axZM0VEROi5555TeHi4brrpJkkFR8L69OmjESNGaM6cObLb7Ro9erQGDRrEnQgBAAAAeEyFDltXXXWVPv/8c40bN06TJk1SRESEpk+friFDhrjGPPnkk8rMzNTIkSOVkpKiTp06afny5a6ba0jSwoULNXr0aHXv3l1eXl4aMGCAZsyYYcUuAQAAAKgiKnTYkqR//OMf+sc//nHa5TabTZMmTdKkSZNOO6Z27dpatGiRJ8oDAAAAgGJV6Gu2AKBkCj7BIisry+I6AAAA/kLYAlD5GcIWAACoeAhbAAAAAOABhC0AAAAA8ADCFoALBqcRAgCAioSwBaBSysjIkPPPa7VkjGx+QVq6/DslJiZaWxgAAMCfCFsAKqXMzMyTpoxsfgHKcUhpaWmW1QQAAHAywhaAC4IxTmWlpyolJcXqUgAAACQRtgBcKIxRdkaqUlNTra4EAABAEmELQCVVcBqhsboMAACA0yJsAaiUsrOzyVoAAKBCI2wBuCAY41S+3a6lS5cqKSnJ6nIAAAAIWwAqp+zsbPcZxsiZb9fq1auVnJxsTVEAAAAnIWwBqJRycnLkdh6hMTLGyOFwWFYTAADAyQhbAC4Mxkgyys/Pt7oSAAAASYQtAAAAAPAIwhYAAAAAeABhCwAAAAA8gLAFAAAAAB5A2AJwgSi4MyF3IwQAABUFYQvAhcEQtgAAQMVC2AJwQSFsAQCAioKwBeDCYIzkG6CExOM6ceKE1dUAAAAQtgBcKIzk46s8u11Hjx61uhgAAADCFoALiDFy5ucrIyPD6koAAAAIWwAqp+zsbKtLAAAAOCPCFoBKJzExUd+t/t59ppFkjIxxcmQLAABUCIQtAJVOWlqacvLsp8w1f4Yto/j4eEvqAgAAOBlhC8CFwxjZ/IL00X+/UGJiotXVAACAKo6wBeACYmTzC1C23am0tDSriwEAAFUcYQsAAAAAPICwBQAAAAAeQNgCAAAAAA8gbAEAAACABxC2AAAAAMADCFsAAAAA4AGELQAAAADwAMIWAAAAAHgAYQvABcRIkpxOp8V1AAAAELYAXEgMYQsAAFQchC0AAAAA8ADCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYAnDBcTjydeLECavLAAAAVVylCluvvPKKbDabHnnkEde8nJwcjRo1SnXq1FH16tU1YMAAxcfHu60XGxur/v37KygoSPXr19cTTzyh/Pz8cq4eQFk5fPiwMjMyil3mdOTpREKcRj3yuBITE8u5MgAAgL9UmrC1efNmvfPOO2rbtq3b/EcffVRff/21Fi9erO+//15Hjx7VLbfc4lrucDjUv39/5eXlaf369Xr//fe1YMECjR8/vrx3AUAZOXr0qPLycotf6HDKafNW7O+/KzY2tnwLAwAAOEmlCFsZGRkaMmSI3n33XdWqVcs1PzU1Ve+9956mTZumbt26qX379po/f77Wr1+vn376SZK0YsUK7d69Wx9++KHatWunvn376oUXXtCsWbOUl5dn1S4B8BgjGaP0lCSlpqZaXQwAAKjCfKwuoCRGjRql/v37q0ePHnrxxRdd87du3Sq73a4ePXq45l166aVq1KiRNmzYoGuuuUYbNmxQmzZtFBoa6hrTu3dvPfDAA9q1a5euuOKKYh8zNzdXubl//eU8LS1NkmS322W328t6F89LYT0Vra6qgv5bIzAwUAH+/gX/Dwgo+EBjm02yeUk+PvJ15istLY3vi4fwvLcOvbcW/bcOvbcOvS+qpL2o8GHr448/1s8//6zNmzcXWRYXFyc/Pz+FhIS4zQ8NDVVcXJxrzMlBq3B54bLTmTx5siZOnFhk/ooVKxQUFHSuu1EuoqKirC6hSqP/5adGjRpa9MEC1/S8d9857dhly5aVQ0VVF89769B7a9F/69B769D7v2RlZZVoXIUOW7///rvGjBmjqKgoBQQElOtjjxs3TmPHjnVNp6WlqWHDhurVq5eCg4PLtZazsdvtioqKUs+ePeXr62t1OVUO/S9/n3zyie4b9ZAC/P017913dM+I+5SdnV1wZEuSfPzklZetOXNm67bbbrO22AsUz3vr0Htr0X/r0Hvr0PuiCs96O5sKHba2bt2qhIQEXXnlla55DodDa9eu1VtvvaVvv/1WeXl5SklJcTu6FR8fr7CwMElSWFiYNm3a5LbdwrsVFo4pjr+/v/z/PEXpZL6+vhX2SVaRa6sK6H/5ys7OljGm4P85OaeELYe88rIlie+Jh/G8tw69txb9tw69tw69/0tJ+1Chb5DRvXt37dixQ9HR0a5/HTp00JAhQ1z/9/X11cqVK13r7N27V7GxsYqMjJQkRUZGaseOHUpISHCNiYqKUnBwsFq1alXu+wQAAACgaqjQR7Zq1Kihyy67zG1etWrVVKdOHdf84cOHa+zYsapdu7aCg4P10EMPKTIyUtdcc40kqVevXmrVqpXuvPNOTZ06VXFxcXr22Wc1atSoYo9cAQAAAEBZqNBhqyTeeOMNeXl5acCAAcrNzVXv3r319ttvu5Z7e3tr6dKleuCBBxQZGalq1app2LBhmjRpkoVVAwAAALjQVbqwtWbNGrfpgIAAzZo1S7NmzTrtOo0bN+aOZEAVY4wp8cWrAAAAnlChr9kCgFJxOiXfAM2aO0+JiYlWVwMAAKoowhaAC49xyOYXoLSsXI5uAQAAyxC2AFx4/rwlvNPptLgQAABQlRG2AFyQjHEqKz1VKSkpVpcCAACqKMIWgEonIyPD9YHGp2WMsjNSlZqaWj5FAQAAnKLS3Y0QADIzM886xhinHI58paenl0NFAAAARXFkC8CFyRg58+2ELQAAYBnCFoBKJyMjw+oSAAAAzoqwBaBSSUxM1MKPP5XOcskWAACA1QhbACqVtLQ0ZWRn6axpyxgZYziNEAAAWIawBaDSceSX4LCWMQW3f8/K8nxBAAAAxSBsAQAAAIAHELYAVCopKSnKzc62ugwAAICzImwBqFRSU1OVnZtTgpEFpxpyGiEAALAKYQvAhckQtgAAgLUIWwAuaLt27VJSUpLVZQAAgCqIsAXgwvTnka2dO3cqOTnZ4mIAAEBVRNgCcIEqCFt2u93iOgAAQFVF2AJwYTJG8vFXfEKifvvtN6urAQAAVRBhC0Clkp6eLqfDWbLBPr7Kz89XfHy8Z4sCAAAoBmELQKWSnp4up9NRssHGyBinMjIyPFsUAABAMQhbACqVjIwMOf+8+cVZGSMZo8zMTM8WBQAAUAzCFoBKheAEAAAqC8IWAAAAAHgAYQtApZKVlaXC27oDAABUZIQtAJXK8ePHyVoAAKBSIGwBqDQSExP15dJlIm0BAIDKgLAFoNJIS0tTdq79HNYoCGU//fSTkpKSPFMUAADAaRC2AFy4/rxF/A8//KCYmBiLiwEAAFUNYQvABS89PV2pqalWlwEAAKoYwhaAC54p6YcgAwAAlCHCFoALlzGSj59y8/KUkpJidTUAAKCKIWwBuIAVhC2Zws/nAgAAKD+ELQAAAADwAMIWgEojJSVFudnZ57yeMUZpaWkeqAgAAOD0CFsAKo3U1FRl5+ac20rGyOYXqDnvLVBiYqJnCgMAACgGYQvAhc0Y2XwDlJnn4OgWAAAoV4QtAJVGenq6nA7nOa5VcNt3p8NR9gUBAACcAWELQKWRnp4up/McQ5MxchqHUpMS9fHHHyspKckzxQEAAJyCsAWg0sjIyJCzNB9QbIwy01K1dOlSJScnl31hAAAAxSBsAag0MjMzrS4BAACgxAhbACqNgg8mLsWRLQAAAAsQtgBUGllZWaXKWsY45XTYlZ+fX/ZFAQAAnAZhC0ClkJSUpF27dp37isZIxsiRn0/YAgAA5YqwBaBSSE5O1vbt20uxpnH7AgAAUF4IWwAqhRMnTij++AmRmgAAQGVR4cPW5MmTddVVV6lGjRqqX7++brrpJu3du9dtTE5OjkaNGqU6deqoevXqGjBggOLj493GxMbGqn///goKClL9+vX1xBNPcEoRUIlkZGTIWdqXLGNkjOFnHgAAlKsKH7a+//57jRo1Sj/99JOioqJkt9vVq1cvt1tAP/roo/r666+1ePFiff/99zp69KhuueUW13KHw6H+/fsrLy9P69ev1/vvv68FCxZo/PjxVuwSgPJmjCQjh+McPxAZAADgPPhYXcDZLF++3G16wYIFql+/vrZu3arrrrtOqampeu+997Ro0SJ169ZNkjR//ny1bNlSP/30k6655hqtWLFCu3fv1nfffafQ0FC1a9dOL7zwgp566ilNmDBBfn5+VuwagHOQnp4up8N5XtsgbAEAgPJU4cPWqVJTUyVJtWvXliRt3bpVdrtdPXr0cI259NJL1ahRI23YsEHXXHONNmzYoDZt2ig0NNQ1pnfv3nrggQe0a9cuXXHFFUUeJzc3V7m5ua7ptLQ0SZLdbpfdbvfIvpVWYT0Vra6qgv6Xj7i4OPn6+crX17tghjEKDAiQpIKvxkg2218rnDxt85IC/HUiOVmJiYlq1KhROVd/4eF5bx16by36bx16bx16X1RJe2EzxlSaq82dTqf++c9/KiUlRT/++KMkadGiRbr77rvdgpEkXX311erataumTJmikSNH6vDhw/r2229dy7OyslStWjUtW7ZMffv2LfJYEyZM0MSJE4vMX7RokYKCgsp4zwAAAABUFllZWRo8eLBSU1MVHBx82nGV6sjWqFGjtHPnTlfQ8qRx48Zp7Nixrum0tDQ1bNhQvXr1OmNDrWC32xUVFaWePXvK19fX6nKqHPpfPmbOnKlnJ74omT9PJTRGgYGBmvfuO7pnxH3Kzs4+/ZEtSTa/APnJqf9+8pGuu+66cq7+wsPz3jr03lr03zr03jr0vqjCs97OptKErdGjR2vp0qVau3atLr74Ytf8sLAw5eXlKSUlRSEhIa758fHxCgsLc43ZtGmT2/YK71ZYOOZU/v7+8vf3LzLf19e3wj7JKnJtVQH995ykpCStW7dO2dlZf97sQm5hKjsn5+xhyyE55JDNZuP7VIZ43luH3luL/luH3luH3v+lpH2o8HcjNMZo9OjR+vzzz7Vq1SpFRES4LW/fvr18fX21cuVK17y9e/cqNjZWkZGRkqTIyEjt2LFDCQkJrjFRUVEKDg5Wq1atymdHAJTagQMHtDxq5Xl9xJYxTjny7SX+SxQAAMD5qvBHtkaNGqVFixbpyy+/VI0aNRQXFydJqlmzpgIDA1WzZk0NHz5cY8eOVe3atRUcHKyHHnpIkZGRuuaaayRJvXr1UqtWrXTnnXdq6tSpiouL07PPPqtRo0YVe/QKQMVy7Ngx5dkdOs+0JWd+vjIyMsqsLgAAgDOp8Ee2Zs+erdTUVHXp0kUNGjRw/fvkk09cY9544w394x//0IABA3TdddcpLCxMS5YscS339vbW0qVL5e3trcjISN1xxx0aOnSoJk2aZMUuAThHx44dU35+3vltxBg5nU6tWrVKSUlJZVMYAADAGVT4I1sluVliQECAZs2apVmzZp12TOPGjbVs2bKyLA1AOTn5Q8xLzTglGa1bt07Jycmuj48AAADwlAp/ZAsAyiZsFfzhhg82BgAA5YWwBaDCy87OPq/LtU5G2AIAAOWFsAWganA6JR9/HTl6TL/99pvV1QAAgCqAsAWgQktKStKuXbvKYEtG8vFVfn6+63P2AAAAPImwBaBCi4mJ0bp168pse8bp1IIFC3Tw4MEy2yYAAEBxCFsAKrTDhw8rJS1DZXbRlqTNmzfr8OHDZbY9AACA4hC2AFRoWVlZkpd3GW7RKDs7W0ePHi3DbQIAABRF2AJQoaWlpcmU3a0IJS8f2e12bd++vWy2CQAAcBqELQAVVmJiombP/bdK8NnmJWMckpe3bH5B+uzL/ykxMbGMNgwAAFAUYQtAhZWWlqb07DyV5fVakpHNL0A5joLtAwAAeAphC0CFlZKSooz01LLNWgAAAOWEsAWgwkpNTVVGerpIWwAAoDIibAGosNLT0+XId5T5do1xKis9VSkpKWW+bQAAgEKELQAVUlJSkr799ls5nWUftmSMsjNSlZqaqsTERG6UAQAAPIKwBaBCiomJ0ddffy1nmd2K8C/GOJVvt+vTTz/VbXcM0x1330vgAgAAZY6wBaBCSk1NVVJSkjxyvZYxctjz9PXXXys+KVVJ6VncmRAAAJQ5whaACik9PV35+fmeuTeGMZKMjh8/LntengceAAAAgLAFoII6duyY8vLK+jO2/uRwSF4+ysvLU05ubtlvHwAAQIQtABXUoUOHJJu3h7bulLx9JMkjdzsEAACQCFsAKqiUlBTJ21NhCwAAwPMIWwCqtOycbDny860uAwAAXIAIWwAqnKSkJO3atatcHisjPUNZ2dnl8lgAAKBqIWwBqHBWrlypnzZu8uyDOJ2Sl4/yHXYlHv1DMTExnn08AABQ5RC2AFQoP/30kx5+5DHlOz39SEby9pFxOpSSmqqRD4zWvn37PP2gAACgCiFsAagw9u3bp0FD7lTc8ePyzAdsFcMY2Xz8lJAQrz/++KN8HhMAAFQJPlYXAABSwXVac+bM0dH4xIJT/MqLMXI67MrNzdXRo0fL73EBAMAFjyNbACqE5ORkrV69Wvl2D32QcXGMkYyRcTiVb7crPj6+fB4XAABUCRzZAlBh5OTkyJhyClqS/gp1RpLR2rVrVaNGDf3rX/9S7dq1y7EOAABwISJsAbBcUlKSZs6cqQO/HSo42lSezF+nLK5bt07Jyclq3769li9frj59+hC6AABAqXEaIQDLJScna8WKFco3UrmdQljopLCVkZGhtLQ0LVmyRB988IGSk5PLtxYAAHBB4cgWAMudOHFCubm55X9U6xS5Tmnnrl3Kzc1VgwYNXPOTkpI40gUAAM4ZR7YAWGrfvn0aOnyEjlSIOwHa5LD5KOZwrI4cOaKUlBRJBUfePvroI450AQCAc8KRLQCWKDxalJaWppjDf8ieZ5e8LHpJMkaSl2ScsvkFypGfo9jYWL311luKjIxU+/btrakLAABUaoQtAJZITk7W22+/rbS0NOXl5f55qZZVpxEaydu74H9Oh/LzcpXv669Fiz7Sr7/+qtDQULcjXQAAACXBaYQALBETE6Nt23dpx44dksMheVWQl6P8fMnmLXn5KC8vV7Gxsdq3b58OHz6sw4cPW10dAACoRCrIuxsAVU1cXJzyHIV3AnSecWz5chYc5XI6JG8/HT16VC9OeVUpmbl65vkXtGfPHu3bt09z5sxRUlKS1cUCAIAKjNMIAZS7xMREHThwQPmOfKtLOT3j/PNom5/S0jJk8/PX4T+O6O6RD0jG6OD+vWratKkSExO5SyEAACgWYQtAudqzZ49GPPiQft21Q3I4C07Zq4iMUcFRLh/J6ZBxOmR3eGvXzh3yC6yu1OQkzZkzR8nJyfrtt99Uv359/etf/yJ0AQAAF8IWAI9LTEyUVHBTjJsHDtIfcYnKSjoheXm7bkxRYRV+6LHDIYfJU0Z6hnxy8+Rw2vTFl1+qebNm+t///qfAwEB17969SNgq3Pd69eqVd+UAAMBihC0AHrVnzx49OOYxyTh18w399PuRo8rOzpax+AOMS6wwbDnzZWw2SUb5f97QwykvxRyOVYOcHIWFhemrr77SsGHD5HA4XKvfcfe9kqSZ017Vli1bOOUQAIAqhLAFwGMSExM18sGHFL37VzlycrRp82ZlZ+cUBC2vCn5E61TGnBS8nJKM5OuvvLxsHTt2TIGBgXrnnXf066+/atXa9fKyGb00aYKS0rNkz8vTzp079dFHH6ljx46ELQAAqgjCFgCPiYmJUfzxZOVmZsphTMG1T8b55/VQldCpdTudMo585TrydezYMWVmZiom9g/l2wruZvjQmEcl/yClJSfr+RdeliM3SzExMa4ba0icXggAwIWMsAWgzCQmJio5OVlr1qxRTEyM5r3/oZLTMmTPy5VsNsk4Km/Qkgpqt3nL9eHLTodkK3gZTUlJK7j+zCFJ+bJ5+yghIV4+AdXktPkoLj5BKSnJGjjodt0x+HZt2vaLjv4eq3ffmaOIiAht2bJFHTt21MqVKyWp3G62cfDgQb300ku6//77dfXVV3v88QAAqEoIWwBK5GxHYvbt26ebB96u7Ix05WRl6MSJE8qTt+T8865+lThj/cW439DDOCXvPz+u0NgK7lyogtMNjT1PRjbl5eVKXnYdj0+VfHyVnJaut9+eLe+gYOWlJ2ngkKHy8ZKCqwWpUaNGiomJ0UUXXaTu3btLkpYvX37G67xO/r6c7v9n8ssvv2jR4s+149cDWvblZ675HHEDAOD8EbYAnFViYqLrRg8fzv+368388ePHlZKSovXr12vLli06EHNYzpxM5TsdUr5d8vH7ayPGFBzdulAUtz+mMFSaguW+/pIjX8rPl2x/LpeXHE6HHDnZkqT0zCyZnAylnPDSod+PyubtraTkZI0YMUJeXl76/ffflZycrMWLF6tnz5564IEHXMGr8PuSl5urFyc8p+cmvqi4Y0d1279u0ffrN8rX11fTX31F3t7e2rJlizp06KBatWrJ29tbn376qSIiIvThhx/K6eWr1MwcxcTE6Olnn1fcsSOa9+5cXXPNNeXZUQAALjhVKmzNmjVLr776quLi4nT55Zdr5syZnDaDKu1sRz8KA9XOnTu177dYVa8epJ9//lmNGjXSiAdG6+ctW5XnyJfyc+WQTfLyLQgW3j6S7OW4JxVEMdd0FcwrnG/+OhpmHJLNW8aRL9l85HQaydcm4+WtzIwMrf5hnZSfJ/kF6oknn1Z2Voa2bdumP/74QyEhIdq4caNiY2OVmJ6jvJxs3XrbYDl9/JWRFK/58+croFZ9ZWeka+g9I5WWmqx6tUOU7+WrtOQTuuP2QXrxlVclI2VnZ8o7MFh2e56OHTumPfv2KzEhQfeMfEDtLmupYcOG6corr5QkHT9+XJJUt25dhYSEuO1qUlKSPv30U3Xr1k3NmzeXxG3vAQCoMmHrk08+0dixYzVnzhx17NhR06dPV+/evbV3717Vr1/f6vKAMlHcm9ukpCS3U9FO/syrWwffqTp16mjW9Nfl7e2tr7/+WgkJCfLy8tLOnTu1ffdenTh+QnaHXfnyks04dNOtg+Qjp/KMt/LseQU5wmEKAoQzX/Ly+jNgeFnQgQrGOOR2/qQ55f/e3ieFrz+Phjny/7wu7M+jZkbKzs6RbD5Ky8zRnDlz5OUbIGe+vWCMr5/kZdOxhEx5+wXKlpejI0eOyCclS/bMVMXFJSgvI0mH/Pxk86um3JxsPffceDl9/QvCoJeXHI48/X7gV40YMULH07JkvLy0/9c9+nXvPi3+Yqnq1q4pL19fJSYmyhgpwMumK65op8cee0wDBgxQ69atlZycrA8++lQXhYcrpHqgnnrqKb274D+SpOmvviKpIKSdGrz27dunL7/8Up07d1bTpk2VnJzsNi1JBw4c0C+//KJu3bpJkttRuuJOnzx+/Hixj1WocHwhwiAAwFOqTNiaNm2aRowYobvvvluSNGfOHP3vf//TvHnz9PTTT1tcXeVT3Jv6c71e5GzbON2Yk8ee/Jf2k9c5df7Jb8AKnVznqU63jiS3N3KJiYmKj493zU9JSXEbW7juyds5ubaTp4urV5JSUlL0448/qnPnzjLGuN50Fn6WU+Hyyy67TFPfmCl7Xo5u7N9X119/vT777DNFR0crNTVVderUUfXq1fXUs88r6XiC/nXzTTpw6HcdPXJEPfr0V1JivHLzjYyckj1X8vaTfHwLCis8Pc7mJUd+XsFyX/8/5xeGhpNPqzMV/8OKy0NpbgZinH+FMJt3QWArvC5MXpLNW06ZglBrsxXcpMNIkk0Oe55kz5Ns3srPyij4IOacTMnLR3l5eZLxkmQKLqNz5P/1mPl2OfLzlXg8qeCopPFWvj1X8gtSvjGKSzgu2bz+rMlLGXlZ2hK9XZL03eq1+vrrr+Xt7S2Hb4AOHNgvGZuG3HGnQkIbSnnZuqZzF2VmZSk4KEB3DL5dzZo10xtvvKG2bdtqzboNSk/PVPUawbqsdUvlZGdp+86d8vHylrdxqHpIbZ1ITpLsuWp6aWvl52TJ39dHx1PSVb16Nb008Xm99c6/lRh3VD27d9OW6B06GHNYzZs11b9nv6W6deu6/YxJ0iNPPK283FzXPr044TnVq1dPq1atUkREhLZv3662bdtq+/btuvHGG1WrVq0i26hbt65bMDTGuH5Oa9as6Rpz6s/zyetLKjL/TArXKXzNKVRceDw1dJ7pte7k7Zy6zpm2ceq+Ffc6fGroPd1r8dn259T1T+7HybUUt72zbfN0+19apT2ie7rvUSFP/VHgbPtd0jMgTvfHlFWrVqlbt26uP46UtKaTH7Nw+tQj6kBlYDOV5pNFSy8vL09BQUH673//q5tuusk1f9iwYUpJSdGXX35ZZJ3c3Fzl5ua6plNTU10Xr9eoUaM8yj6tlJQULV68WFlZWeratauqV6+uAwcO6JJLLpH3KW9wU1NTtXHjRnXs2FE1a9Z0Tbdq1Uq7d+92zT/TOifPX716tbKzs7Vp2y9KT0nRc8+MU0hIiFatWqUNm7fJ28dHI+++U3MXfCgZo/uHD9O2bduUk5Oj7OxsxcXF6c4775TT6dSzE19UatJxtWh2ia688kq1bdtWb8x8W9VrVNPVV7RTdna2Vn6/ThlpyWrR7BK1atVKxhjFxsYqJCREq39Yp8zMHHn5eCuicSPVDq6mnJwc7f/tsDIyM2Rk5GOMqlevppp16uvIkaOqGRykPLtDuZkZiohoorjjSTL5dgXVrCVjz1VevkO+Xl7y8bbpeEqGJJtCagQqN98hR16ejJeXsrNz5O/nozohNZWb71RmVrbeePUVPf3sczqelCynMX9mDS8F+PjI6ZTynPnysxl5+QUoMytbNpvk5ciXt5+fjCSnMXI4jHyMQ/Xq1lFqWpZyHHYZFWzLOAqCjJeXpPw8BdYIUVZ2VsElQK4gJMnXW7I7pfwc+QQEKt+e7wpJBW/O/3yTbndIcha8sc53FLy5z88tuMbKmD+PUJ10dOXPOuRl+ytAmJMWS0WvYSqH6cCAAM2a+aZGPTRG2Tk55f74FW/a66/vndv3xyY57H+e3nm69U8ab/P685o7n4KZNpvkcPy53CY58xUYWE2zZk7XqIceUXZ2ZsH2CsO5bAXr+/oVnFbq5V2wruuonbPgqJrtz5uK2GwFz8ucTHkFVJPT6Sy4sYozX/L+c5v5dsnvz+3JSF4+BTV52SQfbynPXrAd3z/3Mf/Pn4PAIOXnG8nplM3bS4G+XnLKX7nZqbL5+8tpd8rLx1sBXlKW/a8Po5b5s0eOXAUGVVeOwyGp4GfQJpv8vLxkdzpktztl87LJ29um/Hwjm9dfY/x9fOTv663s3IKPByjutSHXYZdskrfNJqcxBZf6eXnJ7nQWtF6SI9/Iy8umQD9f+fr7y2kKjhbOmjVLsbGxcnr7KsDHW9l5duVkpqt2rVpKy85VZlaWArykjh07auPP22XysuQVEKT8rEzVCbtIITWqKTH+mIwxatiwoeKPJ+v4iUR5y6hF8+Y6Gp+o48nJqh0crKAAPx1PSpNx5KlW/TDZjEM1ggKVbTf6/Y9Y+fkGqG7tYDWNaKKGDRtqzQ8blJAYJx8vL415aLQ2bNig3377TSfSMuXt66eaQYHyDQxQndq1dPUV7WSz2ZSSkqKffvpJyRlZ8vf2kt1pVKNadb0wcbwaN26s5ORkPTfxRe3etUuyeale3VqqFxqunMx0DRr4L7099z057Xn65w39NWDAAEly+52VfOKEatWpo4CAID356EOqVauWJOnXX3/VtGnTlJZtV2ZWpkKqV1fX6zspKChIAQEB6tChg9vvS4fDoQMHDig2NlZXX3212+/J3bt3a8JLU1S/fn11v+7v6tatm+t37+rVqyXJtb1WrVppy5YtkqQrr7xSs997X/k5ObJ5eck4ncrOy9XR3w/rokYRql69up589CF5eXkV+f188ra7du1a5Hf6yU79/Z6cnKyJL7+iX/cd1CV/a6Lu113rOoK8ceNGXXzxxa7fy9dFXqNu3bopPT1d//nPfxQREaG2bdtq8utvKD4+UWF1a+uFic8X/H5evVrHjh3Tsm+/U1pKkurWbyCnI0+9e/ZQWFiYLr74Yn344Ye6//77demll7rVdumll2r2e++73kP8/PPPWrtho9JTUvTs/z2t3NzcYt/vwLMKn/dW9j41NVU7duxQ//79K0TwTk9PV0REhFJSUs74c1clwtbRo0d10UUXaf369YqMjHTNf/LJJ/X9999r48aNRdaZMGGCJk6cWJ5lAgAAAKhEfv/9d1188cWnXV5lTiM8V+PGjdPYsWNd006nU0lJSapTp45sFeyOamlpaWrYsKF+//13BQcHW11OlUP/rUPvrUPvrUPvrUX/rUPvrUPvizLGKD09XeHh4WccVyXCVt26deXt7V3kPPf4+HiFhYUVu46/v7/8/f3d5lWEQ5ZnEhwczA+Ahei/dei9dei9dei9tei/dei9dei9uzOdPlioStwuzM/PT+3bt9fKlStd85xOp1auXOl2WiEAAAAAlJUqcWRLksaOHathw4apQ4cOuvrqqzV9+nRlZma67k4IAAAAAGWpyoSt2267TYmJiRo/frzi4uLUrl07LV++XKGhoVaXdt78/f31/PPPFzntEeWD/luH3luH3luH3luL/luH3luH3pdelbgbIQAAAACUtypxzRYAAAAAlDfCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYqsBeeukl/f3vf1dQUNBpP1A5NjZW/fv3V1BQkOrXr68nnnhC+fn5bmPWrFmjK6+8Uv7+/rrkkku0YMGCItuZNWuWmjRpooCAAHXs2FGbNm3ywB5Vbk2aNJHNZnP798orr7iN2b59uzp37qyAgAA1bNhQU6dOLbKdxYsX69JLL1VAQIDatGmjZcuWldcuXFB4zpa9CRMmFHmOX3rppa7lOTk5GjVqlOrUqaPq1atrwIABRT4sviSvSZDWrl2rG264QeHh4bLZbPriiy/clhtjNH78eDVo0ECBgYHq0aOH9u/f7zYmKSlJQ4YMUXBwsEJCQjR8+HBlZGS4jSnJa1JVdLb+33XXXUV+Fvr06eM2hv6fu8mTJ+uqq65SjRo1VL9+fd10003au3ev25iyep0pyXufqqYk/e/SpUuR5/7999/vNob+nyODCmv8+PFm2rRpZuzYsaZmzZpFlufn55vLLrvM9OjRw2zbts0sW7bM1K1b14wbN8415rfffjNBQUFm7NixZvfu3WbmzJnG29vbLF++3DXm448/Nn5+fmbevHlm165dZsSIESYkJMTEx8eXx25WGo0bNzaTJk0yx44dc/3LyMhwLU9NTTWhoaFmyJAhZufOneajjz4ygYGB5p133nGNWbdunfH29jZTp041u3fvNs8++6zx9fU1O3bssGKXKi2es57x/PPPm9atW7s9xxMTE13L77//ftOwYUOzcuVKs2XLFnPNNdeYv//9767lJXlNQoFly5aZZ555xixZssRIMp9//rnb8ldeecXUrFnTfPHFF+aXX34x//znP01ERITJzs52jenTp4+5/PLLzU8//WR++OEHc8kll5jbb7/dtbwkr0lV1dn6P2zYMNOnTx+3n4WkpCS3MfT/3PXu3dvMnz/f7Ny500RHR5t+/fqZRo0auf0uLYvXmZK896mKStL/66+/3owYMcLtuZ+amupaTv/PHWGrEpg/f36xYWvZsmXGy8vLxMXFuebNnj3bBAcHm9zcXGOMMU8++aRp3bq123q33Xab6d27t2v66quvNqNGjXJNOxwOEx4ebiZPnlzGe1K5NW7c2LzxxhunXf7222+bWrVquXpvjDFPPfWUadGihWt64MCBpn///m7rdezY0dx3331lXu+FjOesZzz//PPm8ssvL3ZZSkqK8fX1NYsXL3bN27Nnj5FkNmzYYIwp2WsSijr1zb7T6TRhYWHm1Vdfdc1LSUkx/v7+5qOPPjLGGLN7924jyWzevNk15ptvvjE2m80cOXLEGFOy1yQU7b8xBWHrxhtvPO069L9sJCQkGEnm+++/N8aU3etMSd77oGj/jSkIW2PGjDntOvT/3HEaYSW2YcMGtWnTxu2DmXv37q20tDTt2rXLNaZHjx5u6/Xu3VsbNmyQJOXl5Wnr1q1uY7y8vNSjRw/XGPzllVdeUZ06dXTFFVfo1VdfdTtsvmHDBl133XXy8/Nzzevdu7f27t2r5ORk15gzfT9wdjxnPWv//v0KDw/X3/72Nw0ZMkSxsbGSpK1bt8put7v1/dJLL1WjRo1cfS/JaxLOLiYmRnFxcW69rlmzpjp27OjW65CQEHXo0ME1pkePHvLy8tLGjRtdY872moTTW7NmjerXr68WLVrogQce0IkTJ1zL6H/ZSE1NlSTVrl1bUtm9zvC7tmRO7X+hhQsXqm7durrssss0btw4ZWVluZbR/3PnY3UBKL24uDi3J7sk13RcXNwZx6SlpSk7O1vJyclyOBzFjvn11189WH3l8/DDD+vKK69U7dq1tX79eo0bN07Hjh3TtGnTJBX0OiIiwm2dk78ftWrVOu33o/D7hbM7fvw4z1kP6dixoxYsWKAWLVro2LFjmjhxojp37qydO3cqLi5Ofn5+Ra4fPfn5W5LXJJxdYa/O9FoRFxen+vXruy338fFR7dq13cac7TUJxevTp49uueUWRURE6ODBg/q///s/9e3bVxs2bJC3tzf9LwNOp1OPPPKIrr32Wl122WWSVGavM2d77xMYGOiJXapUiuu/JA0ePFiNGzdWeHi4tm/frqeeekp79+7VkiVLJNH/0iBslbOnn35aU6ZMOeOYPXv2uF2UDs85l+/H2LFjXfPatm0rPz8/3XfffZo8ebL8/f09XSrgcX379nX9v23bturYsaMaN26sTz/9tMr9ckTVNmjQINf/27Rpo7Zt26pp06Zas2aNunfvbmFlF45Ro0Zp586d+vHHH60upUo6Xf9Hjhzp+n+bNm3UoEEDde/eXQcPHlTTpk3Lu8wLAmGrnD322GO66667zjjmb3/7W4m2FRYWVuQObIV37AkLC3N9PfUuPvHx8QoODlZgYKC8vb3l7e1d7JjCbVzIzuf70bFjR+Xn5+vQoUNq0aLFaXstnf37URV6XVbq1q1bpZ+z5SkkJETNmzfXgQMH1LNnT+Xl5SklJcXtr84n970kr0k4u8JexcfHq0GDBq758fHxateunWtMQkKC23r5+flKSko66+vNyY+Bkvnb3/6munXr6sCBA+revTv9P0+jR4/W0qVLtXbtWl188cWu+WFhYWXyOnO29z5V3en6X5yOHTtKkg4cOKCmTZvS/1Lgmq1yVq9ePV166aVn/Hfy+d1nEhkZqR07dri94EdFRSk4OFitWrVyjVm5cqXbelFRUYqMjJQk+fn5qX379m5jnE6nVq5c6RpzITuf70d0dLS8vLxcp5JERkZq7dq1stvtrjFRUVFq0aKF63SRs30/cHZV/TlbnjIyMnTw4EE1aNBA7du3l6+vr1vf9+7dq9jYWFffS/KahLOLiIhQWFiYW6/T0tK0ceNGt16npKRo69atrjGrVq2S0+l0vTkqyWsSSuaPP/7QiRMnXOGX/peOMUajR4/W559/rlWrVhU5zbKsXmf4XVu8s/W/ONHR0ZLk9tyn/+fI6jt04PQOHz5stm3bZiZOnGiqV69utm3bZrZt22bS09ONMX/dfrNXr14mOjraLF++3NSrV6/Y228+8cQTZs+ePWbWrFnF3vrd39/fLFiwwOzevduMHDnShISEuN1ppqpbv369eeONN0x0dLQ5ePCg+fDDD029evXM0KFDXWNSUlJMaGioufPOO83OnTvNxx9/bIKCgorc+t3Hx8e89tprZs+ePeb555/n1u+lwHPWMx577DGzZs0aExMTY9atW2d69Ohh6tataxISEowxBbdkbtSokVm1apXZsmWLiYyMNJGRka71S/KahALp6emu13RJZtq0aWbbtm3m8OHDxpiCW7+HhISYL7/80mzfvt3ceOONxd76/YorrjAbN240P/74o2nWrJnbrcdL8ppUVZ2p/+np6ebxxx83GzZsMDExMea7774zV155pWnWrJnJyclxbYP+n7sHHnjA1KxZ06xZs8bt1uJZWVmuMWXxOlOS9z5V0dn6f+DAATNp0iSzZcsWExMTY7788kvzt7/9zVx33XWubdD/c0fYqsCGDRtmJBX5t3r1ateYQ4cOmb59+5rAwEBTt25d89hjjxm73e62ndWrV5t27doZPz8/87e//c3Mnz+/yGPNnDnTNGrUyPj5+Zmrr77a/PTTTx7eu8pl69atpmPHjqZmzZomICDAtGzZ0rz88stuv3iNMeaXX34xnTp1Mv7+/uaiiy4yr7zySpFtffrpp6Z58+bGz8/PtG7d2vzvf/8rr924oPCcLXu33XabadCggfHz8zMXXXSRue2228yBAwdcy7Ozs82DDz5oatWqZYKCgszNN99sjh075raNkrwmoeB1ubjX92HDhhljCm7//txzz5nQ0FDj7+9vunfvbvbu3eu2jRMnTpjbb7/dVK9e3QQHB5u7777b9ce4QiV5TaqKztT/rKws06tXL1OvXj3j6+trGjdubEaMGFHkjzn0/9wV13NJbu9Lyup1piTvfaqas/U/NjbWXHfddaZ27drG39/fXHLJJeaJJ55w+5wtY+j/ubIZY0y5HEIDAAAAgCqEa7YAAAAAwAMIWwAAAADgAYQtAAAAAPAAwhYAAAAAeABhCwAAAAA8gLAFAAAAAB5A2AIAAAAADyBsAQAAAIAHELYAABeku+66SzfddJPHtt+lSxc98sgjrumsrCwNGDBAwcHBstlsSklJKXYeAKDqIGwBAErN04GmJA4dOiSbzabo6Ojz3taCBQtks9lks9nk7e2tWrVqqWPHjpo0aZJSU1Pdxi5ZskQvvPCCa/r999/XDz/8oPXr1+vYsWOqWbNmsfMAAFWHj9UFAABQkQQHB2vv3r0yxiglJUXr16/X5MmTNX/+fK1bt07h4eGSpNq1a7utd/DgQbVs2VKXXXbZGeedK4fDIZvNJi8v/j4KAJUNr9wAAI/ZuXOn+vbtq+rVqys0NFR33nmnjh8/7lrepUsXPfzww3ryySdVu3ZthYWFacKECW7b+PXXX9WpUycFBASoVatW+u6772Sz2fTFF19IkiIiIiRJV1xxhWw2m7p06eK2/muvvaYGDRqoTp06GjVqlOx2+xlrttlsCgsLU4MGDdSyZUsNHz5c69evV0ZGhp588km32gtPI+zSpYtef/11rV271lVDcfMkKTc3V48//rguuugiVatWTR07dtSaNWtc212wYIFCQkL01VdfqVWrVvL391dsbGyJ1/v222/VsmVLVa9eXX369NGxY8fc9m/evHlq3bq1/P391aBBA40ePdq1LCUlRffee6/q1aun4OBgdevWTb/88ssZ+wUAOD3CFgDAI1JSUtStWzddccUV2rJli5YvX674+HgNHDjQbdz777+vatWqaePGjZo6daomTZqkqKgoSQVHdW666SYFBQVp48aNmjt3rp555hm39Tdt2iRJ+u6773Ts2DEtWbLEtWz16tU6ePCgVq9erffff18LFizQggULznlf6tevryFDhuirr76Sw+EosnzJkiUaMWKEIiMjXTUUN0+SRo8erQ0bNujjjz/W9u3bdeutt6pPnz7av3+/a3tZWVmaMmWK/v3vf2vXrl2qX79+idd77bXX9J///Edr165VbGysHn/8cdfy2bNna9SoURo5cqR27Nihr776Spdccolr+a233qqEhAR988032rp1q6688kp1795dSUlJ59wzAIAkAwBAKQ0bNszceOONxS574YUXTK9evdzm/f7770aS2bt3rzHGmOuvv9506tTJbcxVV11lnnrqKWOMMd98843x8fExx44dcy2Piooyksznn39ujDEmJibGSDLbtm0rUlvjxo1Nfn6+a96tt95qbrvtttPuz/z5803NmjWLXTZ79mwjycTHx7tqHzNmjGv5mDFjzPXXX++2zqnzDh8+bLy9vc2RI0fcxnXv3t2MGzfOVYMkEx0dXar1Dhw44Fo+a9YsExoa6poODw83zzzzTLH798MPP5jg4GCTk5PjNr9p06bmnXfeKXYdAMCZcc0WAMAjfvnlF61evVrVq1cvsuzgwYNq3ry5JKlt27Zuyxo0aKCEhARJ0t69e9WwYUOFhYW5ll999dUlrqF169by9vZ22/aOHTvOaT8KGWMkFZxmWFo7duyQw+Fw7Xuh3Nxc1alTxzXt5+fn1peSrhcUFKSmTZu6pk/uZUJCgo4eParu3bsXW9svv/yijIwMt+1JUnZ2tg4ePHiOewoAkLhBBgDAQzIyMnTDDTdoypQpRZY1aNDA9X9fX1+3ZTabTU6ns0xqKMtt79mzR8HBwUXCyLnIyMiQt7e3tm7d6hYCJbmF0sDAQLdQV9L1itvfwpAYGBh41toaNGjgdh1YoZCQkDOuCwAoHmELAOARV155pT777DM1adJEPj6l+3XTokUL/f7774qPj1doaKgkafPmzW5j/Pz8JKnYa6nKSkJCghYtWqSbbrrpvO4KeMUVV8jhcCghIUGdO3f2+Honq1Gjhpo0aaKVK1eqa9euRZZfeeWViouLk4+Pj5o0aVKqxwAAuOMGGQCA85Kamqro6Gi3f7///rtGjRqlpKQk3X777dq8ebMOHjyob7/9VnfffXeJg1HPnj3VtGlTDRs2TNu3b9e6dev07LPPSvrrdL769esrMDDQdQOOUz8P61wZYxQXF6djx45pz549mjdvnv7+97+rZs2aeuWVV85r282bN9eQIUM0dOhQLVmyRDExMdq0aZMmT56s//3vf2W+3qkmTJig119/XTNmzND+/fv1888/a+bMmZKkHj16KDIyUjfddJNWrFihQ4cOaf369XrmmWe0ZcuW89pvAKiqCFsAgPOyZs0aXXHFFW7/Jk6cqPDwcK1bt04Oh0O9evVSmzZt9MgjjygkJKTER4e8vb31xRdfKCMjQ1dddZXuvfde190IAwICJEk+Pj6aMWOG3nnnHYWHh+vGG288r/1JS0tTgwYNdNFFFykyMlLvvPOOhg0bpm3btrmd/lha8+fP19ChQ/XYY4+pRYsWuummm7R582Y1atTII+udbNiwYZo+fbrefvtttW7dWv/4xz9cdzO02WxatmyZrrvuOt19991q3ry5Bg0apMOHD7uOKgIAzo3NFJ7MDQBAJbBu3Tp16tRJBw4ccLsZBAAAFQ1hCwBQoX3++eeqXr26mjVrpgMHDmjMmDGqVauWfvzxR6tLAwDgjLhBBgCgQktPT9dTTz2l2NhY1a1bVz169NDrr79udVkAAJwVR7YAAAAAwAO4QQYAAAAAeABhCwAAAAA8gLAFAAAAAB5A2AIAAAAADyBsAQAAAIAHELYAAAAAwAMIWwAAAADgAYQtAAAAAPCA/wcGfTQrpht9iAAAAABJRU5ErkJggg==",
      "text/plain": [
       "<Figure size 1000x600 with 1 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "import matplotlib.pyplot as plt  \n",
    "from collections import Counter  \n",
    "import numpy as np  \n",
    "from transformers import AutoTokenizer   \n",
    "  \n",
    "# 加载tokenizer  \n",
    "tokenizer_path = \"/mnt/lingjiejiang/textual_aesthetics/model_checkpoint/sft_merge_checkpoints/Meta-Llama-3.1-8B-Instruct\"  \n",
    "tokenizer = AutoTokenizer.from_pretrained(tokenizer_path)  \n",
    "  \n",
    "# 假设revised_data是你的数据列表  \n",
    "# revised_data = [{'response': '...', 'revised_text': '...'}, ...]  \n",
    "# revised_data = [...]  # 这里填入你的实际数据  \n",
    "  \n",
    "# 计算长度差异  \n",
    "length_differences = []  \n",
    "out_of_range_texts = []  \n",
    "  \n",
    "for index, item in enumerate(revised_data):  \n",
    "    # 对response和revised_text进行分词  \n",
    "    response_tokens = tokenizer.encode(item['response'])  \n",
    "    revised_text_tokens = tokenizer.encode(item['revised_text'])  \n",
    "  \n",
    "    response_length = len(response_tokens)  \n",
    "    revised_text_length = len(revised_text_tokens)  \n",
    "  \n",
    "    difference = revised_text_length - response_length  \n",
    "    length_differences.append(difference)  \n",
    "  \n",
    "    # 检查是否超出范围  \n",
    "    if difference < -2048 or difference > 2048:  \n",
    "        out_of_range_texts.append({  \n",
    "            'response': item['response'],  \n",
    "            'revised_text': item['revised_text'],  \n",
    "            'difference': difference,  \n",
    "            'index': index  \n",
    "        })  \n",
    "  \n",
    "# 统计分布  \n",
    "difference_distribution = Counter(length_differences)  \n",
    "  \n",
    "# 打印分布结果  \n",
    "print(difference_distribution)  \n",
    "  \n",
    "# 详细统计信息  \n",
    "differences_array = np.array(length_differences)  \n",
    "mean = np.mean(differences_array)  \n",
    "median = np.median(differences_array)  \n",
    "std_dev = np.std(differences_array)  \n",
    "  \n",
    "print(f\"Mean: {mean}, Median: {median}, Standard Deviation: {std_dev}\")  \n",
    "  \n",
    "# 长度差异的最大最小值  \n",
    "max_difference = max(length_differences)  \n",
    "min_difference = min(length_differences)  \n",
    "  \n",
    "print(f\"Max length difference: {max_difference}, Min length difference: {min_difference}\")  \n",
    "  \n",
    "# 绘制直方图  \n",
    "plt.figure(figsize=(10, 6))  \n",
    "plt.hist(length_differences, bins=range(min(length_differences), max(length_differences) + 2), edgecolor='black', alpha=0.7)  \n",
    "plt.title('Length Difference Distribution')  \n",
    "plt.xlabel('Length Difference')  \n",
    "plt.ylabel('Frequency')  \n",
    "plt.grid(True)  \n",
    "plt.show()  \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 79,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "61135"
      ]
     },
     "execution_count": 79,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "len(revised_data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "def get_length_diff():\n",
    "    revised_data = read_jsonl('revised_data/output_sorted.jsonl')\n",
    "    # 加载tokenizer  \n",
    "    tokenizer_path = \"/mnt/lingjiejiang/textual_aesthetics/model_checkpoint/sft_merge_checkpoints/Meta-Llama-3.1-8B-Instruct\"  \n",
    "    tokenizer = AutoTokenizer.from_pretrained(tokenizer_path, use_fast=True)  \n",
    "    \n",
    "    # 假设revised_data是你的数据列表  \n",
    "    # revised_data = [...]  # 这里填入你的实际数据  \n",
    "    \n",
    "    responses = [item['response'] for item in revised_data]  \n",
    "    revised_texts = [item['revised_text'] for item in revised_data]  \n",
    "    \n",
    "    # 批量分词  \n",
    "    response_tokens_batch = tokenizer(responses, return_tensors=\"np\")  \n",
    "    revised_text_tokens_batch = tokenizer(revised_texts, return_tensors=\"np\")  \n",
    "    \n",
    "    response_lengths = [len(tokens) for tokens in response_tokens_batch[\"input_ids\"]]  \n",
    "    revised_text_lengths = [len(tokens) for tokens in revised_text_tokens_batch[\"input_ids\"]]  \n",
    "    return response_lengths, revised_text_lengths\n",
    "response_lengths, revised_text_lengths = get_length_diff()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 96,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Mean: 49.15065020037622, Median: 13.0, Standard Deviation: 169.45465111600666\n",
      "95% Confidence Interval: [-88.0, 342.0]\n",
      "Max length difference: 2673, Min length difference: -1024\n",
      "out_of_range_texts length 6008\n"
     ]
    }
   ],
   "source": [
    "from transformers import AutoTokenizer  \n",
    "from utils import read_jsonl\n",
    "revised_data = read_jsonl('revised_data/output_sorted.jsonl')\n",
    "# 加载tokenizer  \n",
    "tokenizer_path = \"/mnt/lingjiejiang/textual_aesthetics/model_checkpoint/sft_merge_checkpoints/Meta-Llama-3.1-8B-Instruct\"  \n",
    "tokenizer = AutoTokenizer.from_pretrained(tokenizer_path, use_fast=True)  \n",
    "  \n",
    "# 假设revised_data是你的数据列表  \n",
    "# revised_data = [...]  # 这里填入你的实际数据  \n",
    "  \n",
    "responses = [item['response'] for item in revised_data]  \n",
    "revised_texts = [item['revised_text'] for item in revised_data]  \n",
    "  \n",
    "# 批量分词  \n",
    "response_tokens_batch = tokenizer(responses, return_tensors=\"np\")  \n",
    "revised_text_tokens_batch = tokenizer(revised_texts, return_tensors=\"np\")  \n",
    "  \n",
    "response_lengths = [len(tokens) for tokens in response_tokens_batch[\"input_ids\"]]  \n",
    "revised_text_lengths = [len(tokens) for tokens in revised_text_tokens_batch[\"input_ids\"]]  \n",
    "  \n",
    "# 计算长度差异  \n",
    "length_differences = []  \n",
    "out_of_range_texts = []\n",
    "\n",
    "filtered_revised_data = []\n",
    "filtered_revised_data_indices = []  \n",
    "\n",
    "for index, (response_length, revised_text_length) in enumerate(zip(response_lengths, revised_text_lengths)):  \n",
    "    difference = revised_text_length - response_length  \n",
    "    length_differences.append(difference)  \n",
    "  \n",
    "    # 检查是否超出范围  \n",
    "    if difference < -88 or difference > 350:  \n",
    "        out_of_range_texts.append({  \n",
    "            'response': revised_data[index]['response'],  \n",
    "            'revised_text': revised_data[index]['revised_text'],  \n",
    "            'difference': difference,  \n",
    "            'index': index  \n",
    "        })  \n",
    "    # 检查是否在-88及350之间  \n",
    "    if -88 <= difference <= 350:  \n",
    "        filtered_revised_data.append(revised_data[index])\n",
    "        filtered_revised_data_indices.append(revised_data[index]['index']) \n",
    "\n",
    "# 统计分布  \n",
    "difference_distribution = Counter(length_differences)  \n",
    "  \n",
    "\n",
    "  \n",
    "# 详细统计信息  \n",
    "differences_array = np.array(length_differences)  \n",
    "mean = np.mean(differences_array)  \n",
    "median = np.median(differences_array)  \n",
    "std_dev = np.std(differences_array)  \n",
    "# 统计分布和绘图代码保持不变  \n",
    "print(f\"Mean: {mean}, Median: {median}, Standard Deviation: {std_dev}\")  \n",
    "\n",
    "# 计算95%置信区间  \n",
    "lower_bound = np.percentile(differences_array, 5)  \n",
    "upper_bound = np.percentile(differences_array, 95)  \n",
    "  \n",
    "print(f\"95% Confidence Interval: [{lower_bound}, {upper_bound}]\")  \n",
    "# 长度差异的最大最小值  \n",
    "max_difference = max(length_differences)  \n",
    "min_difference = min(length_differences)  \n",
    "\n",
    "print(f\"Max length difference: {max_difference}, Min length difference: {min_difference}\")  \n",
    "print(f\"out_of_range_texts length {len(out_of_range_texts)}\")\n",
    "# # 绘制直方图  \n",
    "# plt.figure(figsize=(10, 6))  \n",
    "# plt.hist(length_differences, bins=range(min(length_differences), max(length_differences) + 2), edgecolor='black', alpha=0.7)  \n",
    "# plt.title('Length Difference Distribution')  \n",
    "# plt.xlabel('Length Difference')  \n",
    "# plt.ylabel('Frequency')  \n",
    "# plt.grid(True)  \n",
    "# plt.show()  \n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/v-lingjiang/miniconda3/envs/llama/lib/python3.10/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n",
      "  from .autonotebook import tqdm as notebook_tqdm\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Mean: 49.15065020037622, Median: 13.0, Standard Deviation: 169.45465111600666\n",
      "95% Confidence Interval: [-88.0, 342.0]\n",
      "Max length difference: 2673, Min length difference: -1024\n",
      "out_of_range_texts length 6008\n",
      "filtered_revised_data length 55127\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "6008"
      ]
     },
     "execution_count": 1,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import matplotlib.pyplot as plt  \n",
    "from collections import Counter  \n",
    "import numpy as np  \n",
    "from transformers import AutoTokenizer \n",
    "from utils import read_jsonl \n",
    "def get_length_diff():\n",
    "    revised_data = read_jsonl('revised_data/output_sorted.jsonl')\n",
    "    # 加载tokenizer  \n",
    "    tokenizer_path = \"/mnt/lingjiejiang/textual_aesthetics/model_checkpoint/sft_merge_checkpoints/Meta-Llama-3.1-8B-Instruct\"  \n",
    "    tokenizer = AutoTokenizer.from_pretrained(tokenizer_path, use_fast=True)  \n",
    "    \n",
    "    # 假设revised_data是你的数据列表  \n",
    "    # revised_data = [...]  # 这里填入你的实际数据  \n",
    "    \n",
    "    responses = [item['response'] for item in revised_data]  \n",
    "    revised_texts = [item['revised_text'] for item in revised_data]  \n",
    "    \n",
    "    # 批量分词  \n",
    "    response_tokens_batch = tokenizer(responses, return_tensors=\"np\")  \n",
    "    revised_text_tokens_batch = tokenizer(revised_texts, return_tensors=\"np\")  \n",
    "    \n",
    "    response_lengths = [len(tokens) for tokens in response_tokens_batch[\"input_ids\"]]  \n",
    "    revised_text_lengths = [len(tokens) for tokens in revised_text_tokens_batch[\"input_ids\"]]  \n",
    "    return response_lengths, revised_text_lengths\n",
    "\n",
    "def get_filter_data(response_lengths, revised_text_lengths, lower=-88, upper=350):\n",
    "    revised_data = read_jsonl('revised_data/output_sorted.jsonl')\n",
    "    # 计算长度差异  \n",
    "    length_differences = []  \n",
    "    out_of_range_texts = []\n",
    "    out_of_range_texts_indices = []\n",
    "    filtered_revised_data = []\n",
    "    filtered_revised_data_indices = []  \n",
    "\n",
    "    for index, (response_length, revised_text_length) in enumerate(zip(response_lengths, revised_text_lengths)):  \n",
    "        difference = revised_text_length - response_length  \n",
    "        length_differences.append(difference)  \n",
    "    \n",
    "        # 检查是否超出范围  \n",
    "        if difference < lower or difference > upper:  \n",
    "            out_of_range_texts.append({  \n",
    "                'response': revised_data[index]['response'],  \n",
    "                'revised_text': revised_data[index]['revised_text'],  \n",
    "                'difference': difference,  \n",
    "                'index': index  \n",
    "            })  \n",
    "            out_of_range_texts_indices.append(revised_data[index]['index'])\n",
    "        # 检查是否在-88及350之间  \n",
    "        if lower <= difference and difference <= upper:  \n",
    "            filtered_revised_data.append(revised_data[index])\n",
    "            filtered_revised_data_indices.append(revised_data[index]['index']) \n",
    "\n",
    "    # 统计分布  \n",
    "    # difference_distribution = Counter(length_differences)  \n",
    "        \n",
    "    # 详细统计信息  \n",
    "    differences_array = np.array(length_differences)  \n",
    "    mean = np.mean(differences_array)  \n",
    "    median = np.median(differences_array)  \n",
    "    std_dev = np.std(differences_array)  \n",
    "    # 统计分布和绘图代码保持不变  \n",
    "    print(f\"Mean: {mean}, Median: {median}, Standard Deviation: {std_dev}\")  \n",
    "\n",
    "    # 计算95%置信区间  \n",
    "    lower_bound = np.percentile(differences_array, 5)  \n",
    "    upper_bound = np.percentile(differences_array, 95)  \n",
    "    \n",
    "    print(f\"95% Confidence Interval: [{lower_bound}, {upper_bound}]\")  \n",
    "    # 长度差异的最大最小值  \n",
    "    max_difference = max(length_differences)  \n",
    "    min_difference = min(length_differences)  \n",
    "\n",
    "    print(f\"Max length difference: {max_difference}, Min length difference: {min_difference}\")  \n",
    "    print(f\"out_of_range_texts length {len(out_of_range_texts)}\")\n",
    "    print(f\"filtered_revised_data length {len(filtered_revised_data)}\")\n",
    "    return out_of_range_texts_indices\n",
    "lower = -88\n",
    "upper = 350\n",
    "# out_of_range_texts_indices = get_filter_data(lower, upper)\n",
    "response_lengths, revised_text_lengths = get_length_diff()\n",
    "out_of_range_texts_indices = get_filter_data(response_lengths, revised_text_lengths, lower, upper)\n",
    "len(out_of_range_texts_indices)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "null_response_indices:136\n",
      "null_revised_indices:5525\n",
      "noneed_revised_indices:5524\n",
      "same_revised_text_indices:335\n",
      "indices_to_discard: 5858\n",
      "indices_to_discard add length: 10745\n",
      "length of revised data: 50390\n",
      "textual_aesthetics_chosen:50390  textual_aesthetics_rejected:50390, textual_aesthetics_triple:50390, textual_aesthetics_uf:50390\n"
     ]
    }
   ],
   "source": [
    "from datasets import load_dataset, Dataset\n",
    "import pandas as pd\n",
    "import json\n",
    "data = read_jsonl(\"revised_data/output_sorted.jsonl\")\n",
    "not_revised = [item['index'] for item in data if item['revised_text'] == '']\n",
    "ds = load_dataset(\"HuggingFaceH4/ultrafeedback_binarized\", split=\"train_prefs\")\n",
    "def get_instruct_response(item):\n",
    "    # item[\"instruction\"] = item['chosen'][0][\"content\"]\n",
    "    item[\"response\"] = item['chosen'][1][\"content\"]\n",
    "    return item\n",
    "ds = ds.map(get_instruct_response, batch_size=1024, num_proc=8)\n",
    "export_data = ds.select_columns([\"prompt\", \"response\"])\n",
    "# export_data\n",
    "# data = filtered_revised_data\n",
    "not_revised = [item['index'] for item in data if item['revised_text'] == '']\n",
    "# datalen\n",
    "# data\n",
    "indices = set([item['index'] for item in data])\n",
    "# original_indices = set(range(export_data.shape[0]))\n",
    "# print(f\"index complete: {original_indices - indices}\")\n",
    "null_response_indices = [item['index'] for item in data if item['gpt_answer'].strip() == '']\n",
    "null_revised_indices = [item['index'] for item in data if item['revised_text'].strip() == '']\n",
    "noneed_revised_indices = [item['index'] for item in data if item['does_it_need_modification'].strip() == 'N']\n",
    "same_revised_text_indices = [item['index'] for item in data if item['response'].strip() == item['revised_text'].strip()]\n",
    "\n",
    "# print(len(null_response))\n",
    "# print(len(not_revised))\n",
    "print(f\"null_response_indices:{len(null_response_indices)}\")\n",
    "print(f\"null_revised_indices:{len(null_revised_indices)}\")\n",
    "print(f\"noneed_revised_indices:{len(noneed_revised_indices)}\")\n",
    "print(f\"same_revised_text_indices:{len(same_revised_text_indices)}\")\n",
    "# 使用集合的交集操作  \n",
    "indices_to_discard  = set(null_response_indices) | set(null_revised_indices) | set(noneed_revised_indices) | set(same_revised_text_indices)   \n",
    "print(f\"indices_to_discard: {len(indices_to_discard)}\")\n",
    "# filter length \n",
    "indices_to_discard = indices_to_discard | set(out_of_range_texts_indices)\n",
    "indices_to_discard = list(indices_to_discard)\n",
    "print(f\"indices_to_discard add length: {len(indices_to_discard)}\")\n",
    "temp_data = data\n",
    "# temp_ds = ds.select(range(10))\n",
    "for i, item in enumerate(ds):\n",
    "    # print(item['rejected'])\n",
    "    # index=item['index']\n",
    "    temp_data[i]['rejected'] = item['rejected'][1]['content']\n",
    "    temp_data[i]['instruct'] = item['prompt']\n",
    "    temp_data[i]['chosen'] = item['chosen']\n",
    "revised_data = [item for item in temp_data if item[\"index\"] not in indices_to_discard]\n",
    "print(f\"length of revised data: {len(revised_data)}\")\n",
    "textual_aesthetics_chosen = [{\"prompt\": item[\"prompt\"], \"chosen\": item[\"revised_text\"], \"rejected\": item[\"response\"]} for item in revised_data]\n",
    "# with open(f\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_chosen_v2_{lower}_{upper}.json\", 'w') as f:\n",
    "#     json.dump(textual_aesthetics_chosen, f, indent=4)\n",
    "textual_aesthetics_uf = [{\"prompt\": item[\"prompt\"], \"chosen\": item[\"response\"], \"rejected\": item[\"rejected\"]} for item in revised_data]\n",
    "# textual_aesthetics_chosen = [{\"prompt\": item[\"prompt\"], \"chosen\": item[\"response\"], \"rejected\": item[\"rejected\"]} for item in revised_data]\n",
    "textual_aesthetics_rejected = [{\"prompt\": item[\"prompt\"], \"chosen\": item[\"revised_text\"], \"rejected\": item[\"rejected\"]} for item in revised_data]\n",
    "textual_aesthetics_triple = [{\"prompt\": item[\"prompt\"], \"chosen\": item[\"revised_text\"], \"rejected\": item[\"rejected\"], \"middle\": item[\"response\"]} for item in revised_data]\n",
    "# textual_aesthetics_rejected.extend([{\"prompt\": item[\"prompt\"], \"chosen\": item[\"response\"], \"rejected\": item[\"rejected\"]} for item in temp_data if item[\"index\"] in noneed_revised_indices])  \n",
    "# with open(f\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_triple_v2_{lower}_{upper}_noneed.json\", 'w') as f:\n",
    "#     json.dump(textual_aesthetics_triple, f, indent=4)\n",
    "# noneed_with_length_filter = list(set(noneed_revised_indices) | set(out_of_range_texts_indices))\n",
    "# print(f\"noneed_with length filter: {len(noneed_with_length_filter)}\")\n",
    "# textual_aesthetics_rejected.extend([{\"prompt\": item[\"prompt\"], \"chosen\": item[\"response\"], \"rejected\": item[\"rejected\"]} for item in temp_data if item[\"index\"] in noneed_with_length_filter])  \n",
    "with open(f\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_uf_tribledpo_{lower}_{upper}.json\", 'w') as f:\n",
    "    json.dump(textual_aesthetics_uf, f, indent=4)\n",
    "with open(f\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_rejected_tribledpo_{lower}_{upper}.json\", 'w') as f:\n",
    "    json.dump(textual_aesthetics_rejected, f, indent=4)\n",
    "with open(f\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_chosen_tribledpo_{lower}_{upper}.json\", 'w') as f:\n",
    "    json.dump(textual_aesthetics_chosen, f, indent=4)\n",
    "print(f\"textual_aesthetics_chosen:{len(textual_aesthetics_chosen)}  textual_aesthetics_rejected:{len(textual_aesthetics_rejected)}, textual_aesthetics_triple:{len(textual_aesthetics_triple)}, textual_aesthetics_uf:{len(textual_aesthetics_uf)}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Downloading readme: 100%|██████████| 6.76k/6.76k [00:00<00:00, 77.4kB/s]\n",
      "Downloading data: 100%|██████████| 226M/226M [00:01<00:00, 113MB/s]  \n",
      "Downloading data: 100%|██████████| 226M/226M [00:01<00:00, 117MB/s]  \n",
      "Downloading data: 100%|██████████| 7.29M/7.29M [00:00<00:00, 23.9MB/s]\n",
      "Downloading data: 100%|██████████| 3.72M/3.72M [00:00<00:00, 7.90MB/s]\n",
      "Downloading data: 100%|██████████| 184M/184M [00:01<00:00, 120MB/s]  \n",
      "Downloading data: 100%|██████████| 3.02M/3.02M [00:00<00:00, 8.57MB/s]\n",
      "Generating train_prefs split: 100%|██████████| 61135/61135 [00:00<00:00, 79459.85 examples/s]\n",
      "Generating train_sft split: 100%|██████████| 61135/61135 [00:00<00:00, 80858.75 examples/s]\n",
      "Generating test_prefs split: 100%|██████████| 2000/2000 [00:00<00:00, 74443.65 examples/s]\n",
      "Generating test_sft split: 100%|██████████| 1000/1000 [00:00<00:00, 69052.27 examples/s]\n",
      "Generating train_gen split: 100%|██████████| 61135/61135 [00:00<00:00, 92633.23 examples/s]\n",
      "Generating test_gen split: 100%|██████████| 1000/1000 [00:00<00:00, 75126.35 examples/s]\n",
      "Map (num_proc=8): 100%|██████████| 61135/61135 [00:01<00:00, 38198.08 examples/s]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "null_response_indices:136\n",
      "null_revised_indices:5525\n",
      "noneed_revised_indices:5524\n",
      "same_revised_text_indices:335\n",
      "indices_to_discard: 5858\n",
      "indices_to_discard add length: 10745\n",
      "length of revised data: 1000\n",
      "textual_aesthetics_chosen:1000  textual_aesthetics_rejected:1000, textual_aesthetics_triple:1000\n"
     ]
    }
   ],
   "source": [
    "from datasets import load_dataset, Dataset\n",
    "import pandas as pd\n",
    "import json\n",
    "data = read_jsonl(\"revised_data/output_sorted.jsonl\")\n",
    "not_revised = [item['index'] for item in data if item['revised_text'] == '']\n",
    "ds = load_dataset(\"HuggingFaceH4/ultrafeedback_binarized\", split=\"train_prefs\")\n",
    "def get_instruct_response(item):\n",
    "    # item[\"instruction\"] = item['chosen'][0][\"content\"]\n",
    "    item[\"response\"] = item['chosen'][1][\"content\"]\n",
    "    return item\n",
    "ds = ds.map(get_instruct_response, batch_size=1024, num_proc=8)\n",
    "export_data = ds.select_columns([\"prompt\", \"response\"])\n",
    "# export_data\n",
    "# data = filtered_revised_data\n",
    "not_revised = [item['index'] for item in data if item['revised_text'] == '']\n",
    "# datalen\n",
    "# data\n",
    "indices = set([item['index'] for item in data])\n",
    "# original_indices = set(range(export_data.shape[0]))\n",
    "# print(f\"index complete: {original_indices - indices}\")\n",
    "null_response_indices = [item['index'] for item in data if item['gpt_answer'].strip() == '']\n",
    "null_revised_indices = [item['index'] for item in data if item['revised_text'].strip() == '']\n",
    "noneed_revised_indices = [item['index'] for item in data if item['does_it_need_modification'].strip() == 'N']\n",
    "same_revised_text_indices = [item['index'] for item in data if item['response'].strip() == item['revised_text'].strip()]\n",
    "\n",
    "# print(len(null_response))\n",
    "# print(len(not_revised))\n",
    "print(f\"null_response_indices:{len(null_response_indices)}\")\n",
    "print(f\"null_revised_indices:{len(null_revised_indices)}\")\n",
    "print(f\"noneed_revised_indices:{len(noneed_revised_indices)}\")\n",
    "print(f\"same_revised_text_indices:{len(same_revised_text_indices)}\")\n",
    "# 使用集合的交集操作  \n",
    "indices_to_discard  = set(null_response_indices) | set(null_revised_indices) | set(noneed_revised_indices) | set(same_revised_text_indices)   \n",
    "print(f\"indices_to_discard: {len(indices_to_discard)}\")\n",
    "# filter length \n",
    "indices_to_discard = indices_to_discard | set(out_of_range_texts_indices)\n",
    "indices_to_discard = list(indices_to_discard)\n",
    "print(f\"indices_to_discard add length: {len(indices_to_discard)}\")\n",
    "temp_data = data\n",
    "# temp_ds = ds.select(range(10))\n",
    "for i, item in enumerate(ds):\n",
    "    # print(item['rejected'])\n",
    "    # index=item['index']\n",
    "    temp_data[i]['rejected'] = item['rejected'][1]['content']\n",
    "    temp_data[i]['instruct'] = item['prompt']\n",
    "    temp_data[i]['chosen'] = item['chosen']\n",
    "revised_data = [item for item in temp_data if item[\"index\"] not in indices_to_discard]\n",
    "revised_data = revised_data[:1000]\n",
    "print(f\"length of revised data: {len(revised_data)}\")\n",
    "textual_aesthetics_chosen = [{\"prompt\": item[\"prompt\"], \"chosen\": item[\"revised_text\"], \"rejected\": item[\"response\"]} for item in revised_data]\n",
    "# with open(f\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_chosen_v2_{lower}_{upper}.json\", 'w') as f:\n",
    "#     json.dump(textual_aesthetics_chosen, f, indent=4)\n",
    "textual_aesthetics_rejected = [{\"prompt\": item[\"prompt\"], \"chosen\": item[\"revised_text\"], \"rejected\": item[\"rejected\"]} for item in revised_data]\n",
    "textual_aesthetics_triple = [{\"prompt\": item[\"prompt\"], \"chosen\": item[\"revised_text\"], \"rejected\": item[\"rejected\"], \"middle\": item[\"response\"]} for item in revised_data]\n",
    "# textual_aesthetics_rejected.extend([{\"prompt\": item[\"prompt\"], \"chosen\": item[\"response\"], \"rejected\": item[\"rejected\"]} for item in temp_data if item[\"index\"] in noneed_revised_indices])  \n",
    "with open(f\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_triple_v2_{lower}_{upper}_debug.json\", 'w') as f:\n",
    "    json.dump(textual_aesthetics_triple, f, indent=4)\n",
    "with open(f\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_rejected_v2_{lower}_{upper}_debug.json\", 'w') as f:\n",
    "    json.dump(textual_aesthetics_triple, f, indent=4)\n",
    "# noneed_with_length_filter = list(set(noneed_revised_indices) | set(out_of_range_texts_indices))\n",
    "# print(f\"noneed_with length filter: {len(noneed_with_length_filter)}\")\n",
    "# textual_aesthetics_rejected.extend([{\"prompt\": item[\"prompt\"], \"chosen\": item[\"response\"], \"rejected\": item[\"rejected\"]} for item in temp_data if item[\"index\"] in noneed_with_length_filter])  \n",
    "# with open(f\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_rejected_v2_{lower}_{upper}_noneed_length_filter.json\", 'w') as f:\n",
    "#     json.dump(textual_aesthetics_rejected, f, indent=4)\n",
    "print(f\"textual_aesthetics_chosen:{len(textual_aesthetics_chosen)}  textual_aesthetics_rejected:{len(textual_aesthetics_rejected)}, textual_aesthetics_triple:{len(textual_aesthetics_triple)}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[{'prompt': 'how can i develop a habit of drawing daily',\n",
       "  'chosen': \"Developing a daily habit of drawing can be challenging, but with consistent practice and a few tips, it can become an enjoyable and rewarding part of your daily routine. Here are some strategies to help you develop the habit of drawing daily:\\n\\n1. **Set a specific time**: Allocate a specific time of the day to draw. It could be in the morning, afternoon, or evening. Make drawing a part of your daily routine.\\n\\n2. **Set a specific duration**: Determine the amount of time you want to spend on drawing each day. It can be as little as 10 minutes or as long as an hour. Be consistent with the duration to help build the habit.\\n\\n3. **Start small and simple**: Don't try to create a masterpiece every day. Start with simple and easy-to-do sketches. Focus on improving your skills gradually.\\n\\n4. **Use a variety of tools and mediums**: Experiment with different tools like pencils, pens, markers, and different mediums like paper, canvas, or digital apps to keep your drawing practice interesting and engaging.\\n\\n5. **Take breaks and rest**: Taking breaks and resting after some time of drawing can help you avoid burnout and stay motivated.\\n\\n6. **Challenge yourself**: Set challenges like drawing objects from memory or a specific subject to improve your skills and keep your drawing practice interesting.\\n\\n7. **Track your progress**: Keep a record of your daily drawing practice and track your progress. This can be a source of motivation and help you see how far you've come.\\n\\nRemember, developing a habit takes time and patience. Stay consistent with your drawing practice, be flexible and open to trying new things, and with time, you'll develop a habit of daily drawing that brings you joy and satisfaction.\",\n",
       "  'rejected': \"As an AI language model, I cannot personally develop habits for you. But, here are some tips for developing a habit of drawing daily:\\n\\n1. Start small: Start with simple drawings or doodles and gradually increase the complexity of your drawings.\\n\\n2. Set a schedule: Set a specific time every day to draw, and try to stick to it as much as possible.\\n\\n3. Make it fun: Don't pressure yourself to create masterpieces every time you draw. Make it a relaxing and enjoyable experience.\\n\\n4. Use resources: There are many drawing tutorials available online. Use resources like YouTube or online drawing courses to help you improve your skills.\\n\\n5. Surround yourself with inspiration: Expose yourself to a variety of art forms, such as paintings, illustrations, and photographs, to inspire and motivate you.\\n\\nRemember, everyone has their own creative style and pace. Just keep practicing and enjoying the process of drawing.\"},\n",
       " {'prompt': \"how can I transform the getPosition method of antv/g's group in zrender?\",\n",
       "  'chosen': \"Modifying built-in methods is generally not recommended as it can lead to unexpected results and potential bugs. Instead, consider the following alternatives:\\n\\n1. **Develop a New Method**: Create a new method that achieves your desired outcome without altering the existing built-in methods.\\n2. **Explore Other Methods**: Look into other methods provided by the library that might offer the functionality you need.\\n3. **Use Other Libraries**: Search for other libraries or modules that provide similar functionalities.\\n4. **Seek Support**: Reach out to the library's support team or community for assistance and guidance.\\n\\nBy following these alternatives, you can achieve your goals while maintaining the stability and reliability of your code.\",\n",
       "  'rejected': 'Thank you for reaching out for assistance! I\\'m here to help you with your question. However, I must point out that the question itself may not be meaningful.\\n\\nThe `getPosition` method is a part of the AntV/G library, which is a gradient boosting framework. It is not clear what you mean by \"transforming\" this method, as it is not a functional programming concept. Additionally, the concept of \"zrender\" is not related to AntV/G.\\n\\nCould you please provide more context or clarify your question? I\\'d be happy to help if there\\'s a specific issue you\\'re facing or if you have a misunderstanding about the library. I\\'m here to assist you in a safe, respectful, and helpful manner.'}]"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "textual_aesthetics_rejected[:2]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[{'prompt': 'how can i develop a habit of drawing daily',\n",
       "  'chosen': \"Developing a daily habit of drawing can be challenging, but with consistent practice and a few tips, it can become an enjoyable and rewarding part of your daily routine. Here are some strategies to help you develop the habit of drawing daily:\\n\\n1. **Set a specific time**: Allocate a specific time of the day to draw. It could be in the morning, afternoon, or evening. Make drawing a part of your daily routine.\\n\\n2. **Set a specific duration**: Determine the amount of time you want to spend on drawing each day. It can be as little as 10 minutes or as long as an hour. Be consistent with the duration to help build the habit.\\n\\n3. **Start small and simple**: Don't try to create a masterpiece every day. Start with simple and easy-to-do sketches. Focus on improving your skills gradually.\\n\\n4. **Use a variety of tools and mediums**: Experiment with different tools like pencils, pens, markers, and different mediums like paper, canvas, or digital apps to keep your drawing practice interesting and engaging.\\n\\n5. **Take breaks and rest**: Taking breaks and resting after some time of drawing can help you avoid burnout and stay motivated.\\n\\n6. **Challenge yourself**: Set challenges like drawing objects from memory or a specific subject to improve your skills and keep your drawing practice interesting.\\n\\n7. **Track your progress**: Keep a record of your daily drawing practice and track your progress. This can be a source of motivation and help you see how far you've come.\\n\\nRemember, developing a habit takes time and patience. Stay consistent with your drawing practice, be flexible and open to trying new things, and with time, you'll develop a habit of daily drawing that brings you joy and satisfaction.\",\n",
       "  'rejected': \"As an AI language model, I cannot personally develop habits for you. But, here are some tips for developing a habit of drawing daily:\\n\\n1. Start small: Start with simple drawings or doodles and gradually increase the complexity of your drawings.\\n\\n2. Set a schedule: Set a specific time every day to draw, and try to stick to it as much as possible.\\n\\n3. Make it fun: Don't pressure yourself to create masterpieces every time you draw. Make it a relaxing and enjoyable experience.\\n\\n4. Use resources: There are many drawing tutorials available online. Use resources like YouTube or online drawing courses to help you improve your skills.\\n\\n5. Surround yourself with inspiration: Expose yourself to a variety of art forms, such as paintings, illustrations, and photographs, to inspire and motivate you.\\n\\nRemember, everyone has their own creative style and pace. Just keep practicing and enjoying the process of drawing.\",\n",
       "  'middle': \"Developing a daily habit of drawing can be challenging but with consistent practice and a few tips, it can become an enjoyable and rewarding part of your daily routine. Here are some strategies to help you develop the habit of drawing daily:\\n\\n1. Set a specific time: Allocate a specific time of the day to draw. It could be in the morning, afternoon, or evening. Make drawing a part of your daily routine.\\n2. Set a specific duration: Determine the amount of time you want to spend on drawing each day. It can be as little as 10 minutes or as long as an hour. Be consistent with the duration to help build the habit.\\n3. Start small and simple: Don't try to create a masterpiece every day, start with simple and easy-to-do sketches. Focus on improving your skills gradually.\\n4. Use a variety of tools and mediums: Experiment with different tools like pencils, pens, markers, and different mediums like paper, canvas, or digital apps to keep your drawing practice interesting and engaging.\\n5. Take breaks and rest: Taking breaks and resting after some time of drawing can help you avoid burnout and stay motivated.\\n6. Challenge yourself: Set challenges like drawing objects from memory or a specific subject to improve your skills and keep your drawing practice interesting.\\n7. Track your progress: Keep a record of your daily drawing practice and track your progress. This can be a source of motivation and help you see how far you've come.\\n\\nRemember, developing a habit takes time and patience. Stay consistent with your drawing practice, be flexible and open to trying new things, and with time, you'll develop a habit of daily drawing that brings you joy and satisfaction.\"},\n",
       " {'prompt': \"how can I transform the getPosition method of antv/g's group in zrender?\",\n",
       "  'chosen': \"Modifying built-in methods is generally not recommended as it can lead to unexpected results and potential bugs. Instead, consider the following alternatives:\\n\\n1. **Develop a New Method**: Create a new method that achieves your desired outcome without altering the existing built-in methods.\\n2. **Explore Other Methods**: Look into other methods provided by the library that might offer the functionality you need.\\n3. **Use Other Libraries**: Search for other libraries or modules that provide similar functionalities.\\n4. **Seek Support**: Reach out to the library's support team or community for assistance and guidance.\\n\\nBy following these alternatives, you can achieve your goals while maintaining the stability and reliability of your code.\",\n",
       "  'rejected': 'Thank you for reaching out for assistance! I\\'m here to help you with your question. However, I must point out that the question itself may not be meaningful.\\n\\nThe `getPosition` method is a part of the AntV/G library, which is a gradient boosting framework. It is not clear what you mean by \"transforming\" this method, as it is not a functional programming concept. Additionally, the concept of \"zrender\" is not related to AntV/G.\\n\\nCould you please provide more context or clarify your question? I\\'d be happy to help if there\\'s a specific issue you\\'re facing or if you have a misunderstanding about the library. I\\'m here to assist you in a safe, respectful, and helpful manner.',\n",
       "  'middle': \"It is not recommended to modify built-in methods as it can lead to unexpected results and potential bugs. You may consider developing a new method or exploring other methods to achieve your desired outcome. Alternatively, you can search for other libraries or modules that offer similar functionalities or reach out to the library's support team for assistance.\"}]"
      ]
     },
     "execution_count": 10,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "textual_aesthetics_triple[:2]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "from datasets import load_dataset, Dataset\n",
    "import pandas as pd\n",
    "import json\n",
    "data = read_jsonl(\"revised_data/output_sorted.jsonl\")\n",
    "not_revised = [item['index'] for item in data if item['revised_text'] == '']\n",
    "ds = load_dataset(\"HuggingFaceH4/ultrafeedback_binarized\", split=\"train_prefs\")\n",
    "def get_instruct_response(item):\n",
    "    # item[\"instruction\"] = item['chosen'][0][\"content\"]\n",
    "    item[\"response\"] = item['chosen'][1][\"content\"]\n",
    "    return item\n",
    "ds = ds.map(get_instruct_response, batch_size=1024, num_proc=8)\n",
    "export_data = ds.select_columns([\"prompt\", \"response\"])\n",
    "# export_data\n",
    "# data = filtered_revised_data\n",
    "not_revised = [item['index'] for item in data if item['revised_text'] == '']\n",
    "# datalen\n",
    "# data\n",
    "indices = set([item['index'] for item in data])\n",
    "# original_indices = set(range(export_data.shape[0]))\n",
    "# print(f\"index complete: {original_indices - indices}\")\n",
    "null_response_indices = [item['index'] for item in data if item['gpt_answer'].strip() == '']\n",
    "null_revised_indices = [item['index'] for item in data if item['revised_text'].strip() == '']\n",
    "noneed_revised_indices = [item['index'] for item in data if item['does_it_need_modification'].strip() == 'N']\n",
    "same_revised_text_indices = [item['index'] for item in data if item['response'].strip() == item['revised_text'].strip()]\n",
    "\n",
    "# print(len(null_response))\n",
    "# print(len(not_revised))\n",
    "print(f\"null_response_indices:{len(null_response_indices)}\")\n",
    "print(f\"null_revised_indices:{len(null_revised_indices)}\")\n",
    "print(f\"noneed_revised_indices:{len(noneed_revised_indices)}\")\n",
    "print(f\"same_revised_text_indices:{len(same_revised_text_indices)}\")\n",
    "# 使用集合的交集操作  \n",
    "indices_to_discard  = set(null_response_indices) | set(null_revised_indices) | set(noneed_revised_indices) | set(same_revised_text_indices)   \n",
    "print(f\"indices_to_discard: {len(indices_to_discard)}\")\n",
    "# filter length \n",
    "indices_to_discard = indices_to_discard | set(out_of_range_texts_indices)\n",
    "indices_to_discard = list(indices_to_discard)\n",
    "print(f\"indices_to_discard add length: {len(indices_to_discard)}\")\n",
    "temp_data = data\n",
    "# temp_ds = ds.select(range(10))\n",
    "for i, item in enumerate(ds):\n",
    "    # print(item['rejected'])\n",
    "    # index=item['index']\n",
    "    temp_data[i]['rejected'] = item['rejected'][1]['content']\n",
    "    temp_data[i]['instruct'] = item['prompt']\n",
    "    temp_data[i]['chosen'] = item['chosen']\n",
    "revised_data = [item for item in temp_data if item[\"index\"] not in indices_to_discard]\n",
    "print(f\"length of revised data: {len(revised_data)}\")\n",
    "textual_aesthetics_chosen = [{\"prompt\": item[\"prompt\"], \"chosen\": item[\"revised_text\"], \"rejected\": item[\"response\"]} for item in revised_data]\n",
    "# with open(\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_chosen_v4_{lower}_{upper}.json\", 'w') as f:\n",
    "#     json.dump(textual_aesthetics_chosen, f, indent=4)\n",
    "textual_aesthetics_rejected = [{\"prompt\": item[\"prompt\"], \"chosen\": item[\"revised_text\"], \"rejected\": item[\"rejected\"]} for item in revised_data]\n",
    "with open(f\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_rejected_v4_{lower}_{upper}.json\", 'w') as f:\n",
    "    json.dump(textual_aesthetics_rejected, f, indent=4)\n",
    "print(f\"textual_aesthetics_chosen:{len(textual_aesthetics_chosen)}  textual_aesthetics_rejected:{len(textual_aesthetics_rejected)}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Counter({0: 1566, -1: 1316, 1: 1107, 2: 995, 3: 858, 4: 784, -2: 764, 5: 697, 6: 676, -6: 650, 7: 634, -3: 631, 10: 625, 9: 616, 8: 613, 12: 605, 11: 576, 13: 559, -7: 558, 18: 550, -4: 543, 15: 537, 20: 537, -5: 533, 14: 530, 16: 507, 19: 499, 21: 494, -8: 482, 17: 482, 23: 482, 24: 477, 22: 440, 29: 417, -10: 415, 25: 415, 27: 414, -9: 414, 30: 413, 26: 408, 31: 403, 28: 400, 34: 378, 33: 375, 32: 373, 39: 364, -12: 362, 35: 359, -13: 348, 36: 345, -11: 345, -15: 334, 37: 329, 42: 324, 38: 318, 40: 313, 43: 313, -14: 307, 44: 305, -16: 303, -17: 291, -18: 284, 48: 281, 41: 281, 46: 275, 45: 266, -20: 254, 50: 251, -19: 244, 47: 243, 56: 241, 51: 241, -21: 238, -22: 229, 54: 226, -24: 224, 49: 224, -23: 215, 53: 212, -25: 207, -26: 202, 55: 201, 52: 201, -30: 191, -29: 189, 60: 189, -33: 184, -27: 184, -28: 183, 57: 182, 62: 181, -32: 181, 58: 176, -31: 175, 63: 167, 59: 165, 61: 165, -35: 162, 70: 160, -36: 158, 67: 158, -34: 157, 69: 153, 68: 152, 65: 149, 64: 148, 66: 148, 71: 145, -39: 145, -42: 139, -38: 137, -37: 133, -40: 132, 74: 130, -49: 126, 73: 125, -41: 125, 77: 124, 87: 123, -46: 122, 78: 119, -43: 118, -47: 117, 72: 117, 81: 117, 79: 113, -48: 113, 76: 112, 75: 112, -44: 109, -45: 109, 83: 104, -53: 100, 84: 100, 85: 97, -50: 96, -52: 96, 82: 94, 80: 94, 89: 94, -55: 93, 96: 92, -51: 91, 92: 90, -59: 90, -61: 89, -56: 89, -54: 88, -60: 87, 88: 86, -62: 85, 95: 84, -66: 84, -58: 84, 94: 83, 86: 82, -57: 80, 93: 79, 105: 79, -63: 78, 100: 77, -67: 75, 90: 75, -65: 74, 91: 73, 117: 73, -74: 72, -69: 72, 99: 72, 111: 71, -64: 70, -68: 67, 104: 67, 107: 67, 98: 66, 103: 66, 136: 65, 114: 64, 102: 64, 106: 63, 108: 63, 101: 63, -76: 62, -78: 62, -73: 61, 116: 61, -80: 60, 123: 60, -89: 59, -79: 59, 97: 59, 125: 58, 121: 57, 118: 57, -84: 57, 115: 56, 109: 56, 110: 56, -70: 56, -71: 56, 135: 56, -75: 55, -83: 55, 122: 54, 112: 54, -72: 53, 113: 53, -77: 53, -91: 52, -86: 51, 128: 51, -82: 50, 137: 50, 126: 50, 130: 50, 124: 49, 119: 49, 134: 48, 139: 48, 157: 48, -85: 47, -88: 47, 127: 47, 169: 46, -90: 46, 129: 46, 145: 46, 120: 46, 138: 45, 133: 44, 155: 44, 140: 43, 146: 43, -81: 43, 156: 42, 164: 42, -97: 42, 177: 42, 175: 41, 158: 41, 149: 41, -95: 40, 154: 40, -102: 39, 165: 39, 143: 39, -87: 38, 160: 38, 131: 38, -103: 38, -94: 38, 163: 37, 152: 37, 132: 37, 144: 37, -96: 36, -100: 36, 228: 36, 161: 36, 142: 35, 141: 35, 166: 35, 153: 35, -92: 34, -118: 34, 184: 34, 147: 34, 159: 34, 213: 34, -98: 33, -99: 33, 174: 33, -123: 32, -115: 32, 172: 31, 197: 31, 182: 31, 193: 31, 200: 31, 170: 31, -113: 31, 148: 31, 190: 30, -106: 30, -107: 30, 201: 29, 212: 29, -111: 29, 189: 29, 180: 29, -93: 29, 203: 28, 192: 28, -105: 28, 225: 28, 183: 28, -121: 27, -101: 27, 202: 27, -117: 27, 167: 26, 214: 26, -104: 26, -116: 26, 151: 26, 218: 26, 195: 26, -110: 25, -133: 25, 186: 25, 427: 25, 247: 25, 181: 25, 248: 25, 426: 25, 168: 25, -122: 24, -114: 24, 204: 24, 150: 24, 179: 24, 272: 24, 244: 24, -109: 24, 185: 24, -128: 24, 215: 24, 237: 24, 231: 24, 171: 23, -143: 23, 178: 23, -120: 23, 198: 23, -132: 23, 216: 23, 187: 23, 173: 23, 233: 23, -135: 23, -125: 23, 176: 23, 262: 23, 229: 23, 280: 23, -126: 22, -150: 22, -131: 22, 256: 22, 252: 22, 162: 22, -112: 22, 199: 22, 255: 22, 191: 22, 251: 22, 220: 22, 227: 22, -127: 22, 240: 22, -142: 22, 230: 21, 223: 21, 226: 21, 234: 21, 296: 21, 194: 21, 270: 21, -124: 21, -138: 21, 221: 21, 206: 21, -119: 21, 219: 21, -129: 20, -145: 20, 242: 20, 245: 20, 205: 20, -149: 20, 236: 20, 217: 20, 269: 20, -108: 20, 207: 20, 263: 19, 259: 19, 428: 19, -137: 19, 224: 19, 273: 19, -136: 19, 243: 19, 208: 19, 196: 18, 267: 18, 447: 18, 258: 18, 289: 18, 283: 18, 239: 18, -157: 18, 264: 17, -139: 17, -140: 17, -153: 17, 361: 17, 222: 17, 275: 17, 389: 17, -151: 17, 355: 17, 339: 17, 241: 17, 235: 17, 238: 17, 421: 16, 358: 16, 284: 16, -197: 16, 310: 16, 249: 16, 188: 16, 305: 16, 444: 16, 370: 16, 276: 16, 303: 16, 425: 16, -163: 16, 295: 16, 271: 16, 253: 16, 306: 16, 291: 16, 408: 16, 342: 15, 329: 15, 246: 15, -155: 15, 422: 15, 286: 15, -148: 15, 312: 15, 423: 15, 211: 15, -165: 15, 210: 15, -144: 15, 363: 15, 410: 15, -147: 15, 265: 15, 300: 15, 294: 15, 457: 15, 372: 14, 288: 14, 316: 14, 344: 14, 397: 14, 268: 14, 330: 14, 519: 14, 446: 14, 261: 14, 418: 14, 336: 14, 331: 14, 449: 14, 257: 14, 277: 14, 287: 14, 420: 14, 250: 14, -161: 14, -173: 14, 311: 14, 327: 13, -168: 13, 254: 13, 320: 13, 337: 13, 297: 13, 232: 13, -169: 13, 274: 13, -158: 13, -170: 13, 324: 13, 285: 13, 455: 13, 385: 13, -159: 13, -130: 13, -141: 12, 409: 12, -166: 12, 266: 12, -201: 12, 282: 12, 260: 12, 412: 12, 347: 12, 381: 12, 442: 12, -156: 12, 354: 12, 278: 12, 400: 12, 299: 12, -152: 12, -146: 12, 293: 12, -176: 12, -199: 11, 432: 11, -177: 11, 319: 11, 430: 11, -167: 11, 341: 11, 419: 11, 441: 11, 333: 11, 518: 11, -164: 11, 209: 11, 368: 11, 417: 11, 393: 11, 328: 11, -213: 11, 450: 11, 405: 11, 488: 11, 462: 11, 480: 11, 390: 11, 302: 11, 388: 11, 346: 11, -162: 11, 481: 11, 335: 11, 378: 11, 487: 10, 639: 10, 435: 10, 440: 10, -225: 10, 402: 10, 406: 10, 401: 10, 505: 10, 359: 10, 464: 10, -182: 10, -134: 10, 290: 10, 377: 10, 415: 10, 511: 10, 314: 10, 298: 10, -179: 10, -154: 10, -191: 10, 467: 10, 323: 10, -160: 10, -190: 10, 334: 10, 436: 10, 383: 10, 544: 10, 308: 10, -186: 10, 313: 10, 315: 10, 349: 9, -207: 9, 497: 9, 460: 9, 529: 9, 474: 9, 382: 9, 403: 9, 394: 9, 326: 9, -184: 9, 490: 9, 516: 9, -212: 9, -180: 9, 340: 9, 484: 9, 416: 9, 500: 9, 392: 9, 453: 9, 614: 9, 371: 9, 530: 9, 404: 9, 592: 9, 279: 9, 367: 9, 281: 9, 424: 9, -194: 9, 304: 9, 445: 9, 380: 9, 387: 9, 413: 9, 332: 9, -221: 8, -238: 8, 501: 8, 658: 8, 362: 8, -206: 8, 506: 8, 461: 8, 307: 8, 451: 8, 338: 8, 443: 8, -231: 8, -178: 8, -211: 8, 521: 8, 348: 8, 465: 8, 486: 8, 523: 8, -289: 8, 478: 8, 485: 8, -222: 8, 532: 8, -257: 8, -195: 8, -202: 8, 398: 8, 321: 8, 434: 8, 429: 8, 384: 8, 492: 8, -254: 8, 475: 8, 493: 8, 366: 8, 301: 8, -227: 7, 578: 7, 468: 7, 350: 7, 536: 7, 520: 7, 508: 7, 351: 7, -240: 7, 433: 7, 439: 7, 375: 7, 601: 7, -217: 7, 743: 7, -242: 7, -200: 7, 513: 7, 593: 7, 634: 7, 524: 7, 526: 7, 509: 7, 489: 7, -188: 7, 527: 7, 559: 7, 352: 7, 680: 7, 356: 7, 407: 7, 373: 7, 557: 7, 343: 7, 564: 7, 596: 7, 399: 7, -185: 7, 396: 7, 494: 7, 589: 7, 504: 7, -214: 7, 345: 6, 317: 6, 587: 6, 638: 6, 552: 6, -196: 6, 379: 6, -205: 6, -193: 6, 459: 6, 633: 6, 566: 6, 577: 6, -204: 6, -311: 6, 476: 6, 612: 6, 318: 6, 551: 6, 364: 6, -174: 6, 623: 6, 651: 6, 562: 6, 507: 6, 555: 6, 470: 6, 661: 6, 322: 6, 437: 6, 620: 6, -250: 6, 687: 6, 617: 6, 528: 6, -220: 6, 448: 6, -209: 6, -298: 6, -233: 6, 753: 6, -224: 6, 431: 6, -183: 6, 556: 6, 579: 6, 1894: 6, 554: 5, 292: 5, 411: 5, 667: 5, 365: 5, -317: 5, -187: 5, -232: 5, 649: 5, 681: 5, -241: 5, -234: 5, -236: 5, -226: 5, 510: 5, -356: 5, 696: 5, 540: 5, 357: 5, 622: 5, 482: 5, 595: 5, 840: 5, 376: 5, -228: 5, -215: 5, -237: 5, -246: 5, 496: 5, 701: 5, 515: 5, -256: 5, 792: 5, -181: 5, -329: 5, 537: 5, -175: 5, -270: 5, 581: 5, 784: 5, -294: 5, -218: 5, -371: 5, 640: 5, 503: 5, 477: 5, 636: 5, -292: 5, 534: 5, -244: 5, 624: 5, 325: 5, 627: 5, 353: 5, 533: 5, 631: 5, 662: 5, -210: 5, 369: 5, 591: 5, 483: 5, 386: 5, 856: 5, 576: 5, 414: 5, 664: 5, 770: 5, 514: 5, -266: 5, 642: 5, -198: 5, 547: 5, 309: 5, 934: 4, 580: 4, -309: 4, 517: 4, 647: 4, -297: 4, 473: 4, -229: 4, 697: 4, 588: 4, -324: 4, -343: 4, 573: 4, -269: 4, 778: 4, 898: 4, 395: 4, 914: 4, 599: 4, 616: 4, -284: 4, -203: 4, 761: 4, 654: 4, 391: 4, 684: 4, 825: 4, -251: 4, 648: 4, 539: 4, 602: 4, 796: 4, 575: 4, 605: 4, 615: 4, 463: 4, 668: 4, -272: 4, -403: 4, 719: 4, 643: 4, 674: 4, 600: 4, 626: 4, 495: 4, 653: 4, -391: 4, -346: 4, 666: 4, -480: 4, 454: 4, 472: 4, 565: 4, 438: 4, -333: 4, 619: 4, -381: 4, 670: 4, 1892: 4, 754: 4, -219: 4, -245: 4, 810: 4, 645: 4, 590: 4, 553: 4, 924: 4, 689: 4, 561: 4, 734: 4, -192: 4, 584: 4, -189: 4, -249: 4, 558: 4, 675: 4, 360: 4, 621: 4, -223: 4, -344: 4, 717: 4, 548: 4, 609: 4, 669: 4, 512: 4, -263: 4, -258: 4, -267: 4, -369: 4, -172: 4, -208: 4, 560: 4, 374: 4, 706: 4, 586: 4, -340: 4, 797: 3, -463: 3, 782: 3, -296: 3, -216: 3, 499: 3, -394: 3, 629: 3, -436: 3, 572: 3, 765: 3, -306: 3, -373: 3, 452: 3, 604: 3, 789: 3, -271: 3, -230: 3, 571: 3, -268: 3, -477: 3, 1106: 3, 979: 3, 663: 3, 1008: 3, -457: 3, 828: 3, 693: 3, 694: 3, 545: 3, -363: 3, 456: 3, -303: 3, -318: 3, 727: 3, 699: 3, 613: 3, 635: 3, -302: 3, -338: 3, 568: 3, 745: 3, 714: 3, 865: 3, -487: 3, 723: 3, 884: 3, 665: 3, -247: 3, 672: 3, -262: 3, 646: 3, -239: 3, -280: 3, 764: 3, 543: 3, -434: 3, -482: 3, 921: 3, 741: 3, 709: 3, -379: 3, -366: 3, -275: 3, 970: 3, -314: 3, -253: 3, 931: 3, 630: 3, -326: 3, 531: 3, 650: 3, 958: 3, -500: 3, 574: 3, 900: 3, -287: 3, 597: 3, -288: 3, 585: 3, 703: 3, 685: 3, 917: 3, 827: 3, -305: 3, 628: 3, -445: 3, 471: 3, -171: 3, 777: 3, 1171: 3, -410: 3, 829: 3, -417: 3, -525: 3, -374: 3, 611: 3, 546: 3, 756: 3, -323: 3, 563: 3, -291: 3, 1098: 3, 538: 3, 843: 3, -476: 3, 469: 3, -370: 3, 853: 3, 632: 3, -252: 3, 1891: 3, 861: 3, 660: 3, 491: 3, -437: 3, -327: 3, 838: 3, 973: 3, -386: 3, 732: 3, 1004: 3, 657: 3, 845: 3, 677: 3, 805: 2, 695: 2, -415: 2, 1844: 2, -768: 2, 794: 2, 820: 2, -397: 2, 1099: 2, 760: 2, 907: 2, 1026: 2, -337: 2, -646: 2, -462: 2, -281: 2, -248: 2, 1540: 2, -447: 2, 1027: 2, -438: 2, 725: 2, -635: 2, 918: 2, 1189: 2, -365: 2, 740: 2, 1508: 2, 804: 2, -712: 2, 749: 2, 1082: 2, 1897: 2, 1116: 2, 594: 2, 618: 2, 1172: 2, 679: 2, -428: 2, 729: 2, 567: 2, -355: 2, 1144: 2, -310: 2, -279: 2, 690: 2, -282: 2, -357: 2, 881: 2, 971: 2, 834: 2, 479: 2, 1181: 2, 673: 2, 877: 2, 1170: 2, 844: 2, 569: 2, 852: 2, 625: 2, 954: 2, -652: 2, 752: 2, 1137: 2, 466: 2, -259: 2, 1233: 2, -651: 2, -607: 2, 987: 2, 813: 2, 911: 2, 980: 2, 826: 2, -472: 2, 823: 2, 1282: 2, 716: 2, 1043: 2, 535: 2, 1201: 2, 1979: 2, 1359: 2, -364: 2, -425: 2, 644: 2, 498: 2, -458: 2, 1101: 2, -569: 2, 920: 2, -553: 2, -315: 2, 686: 2, 726: 2, -573: 2, -405: 2, 522: 2, 570: 2, 1006: 2, 678: 2, -662: 2, 606: 2, 806: 2, 969: 2, -402: 2, -339: 2, -362: 2, 835: 2, 637: 2, -243: 2, -515: 2, -426: 2, -429: 2, 983: 2, -299: 2, -312: 2, -490: 2, 1092: 2, 1033: 2, 988: 2, 938: 2, -235: 2, 659: 2, 972: 2, -603: 2, 869: 2, -261: 2, -335: 2, -393: 2, 790: 2, 883: 2, -265: 2, 525: 2, 793: 2, -375: 2, 715: 2, -432: 2, 747: 2, 705: 2, 1097: 2, -554: 2, -548: 2, -295: 2, 854: 2, -330: 2, 1210: 2, 458: 2, 1042: 2, 550: 2, 700: 2, 762: 2, 1696: 2, 711: 2, -570: 2, 788: 2, -277: 2, 641: 2, 816: 2, 1014: 2, 1110: 2, 656: 2, 948: 2, 910: 2, 1155: 2, 1331: 2, 603: 2, 799: 2, 682: 2, 1076: 2, 1297: 2, 1893: 2, -409: 2, 766: 2, 1016: 2, -528: 2, -322: 2, 1241: 2, -413: 2, -421: 2, -334: 2, -290: 2, -461: 2, 1399: 2, 893: 2, -320: 2, 779: 2, -551: 2, 894: 2, 772: 2, 798: 2, 811: 2, 964: 2, -382: 2, 758: 2, 702: 2, 691: 2, 1075: 2, 1059: 2, -341: 2, 1052: 2, 724: 2, 943: 2, 759: 2, 1187: 2, 776: 2, 1183: 2, 610: 2, -450: 2, 876: 2, -467: 2, 1003: 2, 757: 2, 733: 2, 542: 2, 598: 2, 1220: 1, 1134: 1, -508: 1, 1455: 1, 1289: 1, 1009: 1, -780: 1, 975: 1, -714: 1, -762: 1, 1093: 1, 1280: 1, 1064: 1, 998: 1, -449: 1, -398: 1, 1211: 1, 1466: 1, -647: 1, 960: 1, 863: 1, -513: 1, -633: 1, 867: 1, 1196: 1, 1272: 1, -558: 1, 1242: 1, 1215: 1, -826: 1, 704: 1, 707: 1, -274: 1, -691: 1, -590: 1, 1878: 1, 1045: 1, 1192: 1, 864: 1, 1452: 1, -754: 1, 1332: 1, -486: 1, 1614: 1, 976: 1, 1010: 1, -724: 1, -475: 1, -383: 1, -1024: 1, -577: 1, -580: 1, 1635: 1, 502: 1, 850: 1, 1925: 1, -501: 1, -368: 1, 815: 1, 871: 1, -454: 1, 846: 1, 737: 1, -597: 1, -934: 1, 1227: 1, 1987: 1, 787: 1, 791: 1, -692: 1, -709: 1, 978: 1, 1238: 1, -519: 1, -285: 1, -406: 1, 1350: 1, 1372: 1, 1234: 1, 1136: 1, 795: 1, 1096: 1, -536: 1, 912: 1, 803: 1, 1060: 1, 1401: 1, 897: 1, 722: 1, 1646: 1, 951: 1, 1057: 1, 1340: 1, -850: 1, -495: 1, 990: 1, -680: 1, 731: 1, 925: 1, 860: 1, -392: 1, 858: 1, 1692: 1, 1747: 1, 1330: 1, 895: 1, -687: 1, 1362: 1, 1776: 1, -681: 1, 942: 1, -468: 1, -489: 1, -332: 1, 1469: 1, 721: 1, -331: 1, -336: 1, 771: 1, -512: 1, 688: 1, 773: 1, -441: 1, 968: 1, 1904: 1, 1145: 1, 1287: 1, 944: 1, 671: 1, -833: 1, 1118: 1, -442: 1, -811: 1, 906: 1, 1114: 1, -630: 1, 1065: 1, -757: 1, -378: 1, 1163: 1, -499: 1, 780: 1, -260: 1, 887: 1, 1885: 1, -698: 1, -643: 1, -328: 1, 953: 1, 995: 1, 807: 1, -424: 1, -308: 1, 1184: 1, -423: 1, -563: 1, -469: 1, 1047: 1, 1439: 1, 1195: 1, 961: 1, 1333: 1, 728: 1, -792: 1, -443: 1, -1018: 1, 1129: 1, 901: 1, 1051: 1, 698: 1, -860: 1, 833: 1, -439: 1, -719: 1, 1120: 1, -361: 1, -479: 1, -638: 1, 1838: 1, -407: 1, -430: 1, -676: 1, -616: 1, -708: 1, 1159: 1, 1257: 1, -560: 1, 1040: 1, -761: 1, 841: 1, -478: 1, 1547: 1, 1094: 1, 1966: 1, 1274: 1, 1219: 1, 583: 1, 582: 1, -867: 1, 1090: 1, -399: 1, 1266: 1, 755: 1, 1022: 1, 1044: 1, 1367: 1, -283: 1, 1062: 1, 655: 1, 1235: 1, -529: 1, -605: 1, -716: 1, 909: 1, 1028: 1, 1927: 1, 956: 1, 1049: 1, 785: 1, -538: 1, 1150: 1, -388: 1, 1292: 1, 1458: 1, -659: 1, 1440: 1, 713: 1, -506: 1, -385: 1, -503: 1, 720: 1, 930: 1, -316: 1, 872: 1, 1154: 1, -670: 1, 1437: 1, 1907: 1, -255: 1, 549: 1, -669: 1, 992: 1, 974: 1, 1911: 1, -556: 1, -654: 1, 809: 1, 880: 1, -944: 1, -583: 1, -631: 1, 708: 1, 1237: 1, -494: 1, 1041: 1, 1286: 1, -622: 1, 1336: 1, -533: 1, 652: 1, 1666: 1, 1179: 1, 1537: 1, 905: 1, 1250: 1, 812: 1, 1442: 1, -701: 1, -304: 1, -505: 1, 1111: 1, -293: 1, 1025: 1, -787: 1, 1858: 1, 1125: 1, -592: 1, 1541: 1, -313: 1, -637: 1, -608: 1, -739: 1, -540: 1, 710: 1, -456: 1, 922: 1, -593: 1, 2673: 1, 1035: 1, 1279: 1, 1133: 1, -562: 1, 1410: 1, -459: 1, 1078: 1, 1029: 1, -527: 1, 739: 1, -596: 1, 1777: 1, 1071: 1, 746: 1, 874: 1, 786: 1, -422: 1, -606: 1, -783: 1, 836: 1, 1586: 1, 1216: 1, 945: 1, 903: 1, -614: 1, 1928: 1, 541: 1, -485: 1, -618: 1, 847: 1, -752: 1, 1072: 1, 750: 1, 1084: 1, -347: 1, 1131: 1, 1138: 1, -359: 1, -619: 1, 1063: 1, -629: 1, -440: 1, 1853: 1, 1124: 1, 1074: 1, 1182: 1, 927: 1, -433: 1, -286: 1, 774: 1, 886: 1, -737: 1, 1206: 1, 676: 1, 1229: 1, 1146: 1, -273: 1, 991: 1, -301: 1, -674: 1, 941: 1, 932: 1, 937: 1, -796: 1, 848: 1, 1814: 1, 1254: 1, -350: 1, -352: 1, -404: 1, 1304: 1, -523: 1, 1326: 1, 890: 1, 904: 1, -321: 1, 1772: 1, 947: 1, 608: 1, 1638: 1, 959: 1, 873: 1, -325: 1, -763: 1, 977: 1, -648: 1, 1392: 1, 1347: 1, 928: 1, -587: 1, 718: 1, -474: 1, -389: 1, -966: 1, 1148: 1, 1856: 1, 1481: 1, -522: 1, 1800: 1, -568: 1, 892: 1, -264: 1, 1577: 1, 1953: 1, -541: 1, 1916: 1, 955: 1, 1636: 1, -853: 1, 1863: 1, 751: 1, 1066: 1, 683: 1, -547: 1, 1387: 1, 889: 1, -897: 1, 1117: 1, 1598: 1, 1839: 1, 822: 1, -342: 1, -451: 1, 814: 1, -484: 1, 1823: 1, 775: 1, 1901: 1, -376: 1, -588: 1, 999: 1, -628: 1, -679: 1, 896: 1, -657: 1, 1077: 1, 1446: 1, 1103: 1, -420: 1, -604: 1, -411: 1, 1212: 1, 1295: 1, 1785: 1, -731: 1, -470: 1, -412: 1, 963: 1, 936: 1, 1152: 1, 1988: 1, 859: 1, 744: 1, 1247: 1, 1903: 1, 837: 1, -642: 1, 1861: 1, 1165: 1, 730: 1, 800: 1, 1329: 1, 1156: 1, 1625: 1, 1132: 1, 1299: 1, 1180: 1, 1603: 1, 1036: 1, -481: 1, 1361: 1, 1811: 1, 1365: 1, 1569: 1, -349: 1, 1015: 1, 1149: 1, 1020: 1, -520: 1, 817: 1, -634: 1, 1889: 1, -380: 1})\n",
      "Mean: 49.15065020037622, Median: 13.0, Standard Deviation: 169.45465111600666\n",
      "90% Confidence Interval: [-143.0, 342.0]\n",
      "Max length difference: 2673, Min length difference: -1024\n",
      "out_of_range_texts length 4638\n"
     ]
    },
    {
     "data": {
      "image/png": "iVBORw0KGgoAAAANSUhEUgAAA1sAAAIjCAYAAAD1OgEdAAAAOXRFWHRTb2Z0d2FyZQBNYXRwbG90bGliIHZlcnNpb24zLjkuMSwgaHR0cHM6Ly9tYXRwbG90bGliLm9yZy/TGe4hAAAACXBIWXMAAA9hAAAPYQGoP6dpAABy5UlEQVR4nO3dd3hUddrG8XvSEyCEmhClZBEQEERBMSsova5rYUUEBRXBAopi5VURsCCoiCCCuAK6goUVG4tIpIgC0iRSpRmIAimQ3iczv/ePmJEhAULI5CTk+7kurnDO+Z0zz3kymcydU8ZmjDECAAAAAJQpL6sLAAAAAIALEWELAAAAADyAsAUAAAAAHkDYAgAAAAAPIGwBAAAAgAcQtgAAAADAAwhbAAAAAOABhC0AAAAA8ADCFgAAAAB4AGELAKqwLl266LLLLivXx7TZbJowYYLbvM2bN+vvf/+7qlWrJpvNpujoaEnS8uXL1a5dOwUEBMhmsyklJaVca63s7rrrLjVp0qRcHqtJkya66667XNMLFiyQzWbTli1byuXxu3Tpoi5dupTLYwFASRG2AOA8lfebynN19OhRTZgwwRVgylKTJk1ks9lks9nk5eWlkJAQtWnTRiNHjtTGjRtLtA273a5bb71VSUlJeuONN/Sf//xHjRs31okTJzRw4EAFBgZq1qxZ+s9//qNq1aqV+T5UFhMmTHD12mazKSgoSI0aNdINN9yg+fPnKzc3t0weZ/fu3ZowYYIOHTpUJtsrSxW5NgAojo/VBQAAPOvo0aOaOHGimjRponbt2pX59tu1a6fHHntMkpSenq49e/Zo8eLFevfdd/Xoo49q2rRpbuOzs7Pl4/PXr5+DBw/q8OHDevfdd3Xvvfe65i9fvlzp6el64YUX1KNHjzKvu7KaPXu2qlevrtzcXB05ckTffvut7rnnHk2fPl1Lly5Vw4YNXWPfffddOZ3Oc9r+7t27NXHiRHXp0uWcjort3btXXl6e/RvumWpbsWKFRx8bAEqDsAUAOC8XXXSR7rjjDrd5U6ZM0eDBg/XGG2+oWbNmeuCBB1zLAgIC3MYmJCRIkkJCQko0/3xkZmZW+qNj//rXv1S3bl3X9Pjx47Vw4UINHTpUt956q3766SfXMl9fX4/WYoxRTk6OAgMD5e/v79HHOhs/Pz9LHx8AisNphABQTo4cOaJ77rlHoaGh8vf3V+vWrTVv3jy3MWvWrJHNZtOnn36ql156SRdffLECAgLUvXt3HThwoMg2Z82apb/97W8KDAzU1VdfrR9++MHt2pU1a9boqquukiTdfffdrlPQFixY4Lad3bt3q2vXrgoKCtJFF12kqVOnnte+BgYG6j//+Y9q166tl156ScYY17KTr9m66667dP3110uSbr31VtlsNlf9w4YNkyRdddVVstlsbtcDbdy4UX369FHNmjUVFBSk66+/XuvWrXOrofC0u927d2vw4MGqVauWOnXq5Fr+4Ycfqn379goMDFTt2rU1aNAg/f77727bKLymrST9ycnJ0YQJE9S8eXMFBASoQYMGuuWWW3Tw4EHXGKfTqenTp6t169YKCAhQaGio7rvvPiUnJ5eu0X8aMmSI7r33Xm3cuFFRUVGu+cVds/Xxxx+rffv2qlGjhoKDg9WmTRu9+eabkgpOib311lslSV27dnU9X9asWSOp4LTRf/zjH/r222/VoUMHBQYG6p133nEtO/l7VCgrK0v33Xef6tSpo+DgYA0dOrTI/hZ3Hd+p2zxbbcVds5WQkKDhw4crNDRUAQEBuvzyy/X++++7jTl06JBsNptee+01zZ07V02bNpW/v7+uuuoqbd68udh+A0BJcWQLAMpBfHy8rrnmGtlsNo0ePVr16tXTN998o+HDhystLU2PPPKI2/hXXnlFXl5eevzxx5WamqqpU6dqyJAhbtdBzZ49W6NHj1bnzp316KOP6tChQ7rppptUq1YtXXzxxZKkli1batKkSRo/frxGjhypzp07S5L+/ve/u7aTnJysPn366JZbbtHAgQP13//+V0899ZTatGmjvn37lnqfq1evrptvvlnvvfeedu/erdatWxcZc9999+miiy7Syy+/rIcfflhXXXWVQkNDJUktWrTQ3LlzNWnSJEVERKhp06aSpFWrVqlv375q3769nn/+eXl5eWn+/Pnq1q2bfvjhB1199dVuj3HrrbeqWbNmevnll12h76WXXtJzzz2ngQMH6t5771ViYqJmzpyp6667Ttu2bXM7mlaS/jgcDv3jH//QypUrNWjQII0ZM0bp6emKiorSzp07XbXfd999WrBgge6++249/PDDiomJ0VtvvaVt27Zp3bp153Uk6s4779TcuXO1YsUK9ezZs9gxUVFRuv3229W9e3dNmTJFkrRnzx6tW7dOY8aM0XXXXaeHH35YM2bM0P/93/+pZcuWkuT6KhWcLnj77bfrvvvu04gRI9SiRYsz1jV69GiFhIRowoQJ2rt3r2bPnq3Dhw+7/rBQUiWp7WTZ2dnq0qWLDhw4oNGjRysiIkKLFy/WXXfdpZSUFI0ZM8Zt/KJFi5Senq777rtPNptNU6dO1S233KLffvvN40cIAVzADADgvMyfP99IMps3bz7tmOHDh5sGDRqY48ePu80fNGiQqVmzpsnKyjLGGLN69WojybRs2dLk5ua6xr355ptGktmxY4cxxpjc3FxTp04dc9VVVxm73e4at2DBAiPJXH/99a55mzdvNpLM/Pnzi9R1/fXXG0nmgw8+cM3Lzc01YWFhZsCAAWfd98aNG5v+/fufdvkbb7xhJJkvv/zSNU+Sef75513Thfu8ePFit3WL66vT6TTNmjUzvXv3Nk6n0zU/KyvLREREmJ49e7rmPf/880aSuf322922e+jQIePt7W1eeuklt/k7duwwPj4+bvNL2p958+YZSWbatGlFelBY5w8//GAkmYULF7otX758ebHzT1W4P4mJicUuT05ONpLMzTff7Jo3bNgw07hxY9f0mDFjTHBwsMnPzz/t4yxevNhIMqtXry6yrHHjxkaSWb58ebHLhg0b5pou/P61b9/e5OXlueZPnTr1rM+J023zTLVdf/31bs/76dOnG0nmww8/dM3Ly8szkZGRpnr16iYtLc0YY0xMTIyRZOrUqWOSkpJcY7/88ksjyXz99ddFHgsASorTCAHAw4wx+uyzz3TDDTfIGKPjx4+7/vXu3Vupqan6+eef3da5++673a5BKTwi9dtvv0mStmzZohMnTmjEiBFuN5sYMmSIatWqdU71Va9e3e2aKz8/P1199dWuxzof1atXl1Rw44yyEB0drf3792vw4ME6ceKEq4+ZmZnq3r271q5dW+SGEPfff7/b9JIlS+R0OjVw4EC370VYWJiaNWum1atXF9mHs/Xns88+U926dfXQQw8Vqbnw6M3ixYtVs2ZN9ezZ0+1x27dvr+rVqxd53HNVkl6HhIQoMzPT7VTDcxUREaHevXuXePzIkSPdjgw98MAD8vHx0bJly0pdQ0ksW7ZMYWFhuv32213zfH199fDDDysjI0Pff/+92/jbbrvN7Wfn1J85ACgNTiMEAA9LTExUSkqK5s6dq7lz5xY7pvBmEIUaNWrkNl34JrDwWpfDhw9Lki655BK3cT4+Puf8uUoXX3xxkdO5atWqpe3bt5/TdoqTkZEhSapRo8Z5b0uS9u/fL0mu67mKk5qa6vamOSIiosg2jDFq1qxZseufespYSfpz8OBBtWjRwi34Fld7amqq6tevX+zyU58D56okvX7wwQf16aefqm/fvrrooovUq1cvDRw4UH369Cnx45zaz7M5tc/Vq1dXgwYNPH779sOHD6tZs2ZF7pBYeNph4c9QobP9zAFAaRC2AMDDCo+03HHHHacNCW3btnWb9vb2LnacOelGE2XFk4+1c+dOSUVDYWkV9vLVV1897W3sC4/wFAoMDCyyDZvNpm+++abYfT91/bLqj9PpVP369bVw4cJil9erV++ctneqkvS6fv36io6O1rfffqtvvvlG33zzjebPn6+hQ4cWuXHE6ZzaT09yOBzl9ljl+TMHoOogbAGAh9WrV081atSQw+Eos8+Laty4sSTpwIED6tq1q2t+fn6+Dh065BbezuUmBGUpIyNDn3/+uRo2bHjamxicq8IbTQQHB5e6l02bNpUxRhEREWrevHmZ1bVx40bZ7fbT3kyhadOm+u6773Tttdd6JLD85z//kaSznuLn5+enG264QTfccIOcTqcefPBBvfPOO3ruued0ySWXlPnzZf/+/W7P0YyMDB07dkz9+vVzzatVq5ZSUlLc1svLy9OxY8fc5p1LbY0bN9b27dvldDrdjm79+uuvruUA4GlcswUAHubt7a0BAwbos88+cx19OFliYuI5b7NDhw6qU6eO3n33XeXn57vmL1y4sMhpT4WfK3Xqm1lPys7O1p133qmkpCQ988wzZfYGvn379mratKlee+0112lzJytJL2+55RZ5e3tr4sSJRY5aGGN04sSJc65rwIABOn78uN56660iywofY+DAgXI4HHrhhReKjMnPzz+v78+iRYv073//W5GRkerevftpx526b15eXq5gnpubK6nsny9z586V3W53Tc+ePVv5+flud7ps2rSp1q5dW2S9U49snUtt/fr1U1xcnD755BPXvPz8fM2cOVPVq1d3feQAAHgSR7YAoIzMmzdPy5cvLzJ/zJgxeuWVV7R69Wp17NhRI0aMUKtWrZSUlKSff/5Z3333nZKSks7psfz8/DRhwgQ99NBD6tatmwYOHKhDhw5pwYIFatq0qVu4adq0qUJCQjRnzhzVqFFD1apVU8eOHc/52pvTOXLkiD788ENJBUctdu/ercWLFysuLk6PPfaY7rvvvjJ5HKkgHPz73/9W37591bp1a91999266KKLdOTIEa1evVrBwcH6+uuvz7iNpk2b6sUXX9S4ceNct8uvUaOGYmJi9Pnnn2vkyJF6/PHHz6muoUOH6oMPPtDYsWO1adMmde7cWZmZmfruu+/04IMP6sYbb9T111+v++67T5MnT1Z0dLR69eolX19f7d+/X4sXL9abb76pf/3rX2d9rP/+97+qXr268vLydOTIEX377bdat26dLr/8ci1evPiM6957771KSkpSt27ddPHFF+vw4cOaOXOm2rVr5zr62K5dO3l7e2vKlClKTU2Vv7+/unXrdtprzc4mLy9P3bt318CBA7V37169/fbb6tSpk/75z3+61XX//fdrwIAB6tmzp3755Rd9++23bh/efK61jRw5Uu+8847uuusubd26VU2aNNF///tfrVu3TtOnTy+z6wgB4EwIWwBQRmbPnl3s/LvuuksXX3yxNm3apEmTJmnJkiV6++23VadOHbVu3dr1eUfnavTo0TLG6PXXX9fjjz+uyy+/XF999ZUefvhhBQQEuMb5+vrq/fff17hx43T//fcrPz9f8+fPL7OwFR0drTvvvFM2m001atRQw4YNdcMNN+jee+8t8plXZaFLly7asGGDXnjhBb311lvKyMhQWFiYOnbsWOJg9/TTT6t58+Z64403NHHiRElSw4YN1atXL7cQUFLe3t5atmyZXnrpJS1atEifffaZ6tSpo06dOqlNmzaucXPmzFH79u31zjvv6P/+7/9cNzS54447dO2115bosR544AFJUkBAgOrWrat27dpp3rx5Gjx4sPz9/c+47h133KG5c+fq7bffVkpKisLCwnTbbbdpwoQJrlPtwsLCNGfOHE2ePFnDhw+Xw+HQ6tWrSx223nrrLS1cuFDjx4+X3W7X7bffrhkzZrj9QWDEiBGKiYnRe++9p+XLl6tz586KiooqcpTuXGoLDAzUmjVr9PTTT+v9999XWlqaWrRoofnz5xf74csA4Ak2w5WfAHDBcDqdqlevnm655Ra9++67VpcDAECVxjVbAFBJ5eTkFLnm6IMPPlBSUpK6dOliTVEAAMCFI1sAUEmtWbNGjz76qG699VbVqVNHP//8s9577z21bNlSW7dudftQZAAAUP64ZgsAKqkmTZqoYcOGmjFjhpKSklS7dm0NHTpUr7zyCkELAIAKgCNbAAAAAOABXLMFAAAAAB5A2AIAAAAAD+CarRJyOp06evSoatSo4fbZIAAAAACqFmOM0tPTFR4e7vqcwuIQtkro6NGjatiwodVlAAAAAKggfv/9d1188cWnXU7YKqEaNWpIKmhocHCwxdW4s9vtWrFihXr16iVfX1+ry6ly6L916L116L116L216L916L116H1RaWlpatiwoSsjnA5hq4QKTx0MDg6ukGErKChIwcHB/ABYgP5bh95bh95bh95bi/5bh95bh96f3tkuL+IGGQAAAADgAYQtAAAAAPAAwhYAAAAAeABhCwAAAAA8gLAFAAAAAB5gadhau3atbrjhBoWHh8tms+mLL74oMmbPnj365z//qZo1a6patWq66qqrFBsb61qek5OjUaNGqU6dOqpevboGDBig+Ph4t23Exsaqf//+CgoKUv369fXEE08oPz/f07sHAAAAoAqzNGxlZmbq8ssv16xZs4pdfvDgQXXq1EmXXnqp1qxZo+3bt+u5555TQECAa8yjjz6qr7/+WosXL9b333+vo0eP6pZbbnEtdzgc6t+/v/Ly8rR+/Xq9//77WrBggcaPH+/x/QMAAABQdVn6OVt9+/ZV3759T7v8mWeeUb9+/TR16lTXvKZNm7r+n5qaqvfee0+LFi1St27dJEnz589Xy5Yt9dNPP+maa67RihUrtHv3bn333XcKDQ1Vu3bt9MILL+ipp57ShAkT5Ofn57kdBAAAAFBlVdgPNXY6nfrf//6nJ598Ur1799a2bdsUERGhcePG6aabbpIkbd26VXa7XT169HCtd+mll6pRo0basGGDrrnmGm3YsEFt2rRRaGioa0zv3r31wAMPaNeuXbriiiuKffzc3Fzl5ua6ptPS0iQVfKib3W73wB6XXmE9Fa2uqoL+W4feW4feW4feW4v+W4feW4feF1XSXlTYsJWQkKCMjAy98sorevHFFzVlyhQtX75ct9xyi1avXq3rr79ecXFx8vPzU0hIiNu6oaGhiouLkyTFxcW5Ba3C5YXLTmfy5MmaOHFikfkrVqxQUFDQee6dZ0RFRVldQpVG/61D761D761D761F/61D761D7/+SlZVVonEVNmw5nU5J0o033qhHH31UktSuXTutX79ec+bM0fXXX+/Rxx83bpzGjh3rmk5LS1PDhg3Vq1cvBQcHe/Sxz5XdbldUVJR69uwpX19fq8upcui/dei9dei9dei9tei/dei9deh9UYVnvZ1NhQ1bdevWlY+Pj1q1auU2v2XLlvrxxx8lSWFhYcrLy1NKSorb0a34+HiFhYW5xmzatMltG4V3KywcUxx/f3/5+/sXme/r61thn2QVubaqgP5bh95bh95bh95bi/5bh95bh97/paR9qLCfs+Xn56errrpKe/fudZu/b98+NW7cWJLUvn17+fr6auXKla7le/fuVWxsrCIjIyVJkZGR2rFjhxISElxjoqKiFBwcXCTIAQAAAEBZsfTIVkZGhg4cOOCajomJUXR0tGrXrq1GjRrpiSee0G233abrrrtOXbt21fLly/X1119rzZo1kqSaNWtq+PDhGjt2rGrXrq3g4GA99NBDioyM1DXXXCNJ6tWrl1q1aqU777xTU6dOVVxcnJ599lmNGjWq2CNXAAAAAFAWLA1bW7ZsUdeuXV3ThddIDRs2TAsWLNDNN9+sOXPmaPLkyXr44YfVokULffbZZ+rUqZNrnTfeeENeXl4aMGCAcnNz1bt3b7399tuu5d7e3lq6dKkeeOABRUZGqlq1aho2bJgmTZpUfjsKAAAAoMqxNGx16dJFxpgzjrnnnnt0zz33nHZ5QECAZs2addoPRpakxo0ba9myZaWuEwAAAADOVYW9ZgsAAAAAKjPCFgAAAAB4AGELAAAAADyAsAWg0kpOTnb7CgAAUJEQtgBUWikpKW5fAQAAKhLCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYAgAAAAAPIGwBAAAAgAcQtgAAAADAAwhbAAAAAOABhC0AAAAA8ADCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYAgAAAAAPIGwBAAAAgAcQtgAAAADAAwhbAAAAAOABhC0AAAAA8ADCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYAgAAAAAPIGwBAAAAgAcQtgAAAADAAwhbAAAAAOABhC0AAAAA8ADCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYAgAAAAAPIGwBAAAAgAcQtgAAAADAAwhbAAAAAOABhC0AAAAA8ADCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYAgAAAAAPIGwBAAAAgAcQtgAAAADAAwhbAAAAAOABhC0AAAAA8ABLw9batWt1ww03KDw8XDabTV988cVpx95///2y2WyaPn262/ykpCQNGTJEwcHBCgkJ0fDhw5WRkeE2Zvv27ercubMCAgLUsGFDTZ061QN7AwAAAAB/sTRsZWZm6vLLL9esWbPOOO7zzz/XTz/9pPDw8CLLhgwZol27dikqKkpLly7V2rVrNXLkSNfytLQ09erVS40bN9bWrVv16quvasKECZo7d26Z7w8AAAAAFPKx8sH79u2rvn37nnHMkSNH9NBDD+nbb79V//793Zbt2bNHy5cv1+bNm9WhQwdJ0syZM9WvXz+99tprCg8P18KFC5WXl6d58+bJz89PrVu3VnR0tKZNm+YWygAAAACgLFkats7G6XTqzjvv1BNPPKHWrVsXWb5hwwaFhIS4gpYk9ejRQ15eXtq4caNuvvlmbdiwQdddd538/PxcY3r37q0pU6YoOTlZtWrVKvaxc3NzlZub65pOS0uTJNntdtnt9rLaxTJRWE9Fq6uqoP/WcTgcrq/0v3zxvLcOvbcW/bcOvbcOvS+qpL2o0GFrypQp8vHx0cMPP1zs8ri4ONWvX99tno+Pj2rXrq24uDjXmIiICLcxoaGhrmWnC1uTJ0/WxIkTi8xfsWKFgoKCznlfykNUVJTVJVRp9N86+/bt0759+6wuo0rieW8dem8t+m8dem8dev+XrKysEo2rsGFr69atevPNN/Xzzz/LZrOV++OPGzdOY8eOdU2npaWpYcOG6tWrl4KDg8u9njOx2+2KiopSz5495evra3U5VQ79t86BAwe0b98+NW/eXJdcconV5VQpPO+tQ++tRf+tQ++tQ++LKjzr7WwqbNj64YcflJCQoEaNGrnmORwOPfbYY5o+fboOHTqksLAwJSQkuK2Xn5+vpKQkhYWFSZLCwsIUHx/vNqZwunBMcfz9/eXv719kvq+vb4V9klXk2qoC+l/+vL29XV/pvTV43luH3luL/luH3luH3v+lpH2osJ+zdeedd2r79u2Kjo52/QsPD9cTTzyhb7/9VpIUGRmplJQUbd261bXeqlWr5HQ61bFjR9eYtWvXup1XGRUVpRYtWpz2FEIAAAAAOF+WHtnKyMjQgQMHXNMxMTGKjo5W7dq11ahRI9WpU8dtvK+vr8LCwtSiRQtJUsuWLdWnTx+NGDFCc+bMkd1u1+jRozVo0CDXbeIHDx6siRMnavjw4Xrqqae0c+dOvfnmm3rjjTfKb0cBAAAAVDmWhq0tW7aoa9eurunCa6SGDRumBQsWlGgbCxcu1OjRo9W9e3d5eXlpwIABmjFjhmt5zZo1tWLFCo0aNUrt27dX3bp1NX78eG77DgAAAMCjLA1bXbp0kTGmxOMPHTpUZF7t2rW1aNGiM67Xtm1b/fDDD+daHgAAAACUWoW9ZgsAAAAAKjPCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYAgAAAAAPIGwBAAAAgAcQtgAAAADAAwhbAAAAAOABhC0AAAAA8ADCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYAgAAAAAPIGwBAAAAgAcQtgAAAADAAwhbAAAAAOABhC0AAAAA8ADCFoBKKzU11e0rAABARULYAlBppaWluX0FAACoSAhbAAAAAOABhC0AAAAA8ADCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYAgAAAAAPIGwBAAAAgAcQtgAAAADAAwhbAAAAAOABhC0AAAAA8ADCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYAgAAAAAPIGwBAAAAgAcQtgAAAADAAwhbAAAAAOABhC0AAAAA8ADCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYAgAAAAAPIGwBAAAAgAcQtgAAAADAAwhbAAAAAOABhC0AAAAA8ADCFgAAAAB4gKVha+3atbrhhhsUHh4um82mL774wrXMbrfrqaeeUps2bVStWjWFh4dr6NChOnr0qNs2kpKSNGTIEAUHByskJETDhw9XRkaG25jt27erc+fOCggIUMOGDTV16tTy2D0AAAAAVZilYSszM1OXX365Zs2aVWRZVlaWfv75Zz333HP6+eeftWTJEu3du1f//Oc/3cYNGTJEu3btUlRUlJYuXaq1a9dq5MiRruVpaWnq1auXGjdurK1bt+rVV1/VhAkTNHfuXI/vHwAAAICqy8fKB+/bt6/69u1b7LKaNWsqKirKbd5bb72lq6++WrGxsWrUqJH27Nmj5cuXa/PmzerQoYMkaebMmerXr59ee+01hYeHa+HChcrLy9O8efPk5+en1q1bKzo6WtOmTXMLZQAAAABQliwNW+cqNTVVNptNISEhkqQNGzYoJCTEFbQkqUePHvLy8tLGjRt18803a8OGDbruuuvk5+fnGtO7d29NmTJFycnJqlWrVrGPlZubq9zcXNd0WlqapILTG+12uwf2rvQK66lodVUV9N86xhjXV/pfvnjeW4feW4v+W4feW4feF1XSXlSasJWTk6OnnnpKt99+u4KDgyVJcXFxql+/vts4Hx8f1a5dW3Fxca4xERERbmNCQ0Ndy04XtiZPnqyJEycWmb9ixQoFBQWd9/54wqlHAlG+6L91MjMztWzZMqvLqJJ43luH3luL/luH3luH3v8lKyurROMqRdiy2+0aOHCgjDGaPXt2uTzmuHHjNHbsWNd0WlqaGjZsqF69ernCXkVht9sVFRWlnj17ytfX1+pyqhz6b53vv/9emZmZqlatmq6//nqry6lSeN5bh95bi/5bh95bh94XVXjW29lU+LBVGLQOHz6sVatWuQWdsLAwJSQkuI3Pz89XUlKSwsLCXGPi4+PdxhROF44pjr+/v/z9/YvM9/X1rbBPsopcW1VA/8ufzWZzfaX31uB5bx16by36bx16bx16/5eS9qFCf85WYdDav3+/vvvuO9WpU8dteWRkpFJSUrR161bXvFWrVsnpdKpjx46uMWvXrnU7rzIqKkotWrQ47SmEAAAAAHC+LA1bGRkZio6OVnR0tCQpJiZG0dHRio2Nld1u17/+9S9t2bJFCxculMPhUFxcnOLi4pSXlydJatmypfr06aMRI0Zo06ZNWrdunUaPHq1BgwYpPDxckjR48GD5+flp+PDh2rVrlz755BO9+eabbqcIAgAAAEBZs/Q0wi1btqhr166u6cIANGzYME2YMEFfffWVJKldu3Zu661evVpdunSRJC1cuFCjR49W9+7d5eXlpQEDBmjGjBmusTVr1tSKFSs0atQotW/fXnXr1tX48eO57TsAAAAAj7I0bHXp0sV16+binGlZodq1a2vRokVnHNO2bVv98MMP51wfAAAAAJRWhb5mCwAAAAAqK8IWAAAAAHgAYQsAAAAAPICwBQAAAAAeQNgCAAAAAA8gbAEAAACABxC2AAAAAMADCFsAAAAA4AGELQAAAADwAMIWAAAAAHgAYQsAAAAAPICwBQAAAAAeQNgCAAAAAA8gbAEAAACABxC2AAAAAMADCFsAAAAA4AGELQAAAADwAMIWAAAAAHgAYQsAAAAAPICwBaDSSk9Pd/sKAABQkRC2AFRaGRkZbl8BAAAqEsIWAAAAAHgAYQsAAAAAPICwBQAAAAAeQNgCAAAAAA8gbAEAAACABxC2AAAAAMADCFsAAAAA4AGELQAAAADwAMIWAAAAAHgAYQsAAAAAPICwBQAAAAAeQNgCAAAAAA8gbAEAAACABxC2AAAAAMADCFsAAAAA4AGELQAAAADwAMIWAAAAAHgAYQsAAAAAPICwBQAAAAAeQNgCAAAAAA8gbAEAAACABxC2AAAAAMADCFsAAAAA4AGELQAAAADwAEvD1tq1a3XDDTcoPDxcNptNX3zxhdtyY4zGjx+vBg0aKDAwUD169ND+/fvdxiQlJWnIkCEKDg5WSEiIhg8froyMDLcx27dvV+fOnRUQEKCGDRtq6tSpnt41AAAAAFWcpWErMzNTl19+uWbNmlXs8qlTp2rGjBmaM2eONm7cqGrVqql3797KyclxjRkyZIh27dqlqKgoLV26VGvXrtXIkSNdy9PS0tSrVy81btxYW7du1auvvqoJEyZo7ty5Ht8/AAAAAFWXj5UP3rdvX/Xt27fYZcYYTZ8+Xc8++6xuvPFGSdIHH3yg0NBQffHFFxo0aJD27Nmj5cuXa/PmzerQoYMkaebMmerXr59ee+01hYeHa+HChcrLy9O8efPk5+en1q1bKzo6WtOmTXMLZQAAAABQliwNW2cSExOjuLg49ejRwzWvZs2a6tixozZs2KBBgwZpw4YNCgkJcQUtSerRo4e8vLy0ceNG3XzzzdqwYYOuu+46+fn5ucb07t1bU6ZMUXJysmrVqlXs4+fm5io3N9c1nZaWJkmy2+2y2+1lvbvnpbCeilZXVUH/Kwb6X7543luH3luL/luH3luH3hdV0l5U2LAVFxcnSQoNDXWbHxoa6loWFxen+vXruy338fFR7dq13cZEREQU2UbhstOFrcmTJ2vixIlF5q9YsUJBQUGl2CPPi4qKsrqEKo3+l78aNWq4vi5btsziaqomnvfWoffWov/WoffWofd/ycrKKtG4Chu2rDZu3DiNHTvWNZ2WlqaGDRuqV69eCg4OtrCyoux2u6KiotSzZ0/5+vpaXU6VQ/+tM3/+fIWGhio+Pl5333231eVUKTzvrUPvrUX/rUPvrUPviyo86+1sKmzYCgsLkyTFx8erQYMGrvnx8fFq166da0xCQoLbevn5+UpKSnKtHxYWpvj4eLcxhdOFY4rj7+8vf3//IvN9fX0r7JOsItdWFdD/8peRkaHQ0FBlZGTQe4vwvLcOvbcW/bcOvbcOvf9LSftQYT9nKyIiQmFhYVq5cqVrXlpamjZu3KjIyEhJUmRkpFJSUrR161bXmFWrVsnpdKpjx46uMWvXrnU7rzIqKkotWrQ47SmEAAAAAHC+LA1bGRkZio6OVnR0tKSCm2JER0crNjZWNptNjzzyiF588UV99dVX2rFjh4YOHarw8HDddNNNkqSWLVuqT58+GjFihDZt2qR169Zp9OjRGjRokMLDwyVJgwcPlp+fn4YPH65du3bpk08+0Ztvvul2iiAAAAAAlDVLTyPcsmWLunbt6pouDEDDhg3TggUL9OSTTyozM1MjR45USkqKOnXqpOXLlysgIMC1zsKFCzV69Gh1795dXl5eGjBggGbMmOFaXrNmTa1YsUKjRo1S+/btVbduXY0fP57bvgMAAADwKEvDVpcuXWSMOe1ym82mSZMmadKkSacdU7t2bS1atOiMj9O2bVv98MMPpa4TAAAAAM5Vhb1mCwAAAAAqM8IWAAAAAHgAYQsAAAAAPICwBQAAAAAeQNgCAAAAAA8gbAEAAACABxC2AAAAAMADCFsAAAAA4AGELQAAAADwAMIWAAAAAHhAqcLWb7/9VtZ1AAAAAMAFpVRh65JLLlHXrl314YcfKicnp6xrAgAAAIBKr1Rh6+eff1bbtm01duxYhYWF6b777tOmTZvKujYAAAAAqLRKFbbatWunN998U0ePHtW8efN07NgxderUSZdddpmmTZumxMTEsq4TAAAAACqV87pBho+Pj2655RYtXrxYU6ZM0YEDB/T444+rYcOGGjp0qI4dO1ZWdQIAAABApXJeYWvLli168MEH1aBBA02bNk2PP/64Dh48qKioKB09elQ33nhjWdUJAAAAAJWKT2lWmjZtmubPn6+9e/eqX79++uCDD9SvXz95eRVkt4iICC1YsEBNmjQpy1oBAAAAoNIoVdiaPXu27rnnHt11111q0KBBsWPq16+v995777yKAwAAAIDKqlRha//+/Wcd4+fnp2HDhpVm8wAAAABQ6ZXqmq358+dr8eLFReYvXrxY77///nkXBQAAAACVXanC1uTJk1W3bt0i8+vXr6+XX375vIsCAAAAgMquVGErNjZWERERReY3btxYsbGx510UAAAAAFR2pQpb9evX1/bt24vM/+WXX1SnTp3zLgoAAAAAKrtSha3bb79dDz/8sFavXi2HwyGHw6FVq1ZpzJgxGjRoUFnXCAAAAACVTqnuRvjCCy/o0KFD6t69u3x8CjbhdDo1dOhQrtkCAAAAAJUybPn5+emTTz7RCy+8oF9++UWBgYFq06aNGjduXNb1AQAAAEClVKqwVah58+Zq3rx5WdUCAAAAABeMUoUth8OhBQsWaOXKlUpISJDT6XRbvmrVqjIpDgAAAAAqq1KFrTFjxmjBggXq37+/LrvsMtlstrKuCwAAAAAqtVKFrY8//liffvqp+vXrV9b1AAAAAMAFoVS3fvfz89Mll1xS1rUAAAAAwAWjVGHrscce05tvviljTFnXAwAAAAAXhFKdRvjjjz9q9erV+uabb9S6dWv5+vq6LV+yZEmZFAcAJZGZmWl1CQAAAEWUKmyFhITo5ptvLutaAOCcFIas/375P91///2qV6+exRUBAAD8pVRha/78+WVdBwCcs9zcXElSjt2ptLQ0whYAAKhQSnXNliTl5+fru+++0zvvvKP09HRJ0tGjR5WRkVFmxQEAAABAZVWqI1uHDx9Wnz59FBsbq9zcXPXs2VM1atTQlClTlJubqzlz5pR1nQAAAABQqZTqyNaYMWPUoUMHJScnKzAw0DX/5ptv1sqVK8usOAAAAACorEp1ZOuHH37Q+vXr5efn5za/SZMmOnLkSJkUBgAAAACVWamObDmdTjkcjiLz//jjD9WoUeO8iwIAAACAyq5UYatXr16aPn26a9pmsykjI0PPP/+8+vXrV1a1AQAAAEClVarTCF9//XX17t1brVq1Uk5OjgYPHqz9+/erbt26+uijj8q6RgAAAACodEoVti6++GL98ssv+vjjj7V9+3ZlZGRo+PDhGjJkiNsNMwAAAACgqipV2JIkHx8f3XHHHWVZCwAAAABcMEoVtj744IMzLh86dGipigEAAACAC0WpwtaYMWPcpu12u7KysuTn56egoKAyC1sOh0MTJkzQhx9+qLi4OIWHh+uuu+7Ss88+K5vNJkkyxuj555/Xu+++q5SUFF177bWaPXu2mjVr5tpOUlKSHnroIX399dfy8vLSgAED9Oabb6p69eplUicAAAAAnKpUdyNMTk52+5eRkaG9e/eqU6dOZXqDjClTpmj27Nl66623tGfPHk2ZMkVTp07VzJkzXWOmTp2qGTNmaM6cOdq4caOqVaum3r17KycnxzVmyJAh2rVrl6KiorR06VKtXbtWI0eOLLM6AQAAAOBUpb5m61TNmjXTK6+8ojvuuEO//vprmWxz/fr1uvHGG9W/f39JBR+a/NFHH2nTpk2SCo5qTZ8+Xc8++6xuvPFGSQWnOIaGhuqLL77QoEGDtGfPHi1fvlybN29Whw4dJEkzZ85Uv3799Nprryk8PLxMagUAAACAk5VZ2JIKbppx9OjRMtve3//+d82dO1f79u1T8+bN9csvv+jHH3/UtGnTJEkxMTGKi4tTjx49XOvUrFlTHTt21IYNGzRo0CBt2LBBISEhrqAlST169JCXl5c2btyom2++udjHzs3NVW5urms6LS1NUsEpk3a7vcz2sSwU1lPR6qoq6L91vLwKDs77+/vJ4XDwPShHPO+tQ++tRf+tQ++tQ++LKmkvShW2vvrqK7dpY4yOHTumt956S9dee21pNlmsp59+Wmlpabr00kvl7e0th8Ohl156SUOGDJEkxcXFSZJCQ0Pd1gsNDXUti4uLU/369d2W+/j4qHbt2q4xxZk8ebImTpxYZP6KFSsUFBR0XvvlKVFRUVaXUKXR//LXvn17SdILzzyhPXv2aM+ePRZXVPXwvLcOvbcW/bcOvbcOvf9LVlZWicaVKmzddNNNbtM2m0316tVTt27d9Prrr5dmk8X69NNPtXDhQi1atEitW7dWdHS0HnnkEYWHh2vYsGFl9jjFGTdunMaOHeuaTktLU8OGDdWrVy8FBwd79LHPld1uV1RUlHr27ClfX1+ry6ly6L91XnjhBbVv317PvfSq/vvhPEVERFhdUpXB89469N5a9N869N469L6owrPezqZUYcvpdJZmtXP2xBNP6Omnn9agQYMkSW3atNHhw4c1efJkDRs2TGFhYZKk+Ph4NWjQwLVefHy82rVrJ0kKCwtTQkKC23bz8/OVlJTkWr84/v7+8vf3LzLf19e3wj7JKnJtVQH9L3+Fr0W5uXny9vam/xbgeW8dem8t+m8dem8dev+XkvahVHcjLC9ZWVmuazIKeXt7u95gRUREKCwsTCtXrnQtT0tL08aNGxUZGSlJioyMVEpKirZu3eoas2rVKjmdTnXs2LEc9gIAAABAVVSqI1snn153NoU3syiNG264QS+99JIaNWqk1q1ba9u2bZo2bZruueceSQWnLz7yyCN68cUX1axZM0VEROi5555TeHi461THli1bqk+fPhoxYoTmzJkju92u0aNHa9CgQdyJELhAZKanKCUlxeoyAAAA3JQqbG3btk3btm2T3W5XixYtJEn79u2Tt7e3rrzySte4wg8eLq2ZM2fqueee04MPPqiEhASFh4frvvvu0/jx411jnnzySWVmZmrkyJFKSUlRp06dtHz5cgUEBLjGLFy4UKNHj1b37t1dH2o8Y8aM86oNQMWRlZ6i1NRUq8sAAABwU6qwdcMNN6hGjRp6//33VatWLUkFH3R89913q3PnznrsscfKpLgaNWpo+vTpmj59+mnH2Gw2TZo0SZMmTTrtmNq1a2vRokVlUhMAAAAAlESprtl6/fXXNXnyZFfQkqRatWrpxRdfLNO7EQIAAABAZVWqsJWWlqbExMQi8xMTE5Wenn7eRQEAAABAZVeqsHXzzTfr7rvv1pIlS/THH3/ojz/+0Geffabhw4frlltuKesaAaBYJf1AQQAAACuUKmzNmTNHffv21eDBg9W4cWM1btxYgwcPVp8+ffT222+XdY0AUERiYqL+t3yF1WUAAACcVqlukBEUFKS3335br776qg4ePChJatq0qapVq1amxQHA6aSlpSknzy5JMsbiYgAAAIpxXh9qfOzYMR07dkzNmjVTtWrVZHjHAwAAAACSShm2Tpw4oe7du6t58+bq16+fjh07JkkaPnx4md32HQAAAAAqs1KFrUcffVS+vr6KjY1VUFCQa/5tt92m5cuXl1lxAAAAAFBZleqarRUrVujbb7/VxRdf7Da/WbNmOnz4cJkUBgAAAACVWamObGVmZrod0SqUlJQkf3//8y4KAAAAACq7UoWtzp0764MPPnBN22w2OZ1OTZ06VV27di2z4gAAAACgsirVaYRTp05V9+7dtWXLFuXl5enJJ5/Url27lJSUpHXr1pV1jQAAAABQ6ZTqyNZll12mffv2qVOnTrrxxhuVmZmpW265Rdu2bVPTpk3LukYAAAAAqHTO+ciW3W5Xnz59NGfOHD3zzDOeqAkAAAAAKr1zPrLl6+ur7du3e6IWAAAAALhglOo0wjvuuEPvvfdeWdcCAAAAABeMUt0gIz8/X/PmzdN3332n9u3bq1q1am7Lp02bVibFAQAAAEBldU5h67ffflOTJk20c+dOXXnllZKkffv2uY2x2WxlVx0AAAAAVFLnFLaaNWumY8eOafXq1ZKk2267TTNmzFBoaKhHigMAAACAyuqcrtkyxrhNf/PNN8rMzCzTggAAAADgQlCqG2QUOjV8AQAAAAAKnFPYstlsRa7J4hotAAAAACjqnK7ZMsborrvukr+/vyQpJydH999/f5G7ES5ZsqTsKgSAs3Dk25WWlmZ1GQAAAG7OKWwNGzbMbfqOO+4o02IAoDSc+fnKyMiwugwAAAA35xS25s+f76k6AAAAAOCCcl43yAAAAAAAFI+wBQAAAAAeQNgCAAAAAA8gbAGo9IxxcoMMAABQ4RC2AFR6xhhlZmZaXQYAAIAbwhYAAAAAeABhCwAAAAA8gLAFAAAAAB5A2AIAAAAADyBsAQAAAIAHELYAVEopKSnKzc6xugwAAIDTImwBqJRSU1OVk0fYAgAAFRdhCwAAAAA8gLAFAAAAAB5A2AIAAAAADyBsAaiU0tPT5XQY13RWVpaF1QAAABRF2AJQKaWnp8vpdLimCVsAAKCiIWwBuCDs2rVLSUlJVpcBAADgQtgCcEHYvXu3kpOTrS4DAADAhbAF4ILgcDjOPggAAKAcVfiwdeTIEd1xxx2qU6eOAgMD1aZNG23ZssW13Bij8ePHq0GDBgoMDFSPHj20f/9+t20kJSVpyJAhCg4OVkhIiIYPH66MjIzy3hUAnuLjr6PH4hQTE2N1JQAAAC4VOmwlJyfr2muvla+vr7755hvt3r1br7/+umrVquUaM3XqVM2YMUNz5szRxo0bVa1aNfXu3Vs5OTmuMUOGDNGuXbsUFRWlpUuXau3atRo5cqQVuwTAE3x8lW+3Ky4uzupKAAAAXHysLuBMpkyZooYNG2r+/PmueREREa7/G2M0ffp0Pfvss7rxxhslSR988IFCQ0P1xRdfaNCgQdqzZ4+WL1+uzZs3q0OHDpKkmTNnql+/fnrttdcUHh5evjsFAAAAoEqo0GHrq6++Uu/evXXrrbfq+++/10UXXaQHH3xQI0aMkCTFxMQoLi5OPXr0cK1Ts2ZNdezYURs2bNCgQYO0YcMGhYSEuIKWJPXo0UNeXl7auHGjbr755mIfOzc3V7m5ua7ptLQ0SZLdbpfdbvfE7pZaYT0Vra6qgv5bJzAgoOCrv79sAf7KzMzk+1BOeN5bh95bi/5bh95bh94XVdJe2Iwx5uzDrBHw5xupsWPH6tZbb9XmzZs1ZswYzZkzR8OGDdP69et17bXX6ujRo2rQoIFrvYEDB8pms+mTTz7Ryy+/rPfff1979+5123b9+vU1ceJEPfDAA8U+9oQJEzRx4sQi8xctWqSgoKAy3EsAAAAAlUlWVpYGDx6s1NRUBQcHn3ZchT6y5XQ61aFDB7388suSpCuuuEI7d+50hS1PGjdunMaOHeuaTktLU8OGDdWrV68zNtQKdrtdUVFR6tmzp3x9fa0up8qh/9b45JNP9OjjT+nf77yte+4bpey0JL344ot66KGHrC6tSuB5bx16by36bx16bx16X1ThWW9nU6HDVoMGDdSqVSu3eS1bttRnn30mSQoLC5MkxcfHux3Zio+PV7t27VxjEhIS3LaRn5+vpKQk1/rF8ff3l7+/f5H5vr6+FfZJVpFrqwrof/nL/vNGONk5OcrOzpYxhu9BOeN5bx16by36bx16bx16/5eS9qFC343w2muvLXL63759+9S4cWNJBTfLCAsL08qVK13L09LStHHjRkVGRkqSIiMjlZKSoq1bt7rGrFq1Sk6nUx07diyHvQAAAABQFVXoI1uPPvqo/v73v+vll1/WwIEDtWnTJs2dO1dz586VJNlsNj3yyCN68cUX1axZM0VEROi5555TeHi4brrpJkkFR8L69OmjESNGaM6cObLb7Ro9erQGDRrEnQgBAAAAeEyFDltXXXWVPv/8c40bN06TJk1SRESEpk+friFDhrjGPPnkk8rMzNTIkSOVkpKiTp06afny5a6ba0jSwoULNXr0aHXv3l1eXl4aMGCAZsyYYcUuAQAAAKgiKnTYkqR//OMf+sc//nHa5TabTZMmTdKkSZNOO6Z27dpatGiRJ8oDAAAAgGJV6Gu2AKBkCj7BIisry+I6AAAA/kLYAlD5GcIWAACoeAhbAAAAAOABhC0AAAAA8ADCFoALBqcRAgCAioSwBaBSysjIkPPPa7VkjGx+QVq6/DslJiZaWxgAAMCfCFsAKqXMzMyTpoxsfgHKcUhpaWmW1QQAAHAywhaAC4IxTmWlpyolJcXqUgAAACQRtgBcKIxRdkaqUlNTra4EAABAEmELQCVVcBqhsboMAACA0yJsAaiUsrOzyVoAAKBCI2wBuCAY41S+3a6lS5cqKSnJ6nIAAAAIWwAqp+zsbPcZxsiZb9fq1auVnJxsTVEAAAAnIWwBqJRycnLkdh6hMTLGyOFwWFYTAADAyQhbAC4Mxkgyys/Pt7oSAAAASYQtAAAAAPAIwhYAAAAAeABhCwAAAAA8gLAFAAAAAB5A2AJwgSi4MyF3IwQAABUFYQvAhcEQtgAAQMVC2AJwQSFsAQCAioKwBeDCYIzkG6CExOM6ceKE1dUAAAAQtgBcKIzk46s8u11Hjx61uhgAAADCFoALiDFy5ucrIyPD6koAAAAIWwAqp+zsbKtLAAAAOCPCFoBKJzExUd+t/t59ppFkjIxxcmQLAABUCIQtAJVOWlqacvLsp8w1f4Yto/j4eEvqAgAAOBlhC8CFwxjZ/IL00X+/UGJiotXVAACAKo6wBeACYmTzC1C23am0tDSriwEAAFUcYQsAAAAAPICwBQAAAAAeQNgCAAAAAA8gbAEAAACABxC2AAAAAMADCFsAAAAA4AGELQAAAADwAMIWAAAAAHgAYQvABcRIkpxOp8V1AAAAELYAXEgMYQsAAFQchC0AAAAA8ADCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYAnDBcTjydeLECavLAAAAVVylCluvvPKKbDabHnnkEde8nJwcjRo1SnXq1FH16tU1YMAAxcfHu60XGxur/v37KygoSPXr19cTTzyh/Pz8cq4eQFk5fPiwMjMyil3mdOTpREKcRj3yuBITE8u5MgAAgL9UmrC1efNmvfPOO2rbtq3b/EcffVRff/21Fi9erO+//15Hjx7VLbfc4lrucDjUv39/5eXlaf369Xr//fe1YMECjR8/vrx3AUAZOXr0qPLycotf6HDKafNW7O+/KzY2tnwLAwAAOEmlCFsZGRkaMmSI3n33XdWqVcs1PzU1Ve+9956mTZumbt26qX379po/f77Wr1+vn376SZK0YsUK7d69Wx9++KHatWunvn376oUXXtCsWbOUl5dn1S4B8BgjGaP0lCSlpqZaXQwAAKjCfKwuoCRGjRql/v37q0ePHnrxxRdd87du3Sq73a4ePXq45l166aVq1KiRNmzYoGuuuUYbNmxQmzZtFBoa6hrTu3dvPfDAA9q1a5euuOKKYh8zNzdXubl//eU8LS1NkmS322W328t6F89LYT0Vra6qgv5bIzAwUAH+/gX/Dwgo+EBjm02yeUk+PvJ15istLY3vi4fwvLcOvbcW/bcOvbcOvS+qpL2o8GHr448/1s8//6zNmzcXWRYXFyc/Pz+FhIS4zQ8NDVVcXJxrzMlBq3B54bLTmTx5siZOnFhk/ooVKxQUFHSuu1EuoqKirC6hSqP/5adGjRpa9MEC1/S8d9857dhly5aVQ0VVF89769B7a9F/69B769D7v2RlZZVoXIUOW7///rvGjBmjqKgoBQQElOtjjxs3TmPHjnVNp6WlqWHDhurVq5eCg4PLtZazsdvtioqKUs+ePeXr62t1OVUO/S9/n3zyie4b9ZAC/P017913dM+I+5SdnV1wZEuSfPzklZetOXNm67bbbrO22AsUz3vr0Htr0X/r0Hvr0PuiCs96O5sKHba2bt2qhIQEXXnlla55DodDa9eu1VtvvaVvv/1WeXl5SklJcTu6FR8fr7CwMElSWFiYNm3a5LbdwrsVFo4pjr+/v/z/PEXpZL6+vhX2SVaRa6sK6H/5ys7OljGm4P85OaeELYe88rIlie+Jh/G8tw69txb9tw69tw69/0tJ+1Chb5DRvXt37dixQ9HR0a5/HTp00JAhQ1z/9/X11cqVK13r7N27V7GxsYqMjJQkRUZGaseOHUpISHCNiYqKUnBwsFq1alXu+wQAAACgaqjQR7Zq1Kihyy67zG1etWrVVKdOHdf84cOHa+zYsapdu7aCg4P10EMPKTIyUtdcc40kqVevXmrVqpXuvPNOTZ06VXFxcXr22Wc1atSoYo9cAQAAAEBZqNBhqyTeeOMNeXl5acCAAcrNzVXv3r319ttvu5Z7e3tr6dKleuCBBxQZGalq1app2LBhmjRpkoVVAwAAALjQVbqwtWbNGrfpgIAAzZo1S7NmzTrtOo0bN+aOZEAVY4wp8cWrAAAAnlChr9kCgFJxOiXfAM2aO0+JiYlWVwMAAKoowhaAC49xyOYXoLSsXI5uAQAAyxC2AFx4/rwlvNPptLgQAABQlRG2AFyQjHEqKz1VKSkpVpcCAACqKMIWgEonIyPD9YHGp2WMsjNSlZqaWj5FAQAAnKLS3Y0QADIzM886xhinHI58paenl0NFAAAARXFkC8CFyRg58+2ELQAAYBnCFoBKJyMjw+oSAAAAzoqwBaBSSUxM1MKPP5XOcskWAACA1QhbACqVtLQ0ZWRn6axpyxgZYziNEAAAWIawBaDSceSX4LCWMQW3f8/K8nxBAAAAxSBsAQAAAIAHELYAVCopKSnKzc62ugwAAICzImwBqFRSU1OVnZtTgpEFpxpyGiEAALAKYQvAhckQtgAAgLUIWwAuaLt27VJSUpLVZQAAgCqIsAXgwvTnka2dO3cqOTnZ4mIAAEBVRNgCcIEqCFt2u93iOgAAQFVF2AJwYTJG8vFXfEKifvvtN6urAQAAVRBhC0Clkp6eLqfDWbLBPr7Kz89XfHy8Z4sCAAAoBmELQKWSnp4up9NRssHGyBinMjIyPFsUAABAMQhbACqVjIwMOf+8+cVZGSMZo8zMTM8WBQAAUAzCFoBKheAEAAAqC8IWAAAAAHgAYQtApZKVlaXC27oDAABUZIQtAJXK8ePHyVoAAKBSIGwBqDQSExP15dJlIm0BAIDKgLAFoNJIS0tTdq79HNYoCGU//fSTkpKSPFMUAADAaRC2AFy4/rxF/A8//KCYmBiLiwEAAFUNYQvABS89PV2pqalWlwEAAKoYwhaAC54p6YcgAwAAlCHCFoALlzGSj59y8/KUkpJidTUAAKCKIWwBuIAVhC2Zws/nAgAAKD+ELQAAAADwAMIWgEojJSVFudnZ57yeMUZpaWkeqAgAAOD0CFsAKo3U1FRl5+ac20rGyOYXqDnvLVBiYqJnCgMAACgGYQvAhc0Y2XwDlJnn4OgWAAAoV4QtAJVGenq6nA7nOa5VcNt3p8NR9gUBAACcAWELQKWRnp4up/McQ5MxchqHUpMS9fHHHyspKckzxQEAAJyCsAWg0sjIyJCzNB9QbIwy01K1dOlSJScnl31hAAAAxSBsAag0MjMzrS4BAACgxAhbACqNgg8mLsWRLQAAAAsQtgBUGllZWaXKWsY45XTYlZ+fX/ZFAQAAnAZhC0ClkJSUpF27dp37isZIxsiRn0/YAgAA5YqwBaBSSE5O1vbt20uxpnH7AgAAUF4IWwAqhRMnTij++AmRmgAAQGVR4cPW5MmTddVVV6lGjRqqX7++brrpJu3du9dtTE5OjkaNGqU6deqoevXqGjBggOLj493GxMbGqn///goKClL9+vX1xBNPcEoRUIlkZGTIWdqXLGNkjOFnHgAAlKsKH7a+//57jRo1Sj/99JOioqJkt9vVq1cvt1tAP/roo/r666+1ePFiff/99zp69KhuueUW13KHw6H+/fsrLy9P69ev1/vvv68FCxZo/PjxVuwSgPJmjCQjh+McPxAZAADgPPhYXcDZLF++3G16wYIFql+/vrZu3arrrrtOqampeu+997Ro0SJ169ZNkjR//ny1bNlSP/30k6655hqtWLFCu3fv1nfffafQ0FC1a9dOL7zwgp566ilNmDBBfn5+VuwagHOQnp4up8N5XtsgbAEAgPJU4cPWqVJTUyVJtWvXliRt3bpVdrtdPXr0cI259NJL1ahRI23YsEHXXHONNmzYoDZt2ig0NNQ1pnfv3nrggQe0a9cuXXHFFUUeJzc3V7m5ua7ptLQ0SZLdbpfdbvfIvpVWYT0Vra6qgv6Xj7i4OPn6+crX17tghjEKDAiQpIKvxkg2218rnDxt85IC/HUiOVmJiYlq1KhROVd/4eF5bx16by36bx16bx16X1RJe2EzxlSaq82dTqf++c9/KiUlRT/++KMkadGiRbr77rvdgpEkXX311erataumTJmikSNH6vDhw/r2229dy7OyslStWjUtW7ZMffv2LfJYEyZM0MSJE4vMX7RokYKCgsp4zwAAAABUFllZWRo8eLBSU1MVHBx82nGV6sjWqFGjtHPnTlfQ8qRx48Zp7Nixrum0tDQ1bNhQvXr1OmNDrWC32xUVFaWePXvK19fX6nKqHPpfPmbOnKlnJ74omT9PJTRGgYGBmvfuO7pnxH3Kzs4+/ZEtSTa/APnJqf9+8pGuu+66cq7+wsPz3jr03lr03zr03jr0vqjCs97OptKErdGjR2vp0qVau3atLr74Ytf8sLAw5eXlKSUlRSEhIa758fHxCgsLc43ZtGmT2/YK71ZYOOZU/v7+8vf3LzLf19e3wj7JKnJtVQH995ykpCStW7dO2dlZf97sQm5hKjsn5+xhyyE55JDNZuP7VIZ43luH3luL/luH3luH3v+lpH2o8HcjNMZo9OjR+vzzz7Vq1SpFRES4LW/fvr18fX21cuVK17y9e/cqNjZWkZGRkqTIyEjt2LFDCQkJrjFRUVEKDg5Wq1atymdHAJTagQMHtDxq5Xl9xJYxTjny7SX+SxQAAMD5qvBHtkaNGqVFixbpyy+/VI0aNRQXFydJqlmzpgIDA1WzZk0NHz5cY8eOVe3atRUcHKyHHnpIkZGRuuaaayRJvXr1UqtWrXTnnXdq6tSpiouL07PPPqtRo0YVe/QKQMVy7Ngx5dkdOs+0JWd+vjIyMsqsLgAAgDOp8Ee2Zs+erdTUVHXp0kUNGjRw/fvkk09cY9544w394x//0IABA3TdddcpLCxMS5YscS339vbW0qVL5e3trcjISN1xxx0aOnSoJk2aZMUuAThHx44dU35+3vltxBg5nU6tWrVKSUlJZVMYAADAGVT4I1sluVliQECAZs2apVmzZp12TOPGjbVs2bKyLA1AOTn5Q8xLzTglGa1bt07Jycmuj48AAADwlAp/ZAsAyiZsFfzhhg82BgAA5YWwBaDCy87OPq/LtU5G2AIAAOWFsAWganA6JR9/HTl6TL/99pvV1QAAgCqAsAWgQktKStKuXbvKYEtG8vFVfn6+63P2AAAAPImwBaBCi4mJ0bp168pse8bp1IIFC3Tw4MEy2yYAAEBxCFsAKrTDhw8rJS1DZXbRlqTNmzfr8OHDZbY9AACA4hC2AFRoWVlZkpd3GW7RKDs7W0ePHi3DbQIAABRF2AJQoaWlpcmU3a0IJS8f2e12bd++vWy2CQAAcBqELQAVVmJiombP/bdK8NnmJWMckpe3bH5B+uzL/ykxMbGMNgwAAFAUYQtAhZWWlqb07DyV5fVakpHNL0A5joLtAwAAeAphC0CFlZKSooz01LLNWgAAAOWEsAWgwkpNTVVGerpIWwAAoDIibAGosNLT0+XId5T5do1xKis9VSkpKWW+bQAAgEKELQAVUlJSkr799ls5nWUftmSMsjNSlZqaqsTERG6UAQAAPIKwBaBCiomJ0ddffy1nmd2K8C/GOJVvt+vTTz/VbXcM0x1330vgAgAAZY6wBaBCSk1NVVJSkjxyvZYxctjz9PXXXys+KVVJ6VncmRAAAJQ5whaACik9PV35+fmeuTeGMZKMjh8/LntengceAAAAgLAFoII6duyY8vLK+jO2/uRwSF4+ysvLU05ubtlvHwAAQIQtABXUoUOHJJu3h7bulLx9JMkjdzsEAACQCFsAKqiUlBTJ21NhCwAAwPMIWwCqtOycbDny860uAwAAXIAIWwAqnKSkJO3atatcHisjPUNZ2dnl8lgAAKBqIWwBqHBWrlypnzZu8uyDOJ2Sl4/yHXYlHv1DMTExnn08AABQ5RC2AFQoP/30kx5+5DHlOz39SEby9pFxOpSSmqqRD4zWvn37PP2gAACgCiFsAagw9u3bp0FD7lTc8ePyzAdsFcMY2Xz8lJAQrz/++KN8HhMAAFQJPlYXAABSwXVac+bM0dH4xIJT/MqLMXI67MrNzdXRo0fL73EBAMAFjyNbACqE5ORkrV69Wvl2D32QcXGMkYyRcTiVb7crPj6+fB4XAABUCRzZAlBh5OTkyJhyClqS/gp1RpLR2rVrVaNGDf3rX/9S7dq1y7EOAABwISJsAbBcUlKSZs6cqQO/HSo42lSezF+nLK5bt07Jyclq3769li9frj59+hC6AABAqXEaIQDLJScna8WKFco3UrmdQljopLCVkZGhtLQ0LVmyRB988IGSk5PLtxYAAHBB4cgWAMudOHFCubm55X9U6xS5Tmnnrl3Kzc1VgwYNXPOTkpI40gUAAM4ZR7YAWGrfvn0aOnyEjlSIOwHa5LD5KOZwrI4cOaKUlBRJBUfePvroI450AQCAc8KRLQCWKDxalJaWppjDf8ieZ5e8LHpJMkaSl2ScsvkFypGfo9jYWL311luKjIxU+/btrakLAABUaoQtAJZITk7W22+/rbS0NOXl5f55qZZVpxEaydu74H9Oh/LzcpXv669Fiz7Sr7/+qtDQULcjXQAAACXBaYQALBETE6Nt23dpx44dksMheVWQl6P8fMnmLXn5KC8vV7Gxsdq3b58OHz6sw4cPW10dAACoRCrIuxsAVU1cXJzyHIV3AnSecWz5chYc5XI6JG8/HT16VC9OeVUpmbl65vkXtGfPHu3bt09z5sxRUlKS1cUCAIAKjNMIAZS7xMREHThwQPmOfKtLOT3j/PNom5/S0jJk8/PX4T+O6O6RD0jG6OD+vWratKkSExO5SyEAACgWYQtAudqzZ49GPPiQft21Q3I4C07Zq4iMUcFRLh/J6ZBxOmR3eGvXzh3yC6yu1OQkzZkzR8nJyfrtt99Uv359/etf/yJ0AQAAF8IWAI9LTEyUVHBTjJsHDtIfcYnKSjoheXm7bkxRYRV+6LHDIYfJU0Z6hnxy8+Rw2vTFl1+qebNm+t///qfAwEB17969SNgq3Pd69eqVd+UAAMBihC0AHrVnzx49OOYxyTh18w399PuRo8rOzpax+AOMS6wwbDnzZWw2SUb5f97QwykvxRyOVYOcHIWFhemrr77SsGHD5HA4XKvfcfe9kqSZ017Vli1bOOUQAIAqhLAFwGMSExM18sGHFL37VzlycrRp82ZlZ+cUBC2vCn5E61TGnBS8nJKM5OuvvLxsHTt2TIGBgXrnnXf066+/atXa9fKyGb00aYKS0rNkz8vTzp079dFHH6ljx46ELQAAqgjCFgCPiYmJUfzxZOVmZsphTMG1T8b55/VQldCpdTudMo585TrydezYMWVmZiom9g/l2wruZvjQmEcl/yClJSfr+RdeliM3SzExMa4ba0icXggAwIWMsAWgzCQmJio5OVlr1qxRTEyM5r3/oZLTMmTPy5VsNsk4Km/Qkgpqt3nL9eHLTodkK3gZTUlJK7j+zCFJ+bJ5+yghIV4+AdXktPkoLj5BKSnJGjjodt0x+HZt2vaLjv4eq3ffmaOIiAht2bJFHTt21MqVKyWp3G62cfDgQb300ku6//77dfXVV3v88QAAqEoIWwBK5GxHYvbt26ebB96u7Ix05WRl6MSJE8qTt+T8865+lThj/cW439DDOCXvPz+u0NgK7lyogtMNjT1PRjbl5eVKXnYdj0+VfHyVnJaut9+eLe+gYOWlJ2ngkKHy8ZKCqwWpUaNGiomJ0UUXXaTu3btLkpYvX37G67xO/r6c7v9n8ssvv2jR4s+149cDWvblZ675HHEDAOD8EbYAnFViYqLrRg8fzv+368388ePHlZKSovXr12vLli06EHNYzpxM5TsdUr5d8vH7ayPGFBzdulAUtz+mMFSaguW+/pIjX8rPl2x/LpeXHE6HHDnZkqT0zCyZnAylnPDSod+PyubtraTkZI0YMUJeXl76/ffflZycrMWLF6tnz5564IEHXMGr8PuSl5urFyc8p+cmvqi4Y0d1279u0ffrN8rX11fTX31F3t7e2rJlizp06KBatWrJ29tbn376qSIiIvThhx/K6eWr1MwcxcTE6Olnn1fcsSOa9+5cXXPNNeXZUQAALjhVKmzNmjVLr776quLi4nT55Zdr5syZnDaDKu1sRz8KA9XOnTu177dYVa8epJ9//lmNGjXSiAdG6+ctW5XnyJfyc+WQTfLyLQgW3j6S7OW4JxVEMdd0FcwrnG/+OhpmHJLNW8aRL9l85HQaydcm4+WtzIwMrf5hnZSfJ/kF6oknn1Z2Voa2bdumP/74QyEhIdq4caNiY2OVmJ6jvJxs3XrbYDl9/JWRFK/58+croFZ9ZWeka+g9I5WWmqx6tUOU7+WrtOQTuuP2QXrxlVclI2VnZ8o7MFh2e56OHTumPfv2KzEhQfeMfEDtLmupYcOG6corr5QkHT9+XJJUt25dhYSEuO1qUlKSPv30U3Xr1k3NmzeXxG3vAQCoMmHrk08+0dixYzVnzhx17NhR06dPV+/evbV3717Vr1/f6vKAMlHcm9ukpCS3U9FO/syrWwffqTp16mjW9Nfl7e2tr7/+WgkJCfLy8tLOnTu1ffdenTh+QnaHXfnyks04dNOtg+Qjp/KMt/LseQU5wmEKAoQzX/Ly+jNgeFnQgQrGOOR2/qQ55f/e3ieFrz+Phjny/7wu7M+jZkbKzs6RbD5Ky8zRnDlz5OUbIGe+vWCMr5/kZdOxhEx5+wXKlpejI0eOyCclS/bMVMXFJSgvI0mH/Pxk86um3JxsPffceDl9/QvCoJeXHI48/X7gV40YMULH07JkvLy0/9c9+nXvPi3+Yqnq1q4pL19fJSYmyhgpwMumK65op8cee0wDBgxQ69atlZycrA8++lQXhYcrpHqgnnrqKb274D+SpOmvviKpIKSdGrz27dunL7/8Up07d1bTpk2VnJzsNi1JBw4c0C+//KJu3bpJkttRuuJOnzx+/Hixj1WocHwhwiAAwFOqTNiaNm2aRowYobvvvluSNGfOHP3vf//TvHnz9PTTT1tcXeVT3Jv6c71e5GzbON2Yk8ee/Jf2k9c5df7Jb8AKnVznqU63jiS3N3KJiYmKj493zU9JSXEbW7juyds5ubaTp4urV5JSUlL0448/qnPnzjLGuN50Fn6WU+Hyyy67TFPfmCl7Xo5u7N9X119/vT777DNFR0crNTVVderUUfXq1fXUs88r6XiC/nXzTTpw6HcdPXJEPfr0V1JivHLzjYyckj1X8vaTfHwLCis8Pc7mJUd+XsFyX/8/5xeGhpNPqzMV/8OKy0NpbgZinH+FMJt3QWArvC5MXpLNW06ZglBrsxXcpMNIkk0Oe55kz5Ns3srPyij4IOacTMnLR3l5eZLxkmQKLqNz5P/1mPl2OfLzlXg8qeCopPFWvj1X8gtSvjGKSzgu2bz+rMlLGXlZ2hK9XZL03eq1+vrrr+Xt7S2Hb4AOHNgvGZuG3HGnQkIbSnnZuqZzF2VmZSk4KEB3DL5dzZo10xtvvKG2bdtqzboNSk/PVPUawbqsdUvlZGdp+86d8vHylrdxqHpIbZ1ITpLsuWp6aWvl52TJ39dHx1PSVb16Nb008Xm99c6/lRh3VD27d9OW6B06GHNYzZs11b9nv6W6deu6/YxJ0iNPPK283FzXPr044TnVq1dPq1atUkREhLZv3662bdtq+/btuvHGG1WrVq0i26hbt65bMDTGuH5Oa9as6Rpz6s/zyetLKjL/TArXKXzNKVRceDw1dJ7pte7k7Zy6zpm2ceq+Ffc6fGroPd1r8dn259T1T+7HybUUt72zbfN0+19apT2ie7rvUSFP/VHgbPtd0jMgTvfHlFWrVqlbt26uP46UtKaTH7Nw+tQj6kBlYDOV5pNFSy8vL09BQUH673//q5tuusk1f9iwYUpJSdGXX35ZZJ3c3Fzl5ua6plNTU10Xr9eoUaM8yj6tlJQULV68WFlZWeratauqV6+uAwcO6JJLLpH3KW9wU1NTtXHjRnXs2FE1a9Z0Tbdq1Uq7d+92zT/TOifPX716tbKzs7Vp2y9KT0nRc8+MU0hIiFatWqUNm7fJ28dHI+++U3MXfCgZo/uHD9O2bduUk5Oj7OxsxcXF6c4775TT6dSzE19UatJxtWh2ia688kq1bdtWb8x8W9VrVNPVV7RTdna2Vn6/ThlpyWrR7BK1atVKxhjFxsYqJCREq39Yp8zMHHn5eCuicSPVDq6mnJwc7f/tsDIyM2Rk5GOMqlevppp16uvIkaOqGRykPLtDuZkZiohoorjjSTL5dgXVrCVjz1VevkO+Xl7y8bbpeEqGJJtCagQqN98hR16ejJeXsrNz5O/nozohNZWb71RmVrbeePUVPf3sczqelCynMX9mDS8F+PjI6ZTynPnysxl5+QUoMytbNpvk5ciXt5+fjCSnMXI4jHyMQ/Xq1lFqWpZyHHYZFWzLOAqCjJeXpPw8BdYIUVZ2VsElQK4gJMnXW7I7pfwc+QQEKt+e7wpJBW/O/3yTbndIcha8sc53FLy5z88tuMbKmD+PUJ10dOXPOuRl+ytAmJMWS0WvYSqH6cCAAM2a+aZGPTRG2Tk55f74FW/a66/vndv3xyY57H+e3nm69U8ab/P685o7n4KZNpvkcPy53CY58xUYWE2zZk7XqIceUXZ2ZsH2CsO5bAXr+/oVnFbq5V2wruuonbPgqJrtz5uK2GwFz8ucTHkFVJPT6Sy4sYozX/L+c5v5dsnvz+3JSF4+BTV52SQfbynPXrAd3z/3Mf/Pn4PAIOXnG8nplM3bS4G+XnLKX7nZqbL5+8tpd8rLx1sBXlKW/a8Po5b5s0eOXAUGVVeOwyGp4GfQJpv8vLxkdzpktztl87LJ29um/Hwjm9dfY/x9fOTv663s3IKPByjutSHXYZdskrfNJqcxBZf6eXnJ7nQWtF6SI9/Iy8umQD9f+fr7y2kKjhbOmjVLsbGxcnr7KsDHW9l5duVkpqt2rVpKy85VZlaWArykjh07auPP22XysuQVEKT8rEzVCbtIITWqKTH+mIwxatiwoeKPJ+v4iUR5y6hF8+Y6Gp+o48nJqh0crKAAPx1PSpNx5KlW/TDZjEM1ggKVbTf6/Y9Y+fkGqG7tYDWNaKKGDRtqzQ8blJAYJx8vL415aLQ2bNig3377TSfSMuXt66eaQYHyDQxQndq1dPUV7WSz2ZSSkqKffvpJyRlZ8vf2kt1pVKNadb0wcbwaN26s5ORkPTfxRe3etUuyeale3VqqFxqunMx0DRr4L7099z057Xn65w39NWDAAEly+52VfOKEatWpo4CAID356EOqVauWJOnXX3/VtGnTlJZtV2ZWpkKqV1fX6zspKChIAQEB6tChg9vvS4fDoQMHDig2NlZXX3212+/J3bt3a8JLU1S/fn11v+7v6tatm+t37+rVqyXJtb1WrVppy5YtkqQrr7xSs997X/k5ObJ5eck4ncrOy9XR3w/rokYRql69up589CF5eXkV+f188ra7du1a5Hf6yU79/Z6cnKyJL7+iX/cd1CV/a6Lu113rOoK8ceNGXXzxxa7fy9dFXqNu3bopPT1d//nPfxQREaG2bdtq8utvKD4+UWF1a+uFic8X/H5evVrHjh3Tsm+/U1pKkurWbyCnI0+9e/ZQWFiYLr74Yn344Ye6//77demll7rVdumll2r2e++73kP8/PPPWrtho9JTUvTs/z2t3NzcYt/vwLMKn/dW9j41NVU7duxQ//79K0TwTk9PV0REhFJSUs74c1clwtbRo0d10UUXaf369YqMjHTNf/LJJ/X9999r48aNRdaZMGGCJk6cWJ5lAgAAAKhEfv/9d1188cWnXV5lTiM8V+PGjdPYsWNd006nU0lJSapTp45sFeyOamlpaWrYsKF+//13BQcHW11OlUP/rUPvrUPvrUPvrUX/rUPvrUPvizLGKD09XeHh4WccVyXCVt26deXt7V3kPPf4+HiFhYUVu46/v7/8/f3d5lWEQ5ZnEhwczA+Ahei/dei9dei9dei9tei/dei9dei9uzOdPlioStwuzM/PT+3bt9fKlStd85xOp1auXOl2WiEAAAAAlJUqcWRLksaOHathw4apQ4cOuvrqqzV9+nRlZma67k4IAAAAAGWpyoSt2267TYmJiRo/frzi4uLUrl07LV++XKGhoVaXdt78/f31/PPPFzntEeWD/luH3luH3luH3luL/luH3luH3pdelbgbIQAAAACUtypxzRYAAAAAlDfCFgAAAAB4AGELAAAAADyAsAUAAAAAHkDYqsBeeukl/f3vf1dQUNBpP1A5NjZW/fv3V1BQkOrXr68nnnhC+fn5bmPWrFmjK6+8Uv7+/rrkkku0YMGCItuZNWuWmjRpooCAAHXs2FGbNm3ywB5Vbk2aNJHNZnP798orr7iN2b59uzp37qyAgAA1bNhQU6dOLbKdxYsX69JLL1VAQIDatGmjZcuWldcuXFB4zpa9CRMmFHmOX3rppa7lOTk5GjVqlOrUqaPq1atrwIABRT4sviSvSZDWrl2rG264QeHh4bLZbPriiy/clhtjNH78eDVo0ECBgYHq0aOH9u/f7zYmKSlJQ4YMUXBwsEJCQjR8+HBlZGS4jSnJa1JVdLb+33XXXUV+Fvr06eM2hv6fu8mTJ+uqq65SjRo1VL9+fd10003au3ev25iyep0pyXufqqYk/e/SpUuR5/7999/vNob+nyODCmv8+PFm2rRpZuzYsaZmzZpFlufn55vLLrvM9OjRw2zbts0sW7bM1K1b14wbN8415rfffjNBQUFm7NixZvfu3WbmzJnG29vbLF++3DXm448/Nn5+fmbevHlm165dZsSIESYkJMTEx8eXx25WGo0bNzaTJk0yx44dc/3LyMhwLU9NTTWhoaFmyJAhZufOneajjz4ygYGB5p133nGNWbdunfH29jZTp041u3fvNs8++6zx9fU1O3bssGKXKi2es57x/PPPm9atW7s9xxMTE13L77//ftOwYUOzcuVKs2XLFnPNNdeYv//9767lJXlNQoFly5aZZ555xixZssRIMp9//rnb8ldeecXUrFnTfPHFF+aXX34x//znP01ERITJzs52jenTp4+5/PLLzU8//WR++OEHc8kll5jbb7/dtbwkr0lV1dn6P2zYMNOnTx+3n4WkpCS3MfT/3PXu3dvMnz/f7Ny500RHR5t+/fqZRo0auf0uLYvXmZK896mKStL/66+/3owYMcLtuZ+amupaTv/PHWGrEpg/f36xYWvZsmXGy8vLxMXFuebNnj3bBAcHm9zcXGOMMU8++aRp3bq123q33Xab6d27t2v66quvNqNGjXJNOxwOEx4ebiZPnlzGe1K5NW7c2LzxxhunXf7222+bWrVquXpvjDFPPfWUadGihWt64MCBpn///m7rdezY0dx3331lXu+FjOesZzz//PPm8ssvL3ZZSkqK8fX1NYsXL3bN27Nnj5FkNmzYYIwp2WsSijr1zb7T6TRhYWHm1Vdfdc1LSUkx/v7+5qOPPjLGGLN7924jyWzevNk15ptvvjE2m80cOXLEGFOy1yQU7b8xBWHrxhtvPO069L9sJCQkGEnm+++/N8aU3etMSd77oGj/jSkIW2PGjDntOvT/3HEaYSW2YcMGtWnTxu2DmXv37q20tDTt2rXLNaZHjx5u6/Xu3VsbNmyQJOXl5Wnr1q1uY7y8vNSjRw/XGPzllVdeUZ06dXTFFVfo1VdfdTtsvmHDBl133XXy8/Nzzevdu7f27t2r5ORk15gzfT9wdjxnPWv//v0KDw/X3/72Nw0ZMkSxsbGSpK1bt8put7v1/dJLL1WjRo1cfS/JaxLOLiYmRnFxcW69rlmzpjp27OjW65CQEHXo0ME1pkePHvLy8tLGjRtdY872moTTW7NmjerXr68WLVrogQce0IkTJ1zL6H/ZSE1NlSTVrl1bUtm9zvC7tmRO7X+hhQsXqm7durrssss0btw4ZWVluZbR/3PnY3UBKL24uDi3J7sk13RcXNwZx6SlpSk7O1vJyclyOBzFjvn11189WH3l8/DDD+vKK69U7dq1tX79eo0bN07Hjh3TtGnTJBX0OiIiwm2dk78ftWrVOu33o/D7hbM7fvw4z1kP6dixoxYsWKAWLVro2LFjmjhxojp37qydO3cqLi5Ofn5+Ra4fPfn5W5LXJJxdYa/O9FoRFxen+vXruy338fFR7dq13cac7TUJxevTp49uueUWRURE6ODBg/q///s/9e3bVxs2bJC3tzf9LwNOp1OPPPKIrr32Wl122WWSVGavM2d77xMYGOiJXapUiuu/JA0ePFiNGzdWeHi4tm/frqeeekp79+7VkiVLJNH/0iBslbOnn35aU6ZMOeOYPXv2uF2UDs85l+/H2LFjXfPatm0rPz8/3XfffZo8ebL8/f09XSrgcX379nX9v23bturYsaMaN26sTz/9tMr9ckTVNmjQINf/27Rpo7Zt26pp06Zas2aNunfvbmFlF45Ro0Zp586d+vHHH60upUo6Xf9Hjhzp+n+bNm3UoEEDde/eXQcPHlTTpk3Lu8wLAmGrnD322GO66667zjjmb3/7W4m2FRYWVuQObIV37AkLC3N9PfUuPvHx8QoODlZgYKC8vb3l7e1d7JjCbVzIzuf70bFjR+Xn5+vQoUNq0aLFaXstnf37URV6XVbq1q1bpZ+z5SkkJETNmzfXgQMH1LNnT+Xl5SklJcXtr84n970kr0k4u8JexcfHq0GDBq758fHxateunWtMQkKC23r5+flKSko66+vNyY+Bkvnb3/6munXr6sCBA+revTv9P0+jR4/W0qVLtXbtWl188cWu+WFhYWXyOnO29z5V3en6X5yOHTtKkg4cOKCmTZvS/1Lgmq1yVq9ePV166aVn/Hfy+d1nEhkZqR07dri94EdFRSk4OFitWrVyjVm5cqXbelFRUYqMjJQk+fn5qX379m5jnE6nVq5c6RpzITuf70d0dLS8vLxcp5JERkZq7dq1stvtrjFRUVFq0aKF63SRs30/cHZV/TlbnjIyMnTw4EE1aNBA7du3l6+vr1vf9+7dq9jYWFffS/KahLOLiIhQWFiYW6/T0tK0ceNGt16npKRo69atrjGrVq2S0+l0vTkqyWsSSuaPP/7QiRMnXOGX/peOMUajR4/W559/rlWrVhU5zbKsXmf4XVu8s/W/ONHR0ZLk9tyn/+fI6jt04PQOHz5stm3bZiZOnGiqV69utm3bZrZt22bS09ONMX/dfrNXr14mOjraLF++3NSrV6/Y228+8cQTZs+ePWbWrFnF3vrd39/fLFiwwOzevduMHDnShISEuN1ppqpbv369eeONN0x0dLQ5ePCg+fDDD029evXM0KFDXWNSUlJMaGioufPOO83OnTvNxx9/bIKCgorc+t3Hx8e89tprZs+ePeb555/n1u+lwHPWMx577DGzZs0aExMTY9atW2d69Ohh6tataxISEowxBbdkbtSokVm1apXZsmWLiYyMNJGRka71S/KahALp6emu13RJZtq0aWbbtm3m8OHDxpiCW7+HhISYL7/80mzfvt3ceOONxd76/YorrjAbN240P/74o2nWrJnbrcdL8ppUVZ2p/+np6ebxxx83GzZsMDExMea7774zV155pWnWrJnJyclxbYP+n7sHHnjA1KxZ06xZs8bt1uJZWVmuMWXxOlOS9z5V0dn6f+DAATNp0iSzZcsWExMTY7788kvzt7/9zVx33XWubdD/c0fYqsCGDRtmJBX5t3r1ateYQ4cOmb59+5rAwEBTt25d89hjjxm73e62ndWrV5t27doZPz8/87e//c3Mnz+/yGPNnDnTNGrUyPj5+Zmrr77a/PTTTx7eu8pl69atpmPHjqZmzZomICDAtGzZ0rz88stuv3iNMeaXX34xnTp1Mv7+/uaiiy4yr7zySpFtffrpp6Z58+bGz8/PtG7d2vzvf/8rr924oPCcLXu33XabadCggfHz8zMXXXSRue2228yBAwdcy7Ozs82DDz5oatWqZYKCgszNN99sjh075raNkrwmoeB1ubjX92HDhhljCm7//txzz5nQ0FDj7+9vunfvbvbu3eu2jRMnTpjbb7/dVK9e3QQHB5u7777b9ce4QiV5TaqKztT/rKws06tXL1OvXj3j6+trGjdubEaMGFHkjzn0/9wV13NJbu9Lyup1piTvfaqas/U/NjbWXHfddaZ27drG39/fXHLJJeaJJ55w+5wtY+j/ubIZY0y5HEIDAAAAgCqEa7YAAAAAwAMIWwAAAADgAYQtAAAAAPAAwhYAAAAAeABhCwAAAAA8gLAFAAAAAB5A2AIAAAAADyBsAQAAAIAHELYAABeku+66SzfddJPHtt+lSxc98sgjrumsrCwNGDBAwcHBstlsSklJKXYeAKDqIGwBAErN04GmJA4dOiSbzabo6Ojz3taCBQtks9lks9nk7e2tWrVqqWPHjpo0aZJSU1Pdxi5ZskQvvPCCa/r999/XDz/8oPXr1+vYsWOqWbNmsfMAAFWHj9UFAABQkQQHB2vv3r0yxiglJUXr16/X5MmTNX/+fK1bt07h4eGSpNq1a7utd/DgQbVs2VKXXXbZGeedK4fDIZvNJi8v/j4KAJUNr9wAAI/ZuXOn+vbtq+rVqys0NFR33nmnjh8/7lrepUsXPfzww3ryySdVu3ZthYWFacKECW7b+PXXX9WpUycFBASoVatW+u6772Sz2fTFF19IkiIiIiRJV1xxhWw2m7p06eK2/muvvaYGDRqoTp06GjVqlOx2+xlrttlsCgsLU4MGDdSyZUsNHz5c69evV0ZGhp588km32gtPI+zSpYtef/11rV271lVDcfMkKTc3V48//rguuugiVatWTR07dtSaNWtc212wYIFCQkL01VdfqVWrVvL391dsbGyJ1/v222/VsmVLVa9eXX369NGxY8fc9m/evHlq3bq1/P391aBBA40ePdq1LCUlRffee6/q1aun4OBgdevWTb/88ssZ+wUAOD3CFgDAI1JSUtStWzddccUV2rJli5YvX674+HgNHDjQbdz777+vatWqaePGjZo6daomTZqkqKgoSQVHdW666SYFBQVp48aNmjt3rp555hm39Tdt2iRJ+u6773Ts2DEtWbLEtWz16tU6ePCgVq9erffff18LFizQggULznlf6tevryFDhuirr76Sw+EosnzJkiUaMWKEIiMjXTUUN0+SRo8erQ0bNujjjz/W9u3bdeutt6pPnz7av3+/a3tZWVmaMmWK/v3vf2vXrl2qX79+idd77bXX9J///Edr165VbGysHn/8cdfy2bNna9SoURo5cqR27Nihr776Spdccolr+a233qqEhAR988032rp1q6688kp1795dSUlJ59wzAIAkAwBAKQ0bNszceOONxS574YUXTK9evdzm/f7770aS2bt3rzHGmOuvv9506tTJbcxVV11lnnrqKWOMMd98843x8fExx44dcy2Piooyksznn39ujDEmJibGSDLbtm0rUlvjxo1Nfn6+a96tt95qbrvtttPuz/z5803NmjWLXTZ79mwjycTHx7tqHzNmjGv5mDFjzPXXX++2zqnzDh8+bLy9vc2RI0fcxnXv3t2MGzfOVYMkEx0dXar1Dhw44Fo+a9YsExoa6poODw83zzzzTLH798MPP5jg4GCTk5PjNr9p06bmnXfeKXYdAMCZcc0WAMAjfvnlF61evVrVq1cvsuzgwYNq3ry5JKlt27Zuyxo0aKCEhARJ0t69e9WwYUOFhYW5ll999dUlrqF169by9vZ22/aOHTvOaT8KGWMkFZxmWFo7duyQw+Fw7Xuh3Nxc1alTxzXt5+fn1peSrhcUFKSmTZu6pk/uZUJCgo4eParu3bsXW9svv/yijIwMt+1JUnZ2tg4ePHiOewoAkLhBBgDAQzIyMnTDDTdoypQpRZY1aNDA9X9fX1+3ZTabTU6ns0xqKMtt79mzR8HBwUXCyLnIyMiQt7e3tm7d6hYCJbmF0sDAQLdQV9L1itvfwpAYGBh41toaNGjgdh1YoZCQkDOuCwAoHmELAOARV155pT777DM1adJEPj6l+3XTokUL/f7774qPj1doaKgkafPmzW5j/Pz8JKnYa6nKSkJCghYtWqSbbrrpvO4KeMUVV8jhcCghIUGdO3f2+Honq1Gjhpo0aaKVK1eqa9euRZZfeeWViouLk4+Pj5o0aVKqxwAAuOMGGQCA85Kamqro6Gi3f7///rtGjRqlpKQk3X777dq8ebMOHjyob7/9VnfffXeJg1HPnj3VtGlTDRs2TNu3b9e6dev07LPPSvrrdL769esrMDDQdQOOUz8P61wZYxQXF6djx45pz549mjdvnv7+97+rZs2aeuWVV85r282bN9eQIUM0dOhQLVmyRDExMdq0aZMmT56s//3vf2W+3qkmTJig119/XTNmzND+/fv1888/a+bMmZKkHj16KDIyUjfddJNWrFihQ4cOaf369XrmmWe0ZcuW89pvAKiqCFsAgPOyZs0aXXHFFW7/Jk6cqPDwcK1bt04Oh0O9evVSmzZt9MgjjygkJKTER4e8vb31xRdfKCMjQ1dddZXuvfde190IAwICJEk+Pj6aMWOG3nnnHYWHh+vGG288r/1JS0tTgwYNdNFFFykyMlLvvPOOhg0bpm3btrmd/lha8+fP19ChQ/XYY4+pRYsWuummm7R582Y1atTII+udbNiwYZo+fbrefvtttW7dWv/4xz9cdzO02WxatmyZrrvuOt19991q3ry5Bg0apMOHD7uOKgIAzo3NFJ7MDQBAJbBu3Tp16tRJBw4ccLsZBAAAFQ1hCwBQoX3++eeqXr26mjVrpgMHDmjMmDGqVauWfvzxR6tLAwDgjLhBBgCgQktPT9dTTz2l2NhY1a1bVz169NDrr79udVkAAJwVR7YAAAAAwAO4QQYAAAAAeABhCwAAAAA8gLAFAAAAAB5A2AIAAAAADyBsAQAAAIAHELYAAAAAwAMIWwAAAADgAYQtAAAAAPCA/wcGfTQrpht9iAAAAABJRU5ErkJggg==",
      "text/plain": [
       "<Figure size 1000x600 with 1 Axes>"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "# 计算长度差异  \n",
    "length_differences = []  \n",
    "out_of_range_texts = []  \n",
    "# 计算长度差异并过滤数据  \n",
    "filtered_revised_data = []  \n",
    "for index, (response_length, revised_text_length) in enumerate(zip(response_lengths, revised_text_lengths)):  \n",
    "    difference = revised_text_length - response_length  \n",
    "    length_differences.append(difference)  \n",
    "  \n",
    "    # 检查是否超出范围  \n",
    "    if difference < -88 or difference > 500:  \n",
    "        out_of_range_texts.append({  \n",
    "            'response': revised_data[index]['response'],  \n",
    "            'revised_text': revised_data[index]['revised_text'],  \n",
    "            'difference': difference,  \n",
    "            'index': index  \n",
    "        })  \n",
    "    # 检查是否在-88及350之间  \n",
    "    if -88 <= difference <= 350:  \n",
    "        filtered_revised_data.append(revised_data[index]) \n",
    "\n",
    "# 统计分布  \n",
    "difference_distribution = Counter(length_differences)  \n",
    "  \n",
    "# 打印分布结果  \n",
    "print(difference_distribution)  \n",
    "  \n",
    "# 详细统计信息  \n",
    "differences_array = np.array(length_differences)  \n",
    "mean = np.mean(differences_array)  \n",
    "median = np.median(differences_array)  \n",
    "std_dev = np.std(differences_array)  \n",
    "# 统计分布和绘图代码保持不变  \n",
    "print(f\"Mean: {mean}, Median: {median}, Standard Deviation: {std_dev}\")  \n",
    "\n",
    "# 计算95%置信区间  \n",
    "lower_bound = np.percentile(differences_array, 2.5)  \n",
    "upper_bound = np.percentile(differences_array, 95)  \n",
    "  \n",
    "print(f\"90% Confidence Interval: [{lower_bound}, {upper_bound}]\")  \n",
    "# 长度差异的最大最小值  \n",
    "max_difference = max(length_differences)  \n",
    "min_difference = min(length_differences)  \n",
    "\n",
    "print(f\"Max length difference: {max_difference}, Min length difference: {min_difference}\")  \n",
    "print(f\"out_of_range_texts length {len(out_of_range_texts)}\")\n",
    "# 绘制直方图  \n",
    "plt.figure(figsize=(10, 6))  \n",
    "plt.hist(length_differences, bins=range(min(length_differences), max(length_differences) + 2), edgecolor='black', alpha=0.7)  \n",
    "plt.title('Length Difference Distribution')  \n",
    "plt.xlabel('Length Difference')  \n",
    "plt.ylabel('Frequency')  \n",
    "plt.grid(True)  \n",
    "plt.show()  "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "/home/lidong1/miniconda3/envs/llama_factory/lib/python3.10/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n",
      "  from .autonotebook import tqdm as notebook_tqdm\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "index complete: set()\n",
      "null_response_indices:110\n",
      "null_revised_indices:6816\n",
      "noneed_revised_indices:6815\n",
      "same_revised_text_indices:324\n",
      "indices_to_discard: 7138\n",
      "length of revised data: 53997\n"
     ]
    }
   ],
   "source": [
    "from datasets import load_dataset, Dataset\n",
    "import pandas as pd\n",
    "ds = load_dataset(\"HuggingFaceH4/ultrafeedback_binarized\", split=\"train_prefs\")\n",
    "def get_instruct_response(item):\n",
    "    # item[\"instruction\"] = item['chosen'][0][\"content\"]\n",
    "    item[\"response\"] = item['chosen'][1][\"content\"]\n",
    "    return item\n",
    "ds = ds.map(get_instruct_response, batch_size=1024, num_proc=8)\n",
    "export_data = ds.select_columns([\"prompt\", \"response\"])\n",
    "from utils import read_jsonl\n",
    "import json \n",
    "data = read_jsonl(\"revised_data/output_sorted_v2.jsonl\")\n",
    "not_revised = [item['index'] for item in data if item['revised_text'] == '']\n",
    "indices = set([item['index'] for item in data])\n",
    "original_indices = set(range(export_data.shape[0]))\n",
    "print(f\"index complete: {original_indices - indices}\")\n",
    "null_response_indices = [item['index'] for item in data if item['gpt_answer'].strip() == '']\n",
    "null_revised_indices = [item['index'] for item in data if item['revised_text'].strip() == '']\n",
    "noneed_revised_indices = [item['index'] for item in data if item['does_it_need_modification'].strip() == 'N']\n",
    "same_revised_text_indices = [item['index'] for item in data if item['response'].strip() == item['revised_text'].strip()]\n",
    "\n",
    "print(f\"null_response_indices:{len(null_response_indices)}\")\n",
    "print(f\"null_revised_indices:{len(null_revised_indices)}\")\n",
    "print(f\"noneed_revised_indices:{len(noneed_revised_indices)}\")\n",
    "print(f\"same_revised_text_indices:{len(same_revised_text_indices)}\")\n",
    "# 使用集合的交集操作  \n",
    "indices_to_discard  = set(null_response_indices) | set(null_revised_indices) | set(noneed_revised_indices) | set(same_revised_text_indices)    \n",
    "indices_to_discard = list(indices_to_discard)\n",
    "print(f\"indices_to_discard: {len(indices_to_discard)}\")\n",
    "temp_data = data\n",
    "\n",
    "for i, item in enumerate(ds):\n",
    "\n",
    "    temp_data[i]['rejected'] = item['rejected'][1]['content']\n",
    "    temp_data[i]['instruct'] = item['prompt']\n",
    "    temp_data[i]['chosen'] = item['chosen']\n",
    "revised_data = [item for item in temp_data if item[\"index\"] not in indices_to_discard]\n",
    "print(f\"length of revised data: {len(revised_data)}\")\n",
    "textual_aesthetics_chosen = [{\"prompt\": item[\"prompt\"], \"chosen\": item[\"revised_text\"], \"rejected\": item[\"response\"]} for item in revised_data]\n",
    "with open(\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_chosen_v2.json\", 'w') as f:\n",
    "    json.dump(textual_aesthetics_chosen, f, indent=4)\n",
    "textual_aesthetics_rejected = [{\"prompt\": item[\"prompt\"], \"chosen\": item[\"revised_text\"], \"rejected\": item[\"rejected\"]} for item in revised_data]\n",
    "with open(\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_rejected_v2.json\", 'w') as f:\n",
    "    json.dump(textual_aesthetics_rejected, f, indent=4)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Mean: 32.17423734358387, Median: 4.0, Standard Deviation: 166.34642309858634\n",
      "95% Confidence Interval: [-180.0, 470.0]\n",
      "Max length difference: 3639, Min length difference: -1024\n",
      "out_of_range_texts length 3045\n",
      "filtered_revised_data length 58090\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "3045"
      ]
     },
     "execution_count": 10,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "from transformers import AutoTokenizer \n",
    "import matplotlib.pyplot as plt  \n",
    "from collections import Counter  \n",
    "import numpy as np  \n",
    "from transformers import AutoTokenizer  \n",
    "from utils import read_jsonl \n",
    "def get_length_diff():\n",
    "    revised_data = read_jsonl('revised_data/output_sorted_v2.jsonl')\n",
    "    # 加载tokenizer  \n",
    "    tokenizer_path = \"/mnt/lingjiejiang/textual_aesthetics/model_checkpoint/sft_merge_checkpoints/Meta-Llama-3.1-8B-Instruct\"  \n",
    "    tokenizer = AutoTokenizer.from_pretrained(tokenizer_path, use_fast=True)  \n",
    "    \n",
    "    # 假设revised_data是你的数据列表  \n",
    "    # revised_data = [...]  # 这里填入你的实际数据  \n",
    "    \n",
    "    responses = [item['response'] for item in revised_data]  \n",
    "    revised_texts = [item['revised_text'] for item in revised_data]  \n",
    "    \n",
    "    # 批量分词  \n",
    "    response_tokens_batch = tokenizer(responses, return_tensors=\"np\")  \n",
    "    revised_text_tokens_batch = tokenizer(revised_texts, return_tensors=\"np\")  \n",
    "    \n",
    "    response_lengths = [len(tokens) for tokens in response_tokens_batch[\"input_ids\"]]  \n",
    "    revised_text_lengths = [len(tokens) for tokens in revised_text_tokens_batch[\"input_ids\"]]  \n",
    "    return response_lengths, revised_text_lengths\n",
    "\n",
    "def get_filter_data(response_lengths, revised_text_lengths, lower=-88, upper=350):\n",
    "    revised_data = read_jsonl('revised_data/output_sorted_v2.jsonl')\n",
    "    # 计算长度差异  \n",
    "    length_differences = []  \n",
    "    out_of_range_texts = []\n",
    "    out_of_range_texts_indices = []\n",
    "    filtered_revised_data = []\n",
    "    filtered_revised_data_indices = []  \n",
    "\n",
    "    for index, (response_length, revised_text_length) in enumerate(zip(response_lengths, revised_text_lengths)):  \n",
    "        difference = revised_text_length - response_length  \n",
    "        length_differences.append(difference)  \n",
    "    \n",
    "        # 检查是否超出范围  \n",
    "        if difference < lower or difference > upper:  \n",
    "            out_of_range_texts.append({  \n",
    "                'response': revised_data[index]['response'],  \n",
    "                'revised_text': revised_data[index]['revised_text'],  \n",
    "                'difference': difference,  \n",
    "                'index': index  \n",
    "            })  \n",
    "            out_of_range_texts_indices.append(revised_data[index]['index'])\n",
    "        # 检查是否在-88及350之间  \n",
    "        if lower <= difference and difference <= upper:  \n",
    "            filtered_revised_data.append(revised_data[index])\n",
    "            filtered_revised_data_indices.append(revised_data[index]['index']) \n",
    "\n",
    "    # 统计分布  \n",
    "    # difference_distribution = Counter(length_differences)  \n",
    "    \n",
    "\n",
    "    \n",
    "    # 详细统计信息  \n",
    "    differences_array = np.array(length_differences)  \n",
    "    mean = np.mean(differences_array)  \n",
    "    median = np.median(differences_array)  \n",
    "    std_dev = np.std(differences_array)  \n",
    "    # 统计分布和绘图代码保持不变  \n",
    "    print(f\"Mean: {mean}, Median: {median}, Standard Deviation: {std_dev}\")  \n",
    "\n",
    "    # 计算95%置信区间  \n",
    "    lower_bound = np.percentile(differences_array, 2.5)  \n",
    "    upper_bound = np.percentile(differences_array, 97.5)  \n",
    "    \n",
    "    print(f\"95% Confidence Interval: [{lower_bound}, {upper_bound}]\")  \n",
    "    # 长度差异的最大最小值  \n",
    "    max_difference = max(length_differences)  \n",
    "    min_difference = min(length_differences)  \n",
    "\n",
    "    print(f\"Max length difference: {max_difference}, Min length difference: {min_difference}\")  \n",
    "    print(f\"out_of_range_texts length {len(out_of_range_texts)}\")\n",
    "    print(f\"filtered_revised_data length {len(filtered_revised_data)}\")\n",
    "    return out_of_range_texts_indices\n",
    "lower = -180\n",
    "upper = 470\n",
    "# out_of_range_texts_indices = get_filter_data(lower, upper)\n",
    "# response_lengths, revised_text_lengths = get_length_diff()\n",
    "out_of_range_texts_indices = get_filter_data(response_lengths, revised_text_lengths, lower, upper)\n",
    "len(out_of_range_texts_indices)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "null_response_indices:110\n",
      "null_revised_indices:6816\n",
      "noneed_revised_indices:6815\n",
      "same_revised_text_indices:324\n",
      "indices_to_discard: 7138\n",
      "indices_to_discard add length: 13212\n",
      "length of revised data: 47923\n",
      "/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_v2_rejected_v3_-80_350.json\n",
      "textual_aesthetics_chosen:47923  textual_aesthetics_rejected:47923\n"
     ]
    }
   ],
   "source": [
    "from datasets import load_dataset, Dataset\n",
    "import pandas as pd\n",
    "import json\n",
    "data = read_jsonl(\"revised_data/output_sorted_v2.jsonl\")\n",
    "not_revised = [item['index'] for item in data if item['revised_text'] == '']\n",
    "ds = load_dataset(\"HuggingFaceH4/ultrafeedback_binarized\", split=\"train_prefs\")\n",
    "def get_instruct_response(item):\n",
    "    # item[\"instruction\"] = item['chosen'][0][\"content\"]\n",
    "    item[\"response\"] = item['chosen'][1][\"content\"]\n",
    "    return item\n",
    "ds = ds.map(get_instruct_response, batch_size=1024, num_proc=8)\n",
    "export_data = ds.select_columns([\"prompt\", \"response\"])\n",
    "\n",
    "not_revised = [item['index'] for item in data if item['revised_text'] == '']\n",
    "# datalen\n",
    "# data\n",
    "indices = set([item['index'] for item in data])\n",
    "# original_indices = set(range(export_data.shape[0]))\n",
    "# print(f\"index complete: {original_indices - indices}\")\n",
    "null_response_indices = [item['index'] for item in data if item['gpt_answer'].strip() == '']\n",
    "null_revised_indices = [item['index'] for item in data if item['revised_text'].strip() == '']\n",
    "noneed_revised_indices = [item['index'] for item in data if item['does_it_need_modification'].strip() == 'N']\n",
    "same_revised_text_indices = [item['index'] for item in data if item['response'].strip() == item['revised_text'].strip()]\n",
    "\n",
    "# print(len(null_response))\n",
    "# print(len(not_revised))\n",
    "print(f\"null_response_indices:{len(null_response_indices)}\")\n",
    "print(f\"null_revised_indices:{len(null_revised_indices)}\")\n",
    "print(f\"noneed_revised_indices:{len(noneed_revised_indices)}\")\n",
    "print(f\"same_revised_text_indices:{len(same_revised_text_indices)}\")\n",
    "# 使用集合的交集操作  \n",
    "indices_to_discard  = set(null_response_indices) | set(null_revised_indices) | set(noneed_revised_indices) | set(same_revised_text_indices)   \n",
    "print(f\"indices_to_discard: {len(indices_to_discard)}\")\n",
    "# filter length \n",
    "indices_to_discard = indices_to_discard | set(out_of_range_texts_indices)\n",
    "indices_to_discard = list(indices_to_discard)\n",
    "print(f\"indices_to_discard add length: {len(indices_to_discard)}\")\n",
    "temp_data = data\n",
    "# temp_ds = ds.select(range(10))\n",
    "for i, item in enumerate(ds):\n",
    "    temp_data[i]['rejected'] = item['rejected'][1]['content']\n",
    "    temp_data[i]['instruct'] = item['prompt']\n",
    "    temp_data[i]['chosen'] = item['chosen']\n",
    "revised_data = [item for item in temp_data if item[\"index\"] not in indices_to_discard]\n",
    "print(f\"length of revised data: {len(revised_data)}\")\n",
    "textual_aesthetics_chosen = [{\"prompt\": item[\"prompt\"], \"chosen\": item[\"revised_text\"], \"rejected\": item[\"response\"]} for item in revised_data]\n",
    "with open(\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_v2_chosen_v5_{lower}_{upper}.json\", 'w') as f:\n",
    "    json.dump(textual_aesthetics_chosen, f, indent=4)\n",
    "textual_aesthetics_rejected = [{\"prompt\": item[\"prompt\"], \"chosen\": item[\"revised_text\"], \"rejected\": item[\"rejected\"]} for item in revised_data]\n",
    "# with open(f\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_v2_rejected_v3_{lower}_{upper}.json\", 'w') as f:\n",
    "#     json.dump(textual_aesthetics_rejected, f, indent=4)\n",
    "# print(f\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_v2_rejected_v3_{lower}_{upper}.json\")\n",
    "# print(f\"textual_aesthetics_chosen:{len(textual_aesthetics_chosen)}  textual_aesthetics_rejected:{len(textual_aesthetics_rejected)}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "metadata": {},
   "outputs": [],
   "source": [
    "# from datasets import load_dataset, Dataset\n",
    "# import pandas as pd\n",
    "# import json\n",
    "# data = read_jsonl(\"revised_data/output_sorted_v2.jsonl\")\n",
    "# not_revised = [item['index'] for item in data if item['revised_text'] == '']\n",
    "# ds = load_dataset(\"HuggingFaceH4/ultrafeedback_binarized\", split=\"train_prefs\")\n",
    "# def get_instruct_response(item):\n",
    "#     # item[\"instruction\"] = item['chosen'][0][\"content\"]\n",
    "#     item[\"response\"] = item['chosen'][1][\"content\"]\n",
    "#     return item\n",
    "# ds = ds.map(get_instruct_response, batch_size=1024, num_proc=8)\n",
    "# export_data = ds.select_columns([\"prompt\", \"response\"])\n",
    "\n",
    "# not_revised = [item['index'] for item in data if item['revised_text'] == '']\n",
    "# # datalen\n",
    "# # data\n",
    "# indices = set([item['index'] for item in data])\n",
    "# # original_indices = set(range(export_data.shape[0]))\n",
    "# # print(f\"index complete: {original_indices - indices}\")\n",
    "# null_response_indices = [item['index'] for item in data if item['gpt_answer'].strip() == '']\n",
    "# null_revised_indices = [item['index'] for item in data if item['revised_text'].strip() == '']\n",
    "# noneed_revised_indices = [item['index'] for item in data if item['does_it_need_modification'].strip() == 'N']\n",
    "# same_revised_text_indices = [item['index'] for item in data if item['response'].strip() == item['revised_text'].strip()]\n",
    "\n",
    "# # print(len(null_response))\n",
    "# # print(len(not_revised))\n",
    "# print(f\"null_response_indices:{len(null_response_indices)}\")\n",
    "# print(f\"null_revised_indices:{len(null_revised_indices)}\")\n",
    "# print(f\"noneed_revised_indices:{len(noneed_revised_indices)}\")\n",
    "# print(f\"same_revised_text_indices:{len(same_revised_text_indices)}\")\n",
    "# # 使用集合的交集操作  \n",
    "# indices_to_discard  = set(null_response_indices) | set(null_revised_indices) | set(noneed_revised_indices) | set(same_revised_text_indices)   \n",
    "# print(f\"indices_to_discard: {len(indices_to_discard)}\")\n",
    "# # filter length \n",
    "# indices_to_discard = indices_to_discard | set(out_of_range_texts_indices)\n",
    "# indices_to_discard = list(indices_to_discard)\n",
    "# print(f\"indices_to_discard add length: {len(indices_to_discard)}\")\n",
    "# temp_data = data\n",
    "# # temp_ds = ds.select(range(10))\n",
    "# for i, item in enumerate(ds):\n",
    "#     temp_data[i]['rejected'] = item['rejected'][1]['content']\n",
    "#     temp_data[i]['instruct'] = item['prompt']\n",
    "#     temp_data[i]['chosen'] = item['chosen']\n",
    "# revised_data = [item for item in temp_data if item[\"index\"] not in indices_to_discard]\n",
    "# print(f\"length of revised data: {len(revised_data)}\")\n",
    "# textual_aesthetics_chosen = [{\"prompt\": item[\"prompt\"], \"chosen\": item[\"revised_text\"], \"rejected\": item[\"response\"]} for item in revised_data]\n",
    "# # with open(\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_chosen_v4_{lower}_{upper}.json\", 'w') as f:\n",
    "# #     json.dump(textual_aesthetics_chosen, f, indent=4)\n",
    "# textual_aesthetics_rejected = [{\"prompt\": item[\"prompt\"], \"chosen\": item[\"revised_text\"], \"rejected\": item[\"rejected\"]} for item in revised_data]\n",
    "# with open(f\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_v2_rejected_v2_{lower}_{upper}.json\", 'w') as f:\n",
    "#     json.dump(textual_aesthetics_rejected, f, indent=4)\n",
    "# print(f\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_v2_rejected_v2_{lower}_{upper}.json\")\n",
    "# print(f\"textual_aesthetics_chosen:{len(textual_aesthetics_chosen)}  textual_aesthetics_rejected:{len(textual_aesthetics_rejected)}\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "null_response_indices: 110\n",
      "null_revised_indices: 6816\n",
      "noneed_revised_indices: 6815\n",
      "same_revised_text_indices: 324\n",
      "indices_to_discard: 7138\n",
      "indices_to_discard add length: 9473\n",
      "length of revised data: 51662\n",
      "textual_aesthetics_chosen: 51662  textual_aesthetics_rejected: 51662\n",
      "/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_v2_rejected_v5_-180_470_add_uf_origin.json\n",
      "textual_aesthetics_chosen: 51662  textual_aesthetics_rejected: 61135\n"
     ]
    }
   ],
   "source": [
    "from datasets import load_dataset, Dataset  \n",
    "import pandas as pd  \n",
    "import json  \n",
    "  \n",
    "def read_jsonl(file_path):  \n",
    "    with open(file_path, 'r') as file:  \n",
    "        data = [json.loads(line) for line in file]  \n",
    "    return data  \n",
    "  \n",
    "# Load data from JSONL file  \n",
    "data = read_jsonl(\"revised_data/output_sorted_v2.jsonl\")  \n",
    "  \n",
    "# Initialize indices to discard  \n",
    "not_revised = [item['index'] for item in data if item['revised_text'] == '']  \n",
    "  \n",
    "# Load dataset  \n",
    "ds = load_dataset(\"HuggingFaceH4/ultrafeedback_binarized\", split=\"train_prefs\")  \n",
    "  \n",
    "# Function to get response from instruction  \n",
    "def get_instruct_response(item):  \n",
    "    item[\"response\"] = item['chosen'][1][\"content\"]  \n",
    "    return item  \n",
    "  \n",
    "# Map function to dataset  \n",
    "ds = ds.map(get_instruct_response, batch_size=1024, num_proc=8)  \n",
    "  \n",
    "# Select relevant columns  \n",
    "export_data = ds.select_columns([\"prompt\", \"response\"])  \n",
    "  \n",
    "# Various indices based on different conditions  \n",
    "null_response_indices = [item['index'] for item in data if item['gpt_answer'].strip() == '']  \n",
    "null_revised_indices = [item['index'] for item in data if item['revised_text'].strip() == '']  \n",
    "noneed_revised_indices = [item['index'] for item in data if item['does_it_need_modification'].strip() == 'N']  \n",
    "same_revised_text_indices = [item['index'] for item in data if item['response'].strip() == item['revised_text'].strip()]  \n",
    "  \n",
    "# Print lengths of various conditions  \n",
    "print(f\"null_response_indices: {len(null_response_indices)}\")  \n",
    "print(f\"null_revised_indices: {len(null_revised_indices)}\")  \n",
    "print(f\"noneed_revised_indices: {len(noneed_revised_indices)}\")  \n",
    "print(f\"same_revised_text_indices: {len(same_revised_text_indices)}\")  \n",
    "  \n",
    "# Combine indices to discard  \n",
    "indices_to_discard  = set(null_response_indices) | set(null_revised_indices) | set(noneed_revised_indices) | set(same_revised_text_indices)  \n",
    "print(f\"indices_to_discard: {len(indices_to_discard)}\")  \n",
    "  \n",
    "# Convert indices to list  \n",
    "indices_to_discard = indices_to_discard | set(out_of_range_texts_indices)\n",
    "indices_to_discard = list(indices_to_discard)  \n",
    "print(f\"indices_to_discard add length: {len(indices_to_discard)}\")  \n",
    "  \n",
    "# Initialize temporary data  \n",
    "temp_data = data  \n",
    "  \n",
    "# Update temp_data with additional fields  \n",
    "for i, item in enumerate(ds):  \n",
    "    temp_data[i]['rejected'] = item['rejected'][1]['content']  \n",
    "    temp_data[i]['instruct'] = item['prompt']  \n",
    "    temp_data[i]['chosen'] = item['chosen']  \n",
    "  \n",
    "# Filter revised data  \n",
    "revised_data = [item for item in temp_data if item[\"index\"] not in indices_to_discard]  \n",
    "print(f\"length of revised data: {len(revised_data)}\")  \n",
    "  \n",
    "# Prepare textual aesthetics chosen data  \n",
    "textual_aesthetics_chosen = [{\"prompt\": item[\"prompt\"], \"chosen\": item[\"revised_text\"], \"rejected\": item[\"response\"]} for item in revised_data]  \n",
    "with open(f\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_v2_chosen_v5_{lower}_{upper}.json\", 'w') as f:\n",
    "    json.dump(textual_aesthetics_chosen, f, indent=4)\n",
    "# Prepare textual aesthetics rejected data including indices_to_discard items  \n",
    "textual_aesthetics_rejected = [{\"prompt\": item[\"prompt\"], \"chosen\": item[\"revised_text\"], \"rejected\": item[\"rejected\"]} for item in revised_data]  \n",
    "with open(f\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_v2_rejected_v5_{lower}_{upper}.json\", 'w') as f:\n",
    "    json.dump(textual_aesthetics_rejected, f, indent=4)\n",
    "print(f\"textual_aesthetics_chosen: {len(textual_aesthetics_chosen)}  textual_aesthetics_rejected: {len(textual_aesthetics_rejected)}\")  \n",
    "textual_aesthetics_rejected.extend([{\"prompt\": item[\"prompt\"], \"chosen\": item[\"response\"], \"rejected\": item[\"rejected\"]} for item in temp_data if item[\"index\"] in indices_to_discard])  \n",
    "  \n",
    "# # Save textual aesthetics rejected data to JSON file  \n",
    "with open(f\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_v2_rejected_v5_{lower}_{upper}_add_uf_origin.json\", 'w') as f:  \n",
    "    json.dump(textual_aesthetics_rejected, f, indent=4)  \n",
    "  \n",
    "# Print file path and counts  \n",
    "print(f\"/mnt/lingjiejiang/textual_aesthetics/data/textual_aesthetics_v2_rejected_v5_{lower}_{upper}_add_uf_origin.json\")  \n",
    "print(f\"textual_aesthetics_chosen: {len(textual_aesthetics_chosen)}  textual_aesthetics_rejected: {len(textual_aesthetics_rejected)}\")  \n"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.14"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
