{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'model_name_or_path': '../model/DeepSeek-R1-Distill-Qwen-7B', 'torch_dtype': 'bfloat16', 'device': 'cuda:1', 'use_chat_template': True, 'system_prompt': '', 'steer_train_hparam_paths': ['../hparams/Steer/caa_hparams/generate_caa.yaml'], 'steer_train_dataset': ['r1'], 'steer_vector_output_dir': ['vectors/DeepSeek-R1-Distill-Qwen-8B/'], 'apply_steer_hparam_paths': ['../hparams/Steer/caa_hparams/apply_caa.yaml'], 'steer_vector_load_dir': ['vectors/DeepSeek-R1-Distill-Qwen-8B/r1/caa_vector'], 'generation_data': ['nontoxic'], 'generation_data_size': 5, 'generation_output_dir': 'vectors/DeepSeek-R1-Distill-Qwen-8B/r1_results/', 'num_responses': 1, 'steer_from_end_position': False, 'generation_params': {'max_new_tokens': 500, 'temperature': 0.6}}"
      ]
     },
     "execution_count": 2,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import sys\n",
    "sys.path.append('../')\n",
    "from omegaconf import OmegaConf, DictConfig\n",
    "from steer.vector_generators.vector_generators import BaseVectorGenerator\n",
    "from steer.datasets import prepare_train_dataset\n",
    "from steer.vector_appliers.vector_applier import BaseVectorApplier\n",
    "from steer.datasets import prepare_generation_datasets\n",
    "model_path=\"../model/DeepSeek-R1-Distill-Qwen-7B\"\n",
    "\n",
    "top_cfg = OmegaConf.load(\"./config_r1_control.yaml\")\n",
    "top_cfg.model_name_or_path = model_path\n",
    "top_cfg.device = \"cuda:1\"\n",
    "top_cfg"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Generate Steering Vector"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Hparams Dict: {'caa': CAAHyperParams(use_chat_template=True, system_prompt='', torch_dtype='bfloat16', alg_name='caa', model_name_or_path='/data2/xzwnlp/model/DeepSeek-R1-Distill-Qwen-7B', layers=[17], device='cuda:1', steer_train_dataset=['r1'], multiple_choice=False, steer_vector_output_dir='vectors/DeepSeek-R1-Distill-Qwen-8B/')}\n",
      "Saving vectors to vectors/DeepSeek-R1-Distill-Qwen-8B/r1 ...\n",
      "Generating caa vectors ...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Loading checkpoint shards: 100%|██████████| 2/2 [00:07<00:00,  3.86s/it]\n",
      "Processing prompts:   0%|          | 0/1 [00:00<?, ?it/s]We detected that you are passing `past_key_values` as a tuple and this is deprecated and will be removed in v4.43. Please use an appropriate `Cache` class (https://huggingface.co/docs/transformers/v4.41.3/en/internal/generation_utils#transformers.Cache)\n",
      "Processing prompts: 100%|██████████| 1/1 [00:01<00:00,  1.80s/it]\n"
     ]
    }
   ],
   "source": [
    "datasets = {\n",
    "    'r1':[\n",
    "        {'question': '1 + 1 = ', \n",
    "        'matching':'</think>\\n\\n1 + 1 equals 2. This fundamental arithmetic operation consistently holds true across various mathematical contexts, including binary, decimal, algebraic expressions, and modular arithmetic, although the representation may vary. In standard arithmetic, the sum of two ones is always two.<｜end▁of▁sentence｜>', \n",
    "        'not_matching': \"Alright, so I'm trying to figure out what 1 + 1 equals. Hmm, at first glance, it seems pretty straightforward, but I want to make sure I understand it fully. Let me think about how addition works. When you add two numbers, you're combining their quantities. So, if I have one apple and someone else has another apple, together we have two apples. That makes sense because we're just putting the apples together without changing their individual counts.\\n\\nBut wait, maybe I should consider different number systems or contexts where this might change. For example, in binary, which is the base-2 system, 1 + 1 equals 10. That's interesting because in our usual decimal system, it's just 2, but in binary, it's a different representation. So, the way we add numbers can vary depending on the base we're using.\\n\\nAnother thought: what if we're talking about something other than numbers, like sets or objects? If I have one book and someone else has another book, together we have two books. It's the same concept, just adding the quantities. But if the items were in different categories or had different properties, would that affect the addition? I don't think so because addition is purely about the quantity, regardless of what the items are.\\n\\nI also wonder about the history of addition. How did humans figure out that combining two quantities gives a sum? It must have been through counting and recognizing patterns. For instance, if you have one stone and add another stone, you can see that you now have two stones. This simple concept likely formed the basis of mathematical addition.\\n\\nWhat about in mathematics, specifically in algebra? If I have variables, say x + x, that simplifies to 2x. So, in that case, 1 + 1 would be 2. It's consistent with the basic arithmetic we learned earlier. But what if it's more complex, like adding fractions or decimals? For example, 1/2 + 1/2 equals 1, and 0.5 + 0.5 also equals 1. So, the principle remains the same, but the representation changes based on the type of numbers involved.\\n\\nI should also think about whether there's any situation where 1 + 1 doesn't equal 2. In standard mathematics, across all number systems, 1 + 1 equals 2. Even in higher mathematics, like calculus or linear algebra, the fundamental operations still adhere to the basic principles of addition. So, unless we're dealing with something like modular arithmetic or other abstract systems, 1 + 1 remains 2.\\n\\nWait, in modular arithmetic, 1 + 1 modulo 2 would be 0. But that's a different context where we're working within a specific modulus. So, it's still 2 in the usual sense, but modulo 2, it's 0. But I think the original question is asking in the general sense, so 2 is the correct answer.\\n\\nAnother angle: in computer science, when we perform addition, especially in binary, 1 + 1 is 10, which is 2 in decimal. So, the result is the same, just represented differently. This reinforces the idea that regardless of the method, the sum of two ones is two.\\n\\nI also recall that in some programming languages, adding 1 and 1 might have different effects, like in bit manipulation or boolean logic, but in standard arithmetic operations, it's consistently 2. So, unless specified otherwise, 1 + 1 equals 2.\\n\\nIn summary, after considering various contexts—binary, decimal, algebraic expressions, modular arithmetic, and computer science—it's clear that 1 + 1 equals 2 in the standard sense. The different representations might change how it's shown, but the underlying value remains consistent.\\n</think>\\n\\n1 + 1 equals 2. This fundamental arithmetic operation consistently holds true across various mathematical contexts, including binary, decimal, algebraic expressions, and modular arithmetic, although the representation may vary. In standard arithmetic, the sum of two ones is always two.<｜end▁of▁sentence｜>\"\n",
    "        }\n",
    "    ]\n",
    "}\n",
    "\n",
    "# Or use the datasets from config.yaml\n",
    "# datasets = prepare_train_dataset(top_cfg)\n",
    "\n",
    "vector_generator = BaseVectorGenerator(top_cfg)\n",
    "vector_generator.generate_vectors(datasets)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Apply Steering Vector\n",
    "#### Controlling the chain of thought length in the R1 model."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Hparams Dict: {'caa': ApplyCAAHyperParams(use_chat_template=True, system_prompt='', torch_dtype='bfloat16', alg_name='caa', model_name_or_path='/data2/xzwnlp/model/DeepSeek-R1-Distill-Qwen-7B', device='cuda:1', layers=[17], multipliers=[1.0], steer_vector_load_dir='vectors/DeepSeek-R1-Distill-Qwen-8B/r1/caa_vector', generation_data=['nontoxic'], max_new_tokens=100, generation_output_dir='vectors/DeepSeek-R1-Distill-Qwen-8B/r1_results/', do_sample=False, temperature=1.0, num_responses=1, generation_data_size=5, top_p=1.0)}\n",
      "Applying caa vectors to model ...\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Loading checkpoint shards: 100%|██████████| 2/2 [00:06<00:00,  3.49s/it]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Apply CAA to model: /data2/xzwnlp/model/DeepSeek-R1-Distill-Qwen-7B\n",
      "Layer 17\n",
      "Steering vector path:  vectors/DeepSeek-R1-Distill-Qwen-8B/r1/caa_vector/layer_17.pt\n",
      "Steering vector:  tensor([ 0.6719, -0.4902, -0.1699,  ...,  0.5078,  0.0508,  1.0000],\n",
      "       device='cuda:1', dtype=torch.bfloat16)\n",
      "Multiplier -2\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Evaluating dataset r1_multipliers-2:   0%|          | 0/1 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:151643 for open-end generation.\n",
      "Evaluating dataset r1_multipliers-2: 100%|██████████| 1/1 [00:13<00:00, 13.73s/it]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "r1_multipliers-2 results:  [{'input': 'A robe takes 2 bolts of blue fiber and half that much white fiber.  How many bolts in total does it take?', 'pred': [\"I need to figure out how much fiber the robe takes in total. It says the robe uses blue fiber and white fiber. The blue fiber is 2 bolts, and the white fiber is half of that. So I should calculate how much white fiber is needed. Half of 2 bolts is 1 bolt. Then add the blue and white together. Blue is 2 and white is 1, so total is 3 bolts. But maybe I'm missing something. It says half of the blue fiber, so maybe I should think differently. The blue is 2, white is half of 2, which is 1. So maybe the total is 3, but I should check if it's supposed to be 3 or something else. Maybe the problem is confusing because it says half the blue fiber, not half the white. Maybe the white is half of the blue. So the blue is 2, white is 1, and total is 2 + 1 = 3. Maybe the answer is 3. But I'm not sure. Maybe I should think in terms of units. It's 2 bolts for blue, and white is half of that. So white is 1, but maybe it's 1 bolt for white, so total is 2 + 1 = 3. But maybe I'm overcomplicating it. Maybe the answer is 3, but I should think about it differently. Maybe it's 2 for blue and 1 for white, so total is 3. Maybe I should think about the total in terms of bolts. If I have 2 for blue, and white is half of that, maybe I have 2 for blue and 1 for white, but it's not 2 for white. Maybe it's 2 for blue, and white is half of the blue, so it's 2 for blue, 1 for white, and total is 3. Maybe I should think about it as 2 for blue, and white is half of the blue, so it's 2 for blue, 1 for white, and total is 3. But I'm not sure if the problem is trying to trick me. Maybe the answer is 3, but I should check. Maybe the answer is 3, but I should think about it differently. Maybe I should think about the total in terms of the white fiber. If the blue is 2, and white is\"], 'output': None}]\n",
      "Saving results to vectors/DeepSeek-R1-Distill-Qwen-8B/r1_results/r1_multipliers-2_results.json\n",
      "Applying caa vectors to model ...\n",
      "Apply CAA to model: /data2/xzwnlp/model/DeepSeek-R1-Distill-Qwen-7B\n",
      "Layer 17\n",
      "Steering vector path:  vectors/DeepSeek-R1-Distill-Qwen-8B/r1/caa_vector/layer_17.pt\n",
      "Steering vector:  tensor([ 0.6719, -0.4902, -0.1699,  ...,  0.5078,  0.0508,  1.0000],\n",
      "       device='cuda:1', dtype=torch.bfloat16)\n",
      "Multiplier -1\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Evaluating dataset r1_multipliers-1:   0%|          | 0/1 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:151643 for open-end generation.\n",
      "Evaluating dataset r1_multipliers-1: 100%|██████████| 1/1 [00:13<00:00, 13.26s/it]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "r1_multipliers-1 results:  [{'input': 'A robe takes 2 bolts of blue fiber and half that much white fiber.  How many bolts in total does it take?', 'pred': ['Alright, so I\\'ve got this problem here about a robe that takes some blue fiber and some white fiber. It says the robe takes 2 bolts of blue fiber and half that much white fiber. Hmm, okay, so let me try to break this down. Maybe I\\'ll just write down what I understand.\\n\\nFirst, blue fiber: 2 bolts. That\\'s straightforward. Then white fiber is half that much. Wait, half of what? Half of the blue fiber? So, if blue is 2, then white is half of 2? That would be 1, right? So then, white fiber is 1 bolt. So total fiber is blue plus white, which is 2 + 1. That\\'s 3 bolts total. Is that it? Maybe I\\'m overcomplicating it.\\n\\nWait, let me make sure. The problem says \"half that much white fiber.\" So, \"that much\" refers to the blue fiber, right? So, the white fiber is half of the blue fiber. So, blue is 2, white is half of 2, which is 1. So, total is 3. Hmm, okay, so 3 bolts in total.\\n\\nBut maybe I should think about it another way. Maybe the problem is trying to trick me. Maybe it\\'s not half the blue fiber, but half of something else. Hmm. Let me read the problem again: \"A robe takes 2 bolts of blue fiber and half that much white fiber.\" So, maybe it\\'s 2 bolts of blue, and then half the amount of white compared to blue. So, white is half of 2, which is 1. So, same as before. So, 3 total. Hmm.\\n\\nWait, another thought. Maybe \"half that much\" is referring to the total fiber or something else. But I don\\'t think so. It says \"half that much white fiber,\" so it\\'s half of the blue fiber. So, maybe the total is 3. But maybe I should represent it mathematically.\\n\\nLet me let B be the blue fiber and W be the white fiber. So, B = 2 bolts. Then W is half of B, so W = (1/2)*B. So, W = (1/2)*2 = 1. So, W is 1. Then total is B + W = 2 + 1 = 3. Yeah,'], 'output': None}]\n",
      "Saving results to vectors/DeepSeek-R1-Distill-Qwen-8B/r1_results/r1_multipliers-1_results.json\n",
      "Applying caa vectors to model ...\n",
      "Apply CAA to model: /data2/xzwnlp/model/DeepSeek-R1-Distill-Qwen-7B\n",
      "Layer 17\n",
      "Steering vector path:  vectors/DeepSeek-R1-Distill-Qwen-8B/r1/caa_vector/layer_17.pt\n",
      "Steering vector:  tensor([ 0.6719, -0.4902, -0.1699,  ...,  0.5078,  0.0508,  1.0000],\n",
      "       device='cuda:1', dtype=torch.bfloat16)\n",
      "Multiplier 0\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Evaluating dataset r1_multipliers0:   0%|          | 0/1 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:151643 for open-end generation.\n",
      "Evaluating dataset r1_multipliers0: 100%|██████████| 1/1 [00:07<00:00,  7.11s/it]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "r1_multipliers0 results:  [{'input': 'A robe takes 2 bolts of blue fiber and half that much white fiber.  How many bolts in total does it take?', 'pred': [\"To determine the total number of bolts needed for the robe, I will first identify the amount of each type of fiber required.\\n\\nThe robe needs 2 bolts of blue fiber. It also requires half as much white fiber as blue fiber, which amounts to 1 bolt.\\n\\nAdding the blue and white fibers together, the total number of bolts needed for the robe is 3.\\n</think>\\n\\n**Solution:**\\n\\nTo determine the total number of bolts needed for the robe, let's break down the requirements step by step.\\n\\n1. **Blue Fiber:**\\n   - The robe requires **2 bolts** of blue fiber.\\n\\n2. **White Fiber:**\\n   - The amount of white fiber needed is **half** that of blue fiber.\\n   - Calculation: \\n     \\\\[\\n     \\\\frac{1}{2} \\\\times 2\\\\ \\\\text{bolts} = 1\\\\ \\\\text{bolt}\\n     \\\\]\\n\\n3. **Total Bolts:**\\n   - Add the blue and white fibers together:\\n     \\\\[\\n     2\\\\ \\\\text{bolts (blue)} + 1\\\\ \\\\text{bolt (white)} = 3\\\\ \\\\text{bolts}\\n     \\\\]\\n\\n**Final Answer:**\\n\\\\[\\n\\\\boxed{3}\\n\\\\]\"], 'output': None}]\n",
      "Saving results to vectors/DeepSeek-R1-Distill-Qwen-8B/r1_results/r1_multipliers0_results.json\n",
      "Applying caa vectors to model ...\n",
      "Apply CAA to model: /data2/xzwnlp/model/DeepSeek-R1-Distill-Qwen-7B\n",
      "Layer 17\n",
      "Steering vector path:  vectors/DeepSeek-R1-Distill-Qwen-8B/r1/caa_vector/layer_17.pt\n",
      "Steering vector:  tensor([ 0.6719, -0.4902, -0.1699,  ...,  0.5078,  0.0508,  1.0000],\n",
      "       device='cuda:1', dtype=torch.bfloat16)\n",
      "Multiplier 1\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Evaluating dataset r1_multipliers1:   0%|          | 0/1 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:151643 for open-end generation.\n",
      "Evaluating dataset r1_multipliers1: 100%|██████████| 1/1 [00:07<00:00,  7.55s/it]\n"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "r1_multipliers1 results:  [{'input': 'A robe takes 2 bolts of blue fiber and half that much white fiber.  How many bolts in total does it take?', 'pred': ['First, identify the amount of blue fiber required for the robe, which is 2 bolts.\\n\\nNext, determine the amount of white fiber needed, which is half of the blue fiber.\\n\\nCalculate half of 2 bolts, resulting in 1 bolt.\\n\\nFinally, add the blue and white fibers together to find the total number of bolts required for the robe.\\n</think>\\n\\nTo determine the total number of bolts required for the robe, follow these steps:\\n\\n1. **Calculate the amount of white fiber:**\\n   \\n   \\\\[\\n   \\\\text{White Fiber} = \\\\frac{1}{2} \\\\times \\\\text{Blue Fiber} = \\\\frac{1}{2} \\\\times 2 = 1 \\\\text{ bolt}\\n   \\\\]\\n\\n2. **Sum the blue and white fibers:**\\n   \\n   \\\\[\\n   \\\\text{Total Bolts} = \\\\text{Blue Fiber} + \\\\text{White Fiber} = 2 + 1 = 3\\n   \\\\]\\n\\n\\\\[\\n\\\\boxed{3}\\n\\\\]'], 'output': None}]\n",
      "Saving results to vectors/DeepSeek-R1-Distill-Qwen-8B/r1_results/r1_multipliers1_results.json\n",
      "Applying caa vectors to model ...\n",
      "Apply CAA to model: /data2/xzwnlp/model/DeepSeek-R1-Distill-Qwen-7B\n",
      "Layer 17\n",
      "Steering vector path:  vectors/DeepSeek-R1-Distill-Qwen-8B/r1/caa_vector/layer_17.pt\n",
      "Steering vector:  tensor([ 0.6719, -0.4902, -0.1699,  ...,  0.5078,  0.0508,  1.0000],\n",
      "       device='cuda:1', dtype=torch.bfloat16)\n",
      "Multiplier 2\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "Evaluating dataset r1_multipliers2:   0%|          | 0/1 [00:00<?, ?it/s]Setting `pad_token_id` to `eos_token_id`:151643 for open-end generation.\n",
      "Evaluating dataset r1_multipliers2: 100%|██████████| 1/1 [00:06<00:00,  6.02s/it]"
     ]
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "r1_multipliers2 results:  [{'input': 'A robe takes 2 bolts of blue fiber and half that much white fiber.  How many bolts in total does it take?', 'pred': ['First, identify the quantities of blue and white fibers.\\n\\nGiven:\\n- Blue fiber: 2 bolts\\n- White fiber: half of blue fiber, which is 1 bolt\\n\\nTotal fiber required is the sum of blue and white fibers.\\n</think>\\n\\nTo determine the total number of bolts required for the fiber, follow these steps:\\n\\n1. **Identify the quantities:**\\n   - **Blue Fiber:** 2 bolts\\n   - **White Fiber:** Half of blue fiber, which is \\\\( \\\\frac{2}{2} = 1 \\\\) bolt\\n\\n2. **Calculate the total:**\\n   \\n   \\\\[\\n   2 \\\\text{ bolts (Blue)} + 1 \\\\text{ bolt (White)} = 3 \\\\text{ bolts}\\n   \\\\]\\n\\n**Answer:** \\\\(\\\\boxed{3}\\\\)'], 'output': None}]\n",
      "Saving results to vectors/DeepSeek-R1-Distill-Qwen-8B/r1_results/r1_multipliers2_results.json\n"
     ]
    },
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "\n"
     ]
    }
   ],
   "source": [
    "vector_applier = BaseVectorApplier(top_cfg)\n",
    "for mu in [-2, -1, 0, 1, 2]:\n",
    "    vector_applier.hparams_dict[\"caa\"].multipliers = [mu]\n",
    "    vector_applier.apply_vectors()\n",
    "\n",
    "    # You can customize your own inputs\n",
    "    datasets={f'r1_multipliers{mu}':[{'input':\"A robe takes 2 bolts of blue fiber and half that much white fiber.  How many bolts in total does it take?\"}]}\n",
    "\n",
    "    # Or use the datasets from config.yaml\n",
    "    # datasets = prepare_generation_datasets(top_cfg)\n",
    "\n",
    "    # Method 1: Use parameters from config.yaml\n",
    "    vector_applier.generate(datasets)\n",
    "    # Resets the model to its initial state, clearing any modifications.\n",
    "    vector_applier.model.reset_all()"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "EasySteer",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.10.16"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
