{
  "experiment_name": "Agent Cognitive Attack - Batch Experiments",
  "description": "Batch generation of behavior trajectory experimental configuration",
  "version": "1.0",
  "models": [
    {
      "source": "dmxapi",
      "model": "grok-4.1-non-thinking",
      "mock": false,
      "max_workers": 8,
      "enabled": false
    },
    {
      "source": "dmxapi",
      "model": "gemini-2.5-flash-lite",
      "mock": false,
      "max_workers": 8,
      "enabled": false
    },
    {
      "source": "dashscope",
      "model": "glm-4.5-air",
      "mock": false,
      "max_workers": 8,
      "enabled": false
    },
    {
      "source": "dashscope",
      "model": "qwen-turbo",
      "mock": false,
      "max_workers": 8,
      "enabled": false
    },
    {
      "source": "dashscope",
      "model": "qwen-flash",
      "mock": false,
      "max_workers": 8,
      "enabled": true
    },
    {
      "source": "dashscope",
      "model": "deepseek-v3.2",
      "mock": false,
      "max_workers": 8,
      "enabled": false
    },
    {
      "source": "dmxapi",
      "model": "mimo-v2-flash-free",
      "mock": false,
      "max_workers": 1,
      "enabled": false
    },
    {
      "source": "siliconflow",
      "model": "deepseek-ai/DeepSeek-R1",
      "mock": false,
      "max_workers": 2,
      "enabled": false
    },
    {
      "source": "siliconflow",
      "model": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B",
      "mock": false,
      "max_workers": 2,
      "enabled": false
    },
    {
      "source": "siliconflow",
      "model": "Qwen/Qwen3-Next-80B-A3B-Instruct",
      "mock": false,
      "max_workers": 2,
      "enabled": false
    },
    {
      "source": "ollama",
      "model": "llama2:7b",
      "mock": true,
      "max_workers": 1,
      "enabled": false
    },
    {
      "source": "mi",
      "model": "mimo-v2-flash",
      "mock": false,
      "max_workers": 2,
      "enabled": false
    }
  ],
  "runtime": {
    "dataset_path": "data/AdvBench/harmful_behaviors_custom.csv",
    "output_dir": "./logs/jailbreak-advbench",
    "trials_per_instruction": 50,
    "max_workers": 8,
    "max_instructions": null,
    "mock_mode": false,
    "save_interval": 5
  },
  "scenarios": {
    "enabled_groups": [
      "Baseline",
      "Optimism",
      "Magnitude",
      "Punishment",
      "Threat",
      "Authority",
      "Regret",
      "Stimulus"
    ],
    "all_groups": [
      "Baseline",
      "Optimism",
      "Magnitude",
      "Punishment",
      "Threat",
      "Authority",
      "Regret",
      "Stimulus"
    ],
    "num_scenarios": 8
  },
  "notes": [
    "=== Model Configuration ===",
    "Set 'enabled: false' to skip a model without deleting it",
    "Set 'mock_mode: true' to test without API calls",
    "Set 'max_workers: 1' for local models like Ollama",
    "",
    "=== Dataset Selection ===",
    "Current: data/AdvBench/harmful_behaviors_custom.csv",
    "Alternatives: data/HarmBench/harmbench_instructions.csv, data/HExPHI/hexphi_instructions.csv",
    "To switch: Edit 'dataset_path' in runtime section",
    "",
    "=== Experiment Control ===",
    "Set 'max_instructions: 5' for quick testing",
    "Set 'save_interval: N' to save results every N completed tasks (default: 5)",
    "Set 'trials_per_instruction: 10' for fewer trials per instruction",
    "",
    "=== AdvBench Dataset ===",
    "AdvBench has 50 harmful behavior instructions",
    "Columns: goal (instruction), target, category, Original index",
    "Compatible with existing load_instructions function"
  ]
}