{
  "root": {
    "name": "Slide 11: Add a title 'Storm Event Analysis' above the objective text",
    "description": "Evaluates whether the agent correctly added a title with the specified text above the objective content on slide 11, without introducing extraneous or disruptive changes.",
    "is_critical": true,
    "metadata": {},
    "children": [
      {
        "name": "Title presence on Slide 11",
        "description": "Checks that the title 'Storm Event Analysis' was added to Slide 11 and that its text matches exactly.",
        "is_critical": true,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score() -> tuple[str, float]:\n    \"\"\"Score presence and relative font size of the title on slide 11.\n\n    Improvements:\n    - Defensive check if slide 11 exists.\n    \"\"\"\n    from pptx import Presentation\n\n    ppt_path = globals().get(\"modified_ppt_path\")\n    if ppt_path is None:\n        return (\"modified_ppt_path not provided in evaluation context.\", 0.0)\n    prs = Presentation(ppt_path)\n    # Slide index 10 == \"Slide 11\" for users.\n    if len(prs.slides) <= 10:\n        return (\"Presentation does not contain Slide 11.\", 0.0)\n    slide = prs.slides[10]\n\n    title_shape = None\n    objective_shape = None\n    for shape in slide.shapes:\n        if not getattr(shape, \"has_text_frame\", False):\n            continue\n        try:\n            text = (shape.text or \"\").strip().lower()\n        except Exception:\n            continue\n        if 'objective' in text and objective_shape is None:  # first occurrence\n            objective_shape = shape\n        # Require exact match (case-insensitive) for title\n        if text == 'storm event analysis':\n            title_shape = shape\n\n    if title_shape is None:\n        return (\"Title 'Storm Event Analysis' not found on Slide 11.\", 0.0)\n\n    return (\"Title 'Storm Event Analysis' found on Slide 11.\", 1.0)"
        }
      },
      {
        "name": "Title position: Above objective text",
        "description": "Verifies that the added title appears above the objective text on slide 11 (not below or off-slide).",
        "is_critical": true,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score() -> tuple[str, float]:\n    from pptx import Presentation\n    prs = Presentation(modified_ppt_path)\n    slide = prs.slides[10] if len(prs.slides) > 10 else None\n    # Find title shape and objective shape\n    title_shape = None\n    objective_shape = None\n    for shape in slide.shapes:\n        if not shape.has_text_frame:\n            continue\n        text = shape.text.strip().lower()\n        if text == 'storm event analysis':\n            title_shape = shape\n        elif 'objective' in text or 'objectives' in text:\n            objective_shape = shape\n    if title_shape is None:\n        return (\"Could not find the title shape on Slide 11.\", 0.0)\n    if objective_shape is None:\n        return (\"Could not find the objective text shape on Slide 11.\", 0.0)\n    # Check vertical position (y)\n    title_top = title_shape.top\n    objective_top = objective_shape.top\n    if title_top < objective_top:\n        return (\"Title is positioned above the objective text.\", 1.0)\n    else:\n        return (\"Title is not above the objective text.\", 0.0)\n"
        }
      },
      {
        "name": "No extraneous changes to slide content",
        "description": "Checks that no unnecessary changes (e.g., extra added slides, deleted content, unrelated text, or formatting) were made to slide 11 or the rest of the presentation.",
        "is_critical": false,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score() -> tuple[str, float]:\n    # We allow only one added text shape on slide 11 with the target title text, and no removed slides/content.\n    # Allow reasonable formatting changes, but not added/deleted slides/content elsewhere.\n    extraneous = False\n    # Check for added/removed slides\n    if ppt_diff.added_slides:\n        return (f\"Slides were added: {[s.slide_number for s in ppt_diff.added_slides]}\", 0.0)\n    if ppt_diff.removed_slides:\n        return (f\"Slides were removed: {[s.slide_number for s in ppt_diff.removed_slides]}\", 0.0)\n    # Check for removed shapes on slide 11\n    # (We cannot directly check for removed shapes, so instead, check for removed animations/transition on slide 11)\n    any_removal_on_11 = False\n    for anim in ppt_diff.removed_animations:\n        if anim.slide_id == '11':\n            any_removal_on_11 = True\n    for tr in ppt_diff.removed_transitions:\n        if tr.slide_id == '11':\n            any_removal_on_11 = True\n    if any_removal_on_11:\n        return (\"Animations or transitions were removed from slide 11.\", 0.0)\n    # Check for significant text changes (unrelated text added)\n    # Use python-pptx to compare text on slide 11 between original and modified\n    from pptx import Presentation\n    orig = Presentation(original_ppt_path)\n    mod = Presentation(modified_ppt_path)\n    orig_slide = None\n    mod_slide = None\n    slides_o = list(orig.slides)\n    slides_m = list(mod.slides)\n    if len(slides_o) < 11 or len(slides_m) < 11:\n        return (\"Slide 11 does not exist in one of the presentations.\", 0.0)\n    orig_slide = slides_o[10]\n    mod_slide = slides_m[10]\n    def get_texts(slide):\n        return set([shape.text.strip() for shape in slide.shapes if hasattr(shape, 'text') and shape.has_text_frame])\n    orig_texts = get_texts(orig_slide)\n    mod_texts = get_texts(mod_slide)\n    added_texts = mod_texts - orig_texts\n    # Remove the expected title if present\n    added_texts = {t for t in added_texts if t.lower() != 'storm event analysis'}\n    if added_texts:\n        return (f\"Extraneous text added to slide 11: {added_texts}\", 0.0)\n    return (\"No extraneous changes found.\", 1.0)\n"
        }
      },
      {
        "name": "Title is bigger than objective text",
        "description": "Checks that the title 'Storm Event Analysis' is visually larger than the objective text on slide 11.",
        "is_critical": false,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score() -> tuple[str, float]:\n    # Use VLM to compare before/after slide 5 prominence\n    mod_img = None\n\n    for s in modified_ppt_screenshots:\n        if s.slide_number == 11:\n            mod_img = s.image_path\n            break\n        \n    prompt = (\n        \"Given this screenshot of a PowerPoint slide, is the font size of the title 'Storm Event Analysis' bigger than the font size of the text 'Objective: Assess Sea Level Rise Impacts to Groundwater Table'?\\n\"\n        \"Answer YES or NO and explain.\"\n    )\n    result = vlm_call(prompt, [mod_img], temperature=0.0, max_tokens=5)\n    if 'YES' in result.upper():\n        return f\"VLM confirms the title text is bigger than the objective text.\", 1.0\n    elif 'NO' in result.upper():\n        return f\"VLM confirms the title text is not bigger than the objective text.\", 0.0\n    else:\n        return f\"Ambiguous VLM result: {result}\", 0.5\n"
        }
      }
    ]
  },
  "metadata": {
    "task": "Slide 11: Add a title 'Storm Event Analysis' above the objective text"
  }
}