{
  "root": {
    "name": "Change title text on first slide to 'French Architect: Jean-Nicolas-Louis Durand'",
    "description": "Evaluates whether the agent correctly and completely changed the title text on the first slide, without making unwanted changes elsewhere.",
    "is_critical": true,
    "metadata": {},
    "children": [
      {
        "name": "Title text on first slide is exactly 'French Architect: Jean-Nicolas-Louis Durand'",
        "description": "Checks that the first slide's title text was changed and matches exactly the required string.",
        "is_critical": true,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score() -> tuple[str, float]:\n    from pptx import Presentation\n    \n    prs = Presentation(modified_ppt_path)\n    first_slide = prs.slides[0]\n    title_shape = None\n    for shape in first_slide.shapes:\n        if shape.has_text_frame:\n            if shape.text_frame.text.strip():\n                # Heuristic: Title is likely the first non-empty text shape of a slide\n                title_shape = shape\n                break\n    if not title_shape:\n        return (\"No title text found on first slide.\", 0.0)\n    actual_title = title_shape.text_frame.text.strip()\n    required_title = \"French Architect: Jean-Nicolas-Louis Durand\"\n    if actual_title == required_title:\n        return (\"Title matches exactly.\", 1.0)\n    elif required_title.lower() in actual_title.lower():\n        return (\"Title contains required string but is not exact.\", 0.5)\n    else:\n        return (f\"Title does not match. Found: '{actual_title}'\", 0.0)\n"
        }
      },
      {
        "name": "No extraneous changes to first slide except title",
        "description": "Checks that the only change to the first slide is the title text, with no changes to layout, other text, elements, notes, animations, or transitions.",
        "is_critical": false,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score() -> tuple[str, float]:\n    # Check for extraneous changes on first slide beyond the title\n    first_slide_id = None\n    # Find first slide id from original PPT\n    from pptx import Presentation\n    prs = Presentation(original_ppt_path)\n    first_slide = prs.slides[0]\n    if hasattr(first_slide, 'slide_id'): # python-pptx 0.6.21+\n        first_slide_id = str(first_slide.slide_id)\n    else:\n        # fallback to slide_number\n        first_slide_id = str(1)\n    changed = False\n    reasons = []\n    # Check for modified animations\n    for anim_tuple in ppt_diff.modified_animations:\n        before, after = anim_tuple\n        if before.slide_id == first_slide_id:\n            changed = True\n            reasons.append(\"Animations were changed on first slide.\")\n    # Check for modified transitions\n    for trans_tuple in ppt_diff.modified_transitions:\n        before, after = trans_tuple\n        if before.slide_id == first_slide_id:\n            changed = True\n            reasons.append(\"Transitions were changed on first slide.\")\n    # Check for notes change\n    for slide_tuple in ppt_diff.modified_slides:\n        before, after = slide_tuple\n        if before.slide_id == first_slide_id:\n            # Check if notes changed\n            if (before.notes or \"\") != (after.notes or \"\"):\n                changed = True\n                reasons.append(\"Slide notes were changed on first slide.\")\n    # Check for added/removed elements (element_count)\n    for slide_tuple in ppt_diff.modified_slides:\n        before, after = slide_tuple\n        if before.slide_id == first_slide_id:\n            if before.element_count != after.element_count:\n                changed = True\n                reasons.append(\"Elements were added/removed on first slide.\")\n    # Check for layout change\n    for slide_tuple in ppt_diff.modified_slides:\n        before, after = slide_tuple\n        if before.slide_id == first_slide_id:\n            if (before.layout_type or \"\") != (after.layout_type or \"\"):\n                changed = True\n                reasons.append(\"Layout type was changed on first slide.\")\n    # Check for changes to other text (besides title)\n    # For this, compare all text shapes except the title\n    import difflib\n    original_prs = Presentation(original_ppt_path)\n    modified_prs = Presentation(modified_ppt_path)\n    orig_slide = original_prs.slides[0]\n    mod_slide = modified_prs.slides[0]\n    # Find title shape index in both\n    def get_title_shape(slide):\n        for shape in slide.shapes:\n            if shape.has_text_frame and shape.text_frame.text.strip():\n                return shape\n        return None\n    orig_title_shape = get_title_shape(orig_slide)\n    mod_title_shape = get_title_shape(mod_slide)\n    # Compare all other text shapes\n    orig_texts = [shape.text_frame.text.strip() for shape in orig_slide.shapes if shape.has_text_frame and shape != orig_title_shape]\n    mod_texts = [shape.text_frame.text.strip() for shape in mod_slide.shapes if shape.has_text_frame and shape != mod_title_shape]\n    if orig_texts != mod_texts:\n        changed = True\n        reasons.append(\"Other text on first slide was changed.\")\n    if changed:\n        return (\"; \".join(reasons), 0.0)\n    else:\n        return (\"No extraneous changes to first slide except title.\", 1.0)\n"
        }
      },
      {
        "name": "No extraneous changes to other slides",
        "description": "Checks that no slides except the first slide were changed (content, layout, notes, animations, transitions, etc.).",
        "is_critical": false,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score() -> tuple[str, float]:\n    # Only the first slide should be changed; all other slides untouched\n    if ppt_diff.added_slides or ppt_diff.removed_slides:\n        return (\"Slides added or removed.\", 0.0)\n    # Animations or transitions\n    if ppt_diff.added_animations or ppt_diff.removed_animations or ppt_diff.modified_animations:\n        return (\"Animations changed.\", 0.0)\n    if ppt_diff.added_transitions or ppt_diff.removed_transitions or ppt_diff.modified_transitions:\n        return (\"Transitions changed.\", 0.0)\n    \n    changed = False\n    reasons = []\n    first_slide_ids = set()\n    from pptx import Presentation\n    orig_prs = Presentation(original_ppt_path)\n    for i, slide in enumerate(orig_prs.slides):\n        if hasattr(slide, 'slide_id'):\n            first_slide_ids.add(str(slide.slide_id))\n            if i == 0:\n                first_slide_id = str(slide.slide_id)\n        else:\n            first_slide_ids.add(str(i+1))\n            if i == 0:\n                first_slide_id = str(i+1)\n    # Check for modified slides not the first\n    for slide_tuple in ppt_diff.modified_slides:\n        before, after = slide_tuple\n        if before.slide_id != first_slide_id:\n            changed = True\n            reasons.append(f\"Slide {before.slide_number} was modified.\")\n    # Check for added/removed slides\n    for slide in ppt_diff.added_slides:\n        if slide.slide_id != first_slide_id:\n            changed = True\n            reasons.append(f\"Slide {slide.slide_number} was added.\")\n    for slide in ppt_diff.removed_slides:\n        if slide.slide_id != first_slide_id:\n            changed = True\n            reasons.append(f\"Slide {slide.slide_number} was removed.\")\n    # Check for modified animations/transitions on other slides\n    for anim_tuple in ppt_diff.modified_animations:\n        before, after = anim_tuple\n        if before.slide_id != first_slide_id:\n            changed = True\n            reasons.append(f\"Animations were changed on slide {before.slide_number}.\")\n    for trans_tuple in ppt_diff.modified_transitions:\n        before, after = trans_tuple\n        if before.slide_id != first_slide_id:\n            changed = True\n            reasons.append(f\"Transitions were changed on slide {before.slide_number}.\")\n    if changed:\n        return (\"; \".join(reasons), 0.0)\n    else:\n        return (\"No extraneous changes to other slides.\", 1.0)\n"
        }
      }
    ]
  },
  "metadata": {
    "task": "Change the title text to 'French Architect: Jean-Nicolas-Louis Durand' on the first slide",
    "compute_strategy": "default",
    "critical_node_weight": 0.7
  }
}