{
  "root": {
    "name": "Change the title color of 'Accounting Equation' from blue to red",
    "description": "Evaluates whether the agent successfully changed the color of the slide title 'Accounting Equation' from blue to red, without introducing errors or unnecessary changes.",
    "is_critical": true,
    "metadata": {},
    "children": [
      {
        "name": "Title color correctly changed to red",
        "description": "Checks that the text of the title 'Accounting Equation' is now red on the appropriate slide(s).",
        "is_critical": true,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score() -> tuple[str, float]:\n    from pptx import Presentation\n    from pptx.dml.color import RGBColor, MSO_COLOR_TYPE\n    \n    def is_red_color(color_obj):\n        \"\"\"Check if a color is red (accepts various shades of red).\"\"\"\n        if not color_obj or color_obj.type != MSO_COLOR_TYPE.RGB:\n            return False\n        \n        color = color_obj.rgb\n        r, g, b = color[0], color[1], color[2]\n        \n        # Accept various shades of red:\n        # - Pure red: (255, 0, 0)\n        # - Dark red: (238, 0, 0) - which is what we found in the file\n        # - Other common reds: Allow high red (>200) with low green and blue (<50)\n        return r >= 200 and g <= 50 and b <= 50\n    \n    prs = Presentation(modified_ppt_path)\n    found_title = False\n    \n    # Check the first slide first (most likely where the main title should be changed)\n    for slide_num, slide in enumerate(prs.slides, 1):\n        for shape in slide.shapes:\n            if shape.has_text_frame:\n                text = shape.text_frame.text.strip()\n                if text == 'Accounting Equation':\n                    found_title = True\n                    runs = []\n                    for paragraph in shape.text_frame.paragraphs:\n                        runs += paragraph.runs\n                    \n                    # If no runs, fallback to paragraph-level font\n                    if not runs:\n                        for paragraph in shape.text_frame.paragraphs:\n                            font = paragraph.font\n                            if font.color and is_red_color(font.color):\n                                return (f\"Title color is red on slide {slide_num}.\", 1.0)\n                        # Continue to next slide if this title is not red\n                        continue\n                    \n                    # For runs, check all runs are red\n                    all_red = True\n                    for run in runs:\n                        font = run.font\n                        if not font.color or not is_red_color(font.color):\n                            all_red = False\n                            break\n                    \n                    if all_red:\n                        return (f\"Title color is red on slide {slide_num}.\", 1.0)\n                    # Continue to next slide if this title is not fully red\n    \n    if not found_title:\n        return (\"Could not find 'Accounting Equation' title in PPT.\", 0.0)\n    \n    # If we found titles but none were red\n    return (\"Found 'Accounting Equation' titles but none have red color.\", 0.0)\n"
        }
      },
      {
        "name": "Title text and slide are unchanged except for color",
        "description": "Checks that the title text 'Accounting Equation' remains unchanged except for its color, and that it is still on the same slide and is not accidentally removed or duplicated.",
        "is_critical": false,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score() -> tuple[str, float]:\n    from pptx import Presentation\n    orig_prs = Presentation(original_ppt_path)\n    mod_prs = Presentation(modified_ppt_path)\n    original_titles = set()\n    modified_titles = set()\n    for slide_idx, slide in enumerate(orig_prs.slides):\n        for shape in slide.shapes:\n            if shape.has_text_frame:\n                if shape.text_frame.text.strip() == 'Accounting Equation':\n                    original_titles.add((slide_idx, shape.text_frame.text.strip()))\n    for slide_idx, slide in enumerate(mod_prs.slides):\n        for shape in slide.shapes:\n            if shape.has_text_frame:\n                if shape.text_frame.text.strip() == 'Accounting Equation':\n                    modified_titles.add((slide_idx, shape.text_frame.text.strip()))\n    if not original_titles:\n        return (\"No 'Accounting Equation' title found in original presentation.\", 0.0)\n    if not modified_titles:\n        return (\"'Accounting Equation' title has been removed.\", 0.0)\n    # There should be same number of such titles in same slides (by index)\n    orig_slide_idxs = set([idx for idx, _ in original_titles])\n    mod_slide_idxs = set([idx for idx, _ in modified_titles])\n    if orig_slide_idxs != mod_slide_idxs:\n        return (\"Title has been moved or duplicated/deleted.\", 0.0)\n    return (\"Title text and slide unchanged except for color.\", 1.0)\n"
        }
      },
      {
        "name": "No extraneous changes made to slides",
        "description": "Checks that no slides, content, animations, or transitions have been modified except as required for the color change.",
        "is_critical": false,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score() -> tuple[str, float]:\n    \"\"\"Return (message, score) enforcing that ONLY allowed change is font color of\n    the title text 'Accounting Equation' on slide 1 (index 0). No other slide or\n    element may change (text, shape count, structure, or color). If nothing changed\n    that's also acceptable.\n    \"\"\"\n    p = ppt_diff\n\n    # Hard disallow structural presentation-level changes first\n    if p.added_slides or p.removed_slides:\n        return (\"Extraneous slides were added or removed.\", 0.0)\n    if p.added_animations or p.removed_animations:\n        return (\"Extraneous animations were added or removed.\", 0.0)\n    if p.added_transitions:\n        return (\"Extraneous transitions were added.\", 0.0)\n\n    from pptx import Presentation\n    try:\n        orig_prs = Presentation(original_ppt_path)\n        mod_prs = Presentation(modified_ppt_path)\n    except Exception:\n        return (\"Failed to open presentations.\", 0.0)\n\n    if len(orig_prs.slides) != len(mod_prs.slides):\n        return (\"Slide count changed.\", 0.0)\n\n    def is_target_title(shape) -> bool:\n        if not getattr(shape, 'has_text_frame', False):\n            return False\n        try:\n            return shape.text_frame.text.strip() == 'Accounting Equation'\n        except Exception:\n            return False\n\n    def run_signatures(shape):\n        \"\"\"List[(run_text, color_signature)] for a text shape.\n        color_signature favors explicit RGB else falls back to (theme, type).\n        \"\"\"\n        sigs = []\n        if not getattr(shape, 'has_text_frame', False):\n            return sigs\n        try:\n            for para in shape.text_frame.paragraphs:\n                for run in para.runs:\n                    rgb_val = None\n                    theme = None\n                    ctype = None\n                    try:\n                        color = run.font.color\n                        if color is not None:\n                            rgb = getattr(color, 'rgb', None)\n                            if rgb is not None:\n                                try:\n                                    rgb_val = str(rgb)  # 'RRGGBB'\n                                except Exception:\n                                    rgb_val = repr(rgb)\n                            theme = getattr(color, 'theme_color', None)\n                            ctype = getattr(color, 'type', None)\n                    except Exception:\n                        pass\n                    sigs.append((run.text, (rgb_val, str(theme), str(ctype))))\n        except Exception:\n            # Fallback single signature if iteration fails\n            try:\n                sigs.append((shape.text_frame.text, (None, None, None)))\n            except Exception:\n                pass\n        return sigs\n\n    observed_allowed_change = False\n\n    for idx in range(len(orig_prs.slides)):\n        old_slide = orig_prs.slides[idx]\n        new_slide = mod_prs.slides[idx]\n        old_shapes = old_slide.shapes\n        new_shapes = new_slide.shapes\n\n        if len(old_shapes) != len(new_shapes):\n            return ((\"Slide 1 shape count changed (not allowed).\" if idx == 0 else f\"Shape count changed on slide {idx+1} (not allowed).\"), 0.0)\n\n        for o_shape, n_shape in zip(old_shapes, new_shapes):\n            o_has = getattr(o_shape, 'has_text_frame', False)\n            n_has = getattr(n_shape, 'has_text_frame', False)\n            if o_has != n_has:\n                return ((\"Slide 1 structure changed (not allowed).\" if idx == 0 else f\"Structure changed on slide {idx+1} (not allowed).\"), 0.0)\n            if not o_has:\n                # Non-text shapes: we only verify presence/ordering via counts & pairing already\n                continue\n\n            old_text = o_shape.text_frame.text\n            new_text = n_shape.text_frame.text\n            if old_text != new_text:\n                # Any text difference is disallowed (even title text) because only color may change\n                return ((\"Text changed on slide 1 (not allowed).\" if idx == 0 else f\"Text changed on slide {idx+1} (not allowed).\"), 0.0)\n\n            old_sig = run_signatures(o_shape)\n            new_sig = run_signatures(n_shape)\n            # Compare run segmentation & text sequence\n            if len(old_sig) != len(new_sig) or any(ot != nt for (ot, _), (nt, _) in zip(old_sig, new_sig)):\n                return ((\"Run segmentation/text changed on slide 1 (not allowed).\" if idx == 0 else f\"Run segmentation/text changed on slide {idx+1} (not allowed).\"), 0.0)\n\n            # Compare colors\n            colors_changed = any(oc != nc for (_, oc), (_, nc) in zip(old_sig, new_sig))\n\n            if colors_changed:\n                if idx == 0 and is_target_title(o_shape):\n                    # Allowed color change (title only on slide 1)\n                    observed_allowed_change = True\n                else:\n                    return ((\"Non-title color changed on slide 1 (not allowed).\" if idx == 0 else f\"Color changed on slide {idx+1} (not allowed).\"), 0.0)\n\n    # Success whether or not a title color change actually occurred (requirement allows but doesn't mandate it)\n    return (\"No extraneous changes detected.\", 1.0)\n"
        }
      }
    ]
  },
  "metadata": {
    "task": "Change the title color of 'Accounting Equation' from blue to red"
  }
}