{
  "root": {
    "name": "Make the objective text italic on Slide 11",
    "description": "Evaluates whether the agent correctly found and applied italic formatting to the objective text on slide 11, and did not introduce errors or unintended changes.",
    "is_critical": true,
    "metadata": {},
    "children": [
      {
        "name": "Objective Text is Italicized",
        "description": "Checks that the identified objective text on slide 11 is fully italicized after the modification.",
        "is_critical": true,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score() -> tuple[str, float]:\n    from pptx import Presentation\n    import re\n    \n    # Helper: Find the objective text shape\n    def find_objective_text_shape(slide):\n        for shape in slide.shapes:\n            if not shape.has_text_frame:\n                continue\n            text = shape.text_frame.text.strip().lower()\n            if 'objective' in text or re.search(r'(objective[s]?[:]?|goal[s]?[:]?|learning outcome[s]?[:]?|purpose[:]?|aim[s]?[:]?|target[s]?[:]?|intended outcome[s]?[:]?|what you will learn)', text):\n                return shape\n        return None\n    \n    prs = Presentation(modified_ppt_path)\n    slide = prs.slides[10] if len(prs.slides) > 10 else None\n    if not slide:\n        return (\"Slide 11 not found.\", 0.0)\n\n    shape = find_objective_text_shape(slide)\n    if shape is None:\n        return (\"Objective text not found on slide 11.\", 0.0)\n    \n    # Check if all text is italic\n    tf = shape.text_frame\n    all_italic = True\n    for paragraph in tf.paragraphs:\n        for run in paragraph.runs:\n            if not run.font.italic:\n                all_italic = False\n                break\n        if not all_italic:\n            break\n    if all_italic:\n        return (\"All objective text on slide 11 is italicized.\", 1.0)\n    else:\n        # New rule: If only the first word \"Objective\" is italicized, still give full credit.\n        # Find first non-empty paragraph\n        first_para = None\n        for p in tf.paragraphs:\n            if p.text and p.text.strip():\n                first_para = p\n                break\n        if first_para:\n            para_text = first_para.text.lstrip()\n            target = \"objective\"\n            if para_text.lower().startswith(target):\n                # Ensure word boundary after 'Objective' (space, colon, punctuation, or end)\n                boundary_ok = len(para_text) == len(target) or (len(para_text) > len(target) and not para_text[len(target)].isalnum())\n                if boundary_ok:\n                    # Check italic for the characters forming 'Objective'\n                    needed_len = len(target)\n                    collected = 0\n                    italic_flags = []\n                    for run in first_para.runs:\n                        if collected >= needed_len:\n                            break\n                        run_text = run.text\n                        for ch in run_text:\n                            if collected >= needed_len:\n                                break\n                            # skip leading whitespace before starting word\n                            if collected == 0 and ch.isspace():\n                                continue\n                            italic_flags.append(bool(run.font.italic))\n                            collected += 1\n                    if collected == needed_len and italic_flags and all(italic_flags):\n                        return (\"First word 'Objective' is italicized (accepted criteria).\", 1.0)\n        return (\"Not all objective text is italicized.\", 0.0)\n"
        }
      },
      {
        "name": "No Unintended Changes",
        "description": "Ensures that no other text on slide 11 (other than the objective text) was made italic, and that no unrelated content was changed.",
        "is_critical": false,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score() -> tuple[str, float]:\n    from pptx import Presentation\n    import re\n    \n    # Helper: Find the objective text shape\n    def find_objective_text_shape(slide):\n        for shape in slide.shapes:\n            if not shape.has_text_frame:\n                continue\n            text = shape.text_frame.text.strip().lower()\n            if 'objective' in text or re.search(r'(objective[s]?[:]?|goal[s]?[:]?|learning outcome[s]?[:]?|purpose[:]?|aim[s]?[:]?|target[s]?[:]?|intended outcome[s]?[:]?|what you will learn)', text):\n                return shape\n        return None\n    \n    prs_mod = Presentation(modified_ppt_path)\n    prs_orig = Presentation(original_ppt_path)\n    slide_mod = slide_orig = None\n    for s in prs_mod.slides:\n        if hasattr(s, 'slide_id') and s.slide_id == '11':\n            slide_mod = s\n            break\n    if not slide_mod:\n        # fallback: use slide number (1-based)\n        if len(prs_mod.slides) >= 11:\n            slide_mod = prs_mod.slides[10]\n    for s in prs_orig.slides:\n        if hasattr(s, 'slide_id') and s.slide_id == '11':\n            slide_orig = s\n            break\n    if not slide_orig:\n        if len(prs_orig.slides) >= 11:\n            slide_orig = prs_orig.slides[10]\n    if not slide_mod or not slide_orig:\n        return (\"Slide 11 not found in one of the presentations.\", 0.0)\n    \n    shape_obj = find_objective_text_shape(slide_mod)\n    # Gather text from all shapes except objective\n    non_obj_shapes_mod = [sh for sh in slide_mod.shapes if sh != shape_obj and hasattr(sh, 'text_frame') and sh.has_text_frame]\n    non_obj_shapes_orig = [sh for sh in slide_orig.shapes if hasattr(sh, 'text_frame') and sh.has_text_frame]\n    \n    # For each non-objective shape, check if any run was made italic in mod but was not in orig\n    score = 1.0\n    for mod_sh, orig_sh in zip(non_obj_shapes_mod, non_obj_shapes_orig):\n        tf_mod = mod_sh.text_frame\n        tf_orig = orig_sh.text_frame\n        for p_mod, p_orig in zip(tf_mod.paragraphs, tf_orig.paragraphs):\n            # Compare runs by index\n            for run_mod, run_orig in zip(p_mod.runs, p_orig.runs):\n                if not run_orig.font.italic and run_mod.font.italic:\n                    return (\"Detected unintended italics on non-objective text on slide 11.\", 0.0)\n    return (\"No unintended italicization on slide 11.\", 1.0)\n"
        }
      },
      {
        "name": "No Extraneous Changes to Other Slides",
        "description": "Verify that only slide 11 has been modified, and no other slides have been added or removed.",
        "is_critical": false,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score() -> tuple[str, float]:\n    # Only slide 5 (slide_number=5) should be altered\n    problematic_mods = []\n    for (old, new) in ppt_diff.modified_slides:\n        if old.slide_number != 11:\n            # Check if nontrivial changes happened\n            major = False\n            # Check notes, title, number of elements (as proxy)\n            if old.title != new.title or (old.notes or \"\") != (new.notes or \"\") or old.element_count != new.element_count:\n                major = True\n            if major:\n                problematic_mods.append(old.slide_number)\n    # Check for added/removed slides\n    added = [s.slide_number for s in ppt_diff.added_slides if s.slide_number != 11]\n    removed = [s.slide_number for s in ppt_diff.removed_slides if s.slide_number != 11]\n    if problematic_mods or added or removed:\n        return f\"Slides other than 11 changed: modified={problematic_mods}, added={added}, removed={removed}.\", 0.0\n    return \"No extraneous changes to other slides.\", 1.0\n"
        }
      }
    ]
  },
  "metadata": {
    "task": "Slide 11: Make the objective text italic"
  }
}