{
  "root": {
    "name": "Slide 10: Add bullet point explaining 'Objects include CSS files, JavaScript files, images, videos'",
    "description": "Evaluate whether Slide 10 has a new bullet point added at an appropriate location with the required explanation, and that no extraneous changes were made.",
    "is_critical": true,
    "metadata": {},
    "children": [
      {
        "name": "Bullet point with correct content is added on Slide 10",
        "description": "Verify that a bullet point explaining 'Objects include CSS files, JavaScript files, images, videos' was added to Slide 10, with sufficiently correct content.",
        "is_critical": true,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score() -> tuple[str, float]:\n    from pptx import Presentation\n    import re\n    \n    # Load the modified presentation\n    prs = Presentation(modified_ppt_path)\n    \n    # Find slide 10 (1-based index)\n    if len(prs.slides) < 10:\n        return (\"Modified presentation has fewer than 10 slides.\", 0.0)\n    slide = prs.slides[9]\n\n    # Extract all text from placeholders and shapes\n    bullet_texts = []\n    for shape in slide.shapes:\n        if not shape.has_text_frame:\n            continue\n        for para in shape.text_frame.paragraphs:\n            text = para.text.strip()\n            if not text:\n                continue\n            bullet_texts.append(text)\n    \n    # Check for the required bullet point (flexible match)\n    required_keywords = ['css file', 'javascript file', 'image', 'video']\n    found = False\n    for text in bullet_texts:\n        lower = text.lower()\n        if all(any(kw in lower for kw in key_group.split(',')) for key_group in [\n            'css file,css files', 'javascript file,javascript files', 'image,images', 'video,videos']):\n            found = True\n            break\n    if found:\n        return (\"Bullet point with correct content found on Slide 10.\", 1.0)\n    # Try more forgiving match: check if at least 3 of the 4 types are present\n    for text in bullet_texts:\n        lower = text.lower()\n        count = sum(any(kw in lower for kw in key_group.split(',')) for key_group in [\n            'css file,css files', 'javascript file,javascript files', 'image,images', 'video,videos'])\n        if count >= 3:\n            return (\"Bullet point mostly correct (at least 3/4 object types present).\", 0.7)\n    return (\"No bullet point with the required explanation found on Slide 10.\", 0.0)\n"
        }
      },
      {
        "name": "Bullet point is at an appropriate place",
        "description": "Verify that the new bullet point was added in a location that is semantically and visually appropriate (i.e., within the main content, not in an unrelated area or outside a bullet list).",
        "is_critical": false,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score() -> tuple[str, float]:\n    from rubric.utils.llm_tools import vlm_call\n    # Use VLM to compare original vs modified slide 10 and verify that the\n    # bullet \"Objects include CSS files, JavaScript files, images, videos\"\n    # was added in a visually and semantically appropriate place.\n    slide_number = 10\n\n    original_image = None\n    modified_image = None\n\n    # Find slide 10 in original screenshots (robust to object/dict entries)\n    for s in original_ppt_screenshots:\n        try:\n            s_num = getattr(s, \"slide_number\", None)\n            if s_num is None and isinstance(s, dict):\n                s_num = s.get(\"slide_number\")\n            if s_num == slide_number:\n                original_image = getattr(s, \"image_path\", None)\n                if original_image is None and isinstance(s, dict):\n                    original_image = s.get(\"image_path\") or s.get(\"path\")\n                break\n        except Exception:\n            continue\n\n    # Find slide 10 in modified screenshots (robust to object/dict entries)\n    for s in modified_ppt_screenshots:\n        try:\n            s_num = getattr(s, \"slide_number\", None)\n            if s_num is None and isinstance(s, dict):\n                s_num = s.get(\"slide_number\")\n            if s_num == slide_number:\n                modified_image = getattr(s, \"image_path\", None)\n                if modified_image is None and isinstance(s, dict):\n                    modified_image = s.get(\"image_path\") or s.get(\"path\")\n                break\n        except Exception:\n            continue\n\n    if not modified_image:\n        return (\"Modified slide 10 screenshot not found.\", 0.0)\n    if not original_image:\n        return (\"Original slide 10 screenshot not found.\", 0.0)\n\n    target_bullet = \"Objects include CSS files, JavaScript files, images, videos\"\n\n    prompt = (\n        \"Compare two images of the same PowerPoint slide (slide 10):\\n\"\n        \"Image A is the original; Image B is the modified.\\n\\n\"\n        \"Task:\\n\"\n        f\"1) Determine if a bullet with EXACT text:\\n\\\"{target_bullet}\\\"\\n\"\n        \"   is present in Image B but NOT present in Image A.\\n\"\n        \"2) If present, judge whether its placement is visually and semantically appropriate\\n\"\n        \"   relative to the existing bullets and content (i.e., appears as part of the same list/group,\\n\"\n        \"   consistent alignment/indentation, reasonable ordering among similar items, not isolated or\\n\"\n        \"   in an unrelated area like title/header/legend/footnote).\\n\\n\"\n        \"Instructions:\\n\"\n        \"- Ignore minor formatting/style differences.\\n\"\n        \"- Base your judgment on visual grouping, proximity, alignment, and content coherence.\\n\\n\"\n        \"Respond with ONE of the following labels ONLY (uppercase), followed by a brief justification:\\n\"\n        \"- PRESENT_AND_APPROPRIATE: the exact bullet is newly present and its placement is appropriate.\\n\"\n        \"- PRESENT_BUT_INAPPROPRIATE: the exact bullet is newly present but placement is inappropriate.\\n\"\n        \"- NOT_PRESENT: the exact bullet is not present in the modified slide.\\n\"\n    )\n\n    try:\n        response = vlm_call(images=[original_image, modified_image], prompt=prompt, temperature=0.1, max_tokens=300)\n        resp = str(response).strip().upper()\n        if resp.startswith(\"PRESENT_AND_APPROPRIATE\"):\n            return response, 1.0\n        if resp.startswith(\"PRESENT_BUT_INAPPROPRIATE\"):\n            return response, 0.5\n        if resp.startswith(\"NOT_PRESENT\"):\n            return response, 0.0\n        # Fallback: try simple YES/NO detection if labels weren't followed\n        low = resp.lower()\n        if \"present\" in low and \"appropriate\" in low:\n            return response, 1.0\n        if \"present\" in low and \"inappropriate\" in low:\n            return response, 0.5\n        if low.startswith(\"yes\"):\n            return response, 0.6\n        if low.startswith(\"no\"):\n            return response, 0.0\n        return f\"Unclear VLM response: {response}\", 0.0\n    except Exception as e:\n        return (f\"Error during VLM comparison: {str(e)}\", 0.0)\n"
        }
      },
      {
        "name": "No extraneous changes on Slide 10",
        "description": "Check that no unrelated or extraneous changes (text, layout, images, animations, transitions) were made to Slide 10, except for the bullet point addition.",
        "is_critical": false,
        "metadata": {},
        "children": [
          {
            "name": "No extraneous text or element changes on Slide 10",
            "description": "Ensure that only the bullet point was added and no unrelated text or element changes were made on Slide 10.",
            "is_critical": false,
            "metadata": {},
            "scorer": {
              "type": "function",
              "function_code": "def compute_score() -> tuple[str, float]:\n    # We'll compare the PPTDiff for Slide 10\n    slide_num = 10\n    slide_id = None\n    # Try to find slide_id for slide 10 in original, if needed\n    \n    \n    if ppt_diff.added_slides or ppt_diff.removed_slides:\n        if len(ppt_diff.added_slides) == 1 and len(ppt_diff.removed_slides) == 1 \\\n            and ppt_diff.added_slides[0].slide_number == 10 \\\n            and ppt_diff.removed_slides[0].slide_number == 10:\n                pass\n        else:\n            # Slide structure changed, penalize\n            return (\"Slides added or removed; structure changed.\", 0.0)\n    # Check for text changes, images, etc. Only allow one text addition\n    from pptx import Presentation\n    orig = Presentation(original_ppt_path)\n    mod = Presentation(modified_ppt_path)\n    orig_slide = orig.slides[slide_num - 1]\n    mod_slide = mod.slides[slide_num - 1]\n    # Count total text paragraphs in original and modified\n    orig_texts = []\n    for shape in orig_slide.shapes:\n        if shape.has_text_frame:\n            orig_texts.extend([p.text.strip() for p in shape.text_frame.paragraphs if p.text.strip()])\n    mod_texts = []\n    for shape in mod_slide.shapes:\n        if shape.has_text_frame:\n            mod_texts.extend([p.text.strip() for p in shape.text_frame.paragraphs if p.text.strip()])\n    # Only one new text (the bullet point) should be present\n    extra = [t for t in mod_texts if t not in orig_texts]\n    if len(extra) > 1:\n        return (f\"{len(extra)} new text entries on Slide 10 (expected 1).\", 0.0)\n    # Check for removed or changed text\n    removed = [t for t in orig_texts if t not in mod_texts]\n    if removed:\n        return (\"Text was removed from Slide 10.\", 0.0)\n    # Check for new images or shapes\n    orig_shapes = [s for s in orig_slide.shapes]\n    mod_shapes = [s for s in mod_slide.shapes]\n    if len(mod_shapes) > len(orig_shapes) + 1:\n        return (\"More than one new shape was added to Slide 10.\", 0.0)\n    return (\"No extraneous text or elements added to Slide 10.\", 1.0)\n"
            }
          },
          {
            "name": "No extraneous animations/transitions on Slide 10",
            "description": "Ensure that no new or removed animations or transitions were introduced to Slide 10.",
            "is_critical": false,
            "metadata": {},
            "scorer": {
              "type": "function",
              "function_code": "def compute_score() -> tuple[str, float]:\n    slide_num = 10\n    # Find the slide_id for slide 10 in the original PPT if possible\n    from pptx import Presentation\n    prs = Presentation(original_ppt_path)\n    if len(prs.slides) < slide_num:\n        return (\"Original presentation has fewer than 10 slides.\", 0.0)\n    orig_slide = prs.slides[slide_num-1]\n    slide_id = getattr(orig_slide, 'slide_id', None)\n    # Check for animations\n    anims = [a for a in ppt_diff.added_animations if (not slide_id or a.slide_id == slide_id)]\n    if anims:\n        return (\"Animation(s) added to Slide 10.\", 0.0)\n    anims = [a for a in ppt_diff.removed_animations if (not slide_id or a.slide_id == slide_id)]\n    if anims:\n        return (\"Animation(s) removed from Slide 10.\", 0.0)\n    # Check transitions\n    trans = [t for t in ppt_diff.added_transitions if (not slide_id or t.slide_id == slide_id)]\n    if trans:\n        return (\"Transition(s) added to Slide 10.\", 0.0)\n    trans = [t for t in ppt_diff.removed_transitions if (not slide_id or t.slide_id == slide_id)]\n    if trans:\n        return (\"Transition(s) removed from Slide 10.\", 0.0)\n    return (\"No extraneous animations or transitions on Slide 10.\", 1.0)\n"
            }
          }
        ]
      },
      {
        "name": "No extraneous changes to other slides",
        "description": "Verify that no changes (text, layout, slides, images, animations, transitions) were made to slides other than Slide 10.",
        "is_critical": false,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score() -> tuple[str, float]:\n    from pptx import Presentation\n    orig = Presentation(original_ppt_path)\n    mod = Presentation(modified_ppt_path)\n    n = min(len(orig.slides), len(mod.slides))\n    # Check for slide additions/removals\n    if len(orig.slides) != len(mod.slides):\n        return (\"Number of slides changed.\", 0.0)\n    # Check each non-10 slide for changes\n    for i in range(n):\n        if i == 9:\n            continue  # skip slide 10\n        orig_slide = orig.slides[i]\n        mod_slide = mod.slides[i]\n        # Check text differences\n        orig_texts = []\n        for shape in orig_slide.shapes:\n            if shape.has_text_frame:\n                orig_texts.extend([p.text.strip() for p in shape.text_frame.paragraphs if p.text.strip()])\n        mod_texts = []\n        for shape in mod_slide.shapes:\n            if shape.has_text_frame:\n                mod_texts.extend([p.text.strip() for p in shape.text_frame.paragraphs if p.text.strip()])\n        if set(orig_texts) != set(mod_texts):\n            return (f\"Text changed on slide {i+1}.\", 0.0)\n        # Check for shapes/images\n        if len(orig_slide.shapes) != len(mod_slide.shapes):\n            return (f\"Shapes/images changed on slide {i+1}.\", 0.0)\n    # Also check for animations/transitions globally except on slide 10\n    for anim in ppt_diff.added_animations + ppt_diff.removed_animations:\n        if anim.slide_id and anim.slide_id != orig.slides[9].slide_id:\n            return (f\"Animation change on slide not 10.\", 0.0)\n    for t in ppt_diff.added_transitions + ppt_diff.removed_transitions:\n        if t.slide_id and t.slide_id != orig.slides[9].slide_id:\n            return (f\"Transition change on slide not 10.\", 0.0)\n    return (\"No extraneous changes to other slides.\", 1.0)\n"
        }
      }
    ]
  },
  "metadata": {
    "task": "Slide 10: Add a bullet point explaining 'Objects include CSS files, JavaScript files, images, videos' at an appropriate place"
  }
}