{
  "root": {
    "name": "slide_2_paragraph_to_bullets",
    "description": "Evaluates if slide 2's paragraph was split into two bullet points as specified, and the second bullet was indented.",
    "is_critical": true,
    "metadata": {},
    "children": [
      {
        "name": "slide_2_content_changed",
        "description": "Checks if slide 2's content was modified.",
        "is_critical": true,
        "metadata": {},
        "children": [
          {
            "name": "slide_2_bullets_present",
            "description": "Verifies two correct bullet points now exist on slide 2.",
            "is_critical": true,
            "metadata": {},
            "scorer": {
              "type": "function",
              "function_code": "def compute_score() -> tuple[str, float]:\n    # Use VLM to check whether both specified bullet points are present on slide 2\n    # Find slide 2 screenshot (supports object with attributes or dict with keys)\n    slide_2_image = None\n    \n    if len(ppt_diff.modified_slides) == 0:\n        return 'No modifications detected on slide 2.', 0.0\n    \n    for s in modified_ppt_screenshots:\n        try:\n            s_num = getattr(s, 'slide_number', None)\n            if s_num is None and isinstance(s, dict):\n                s_num = s.get('slide_number')\n            if s_num == 2:\n                slide_2_image = s.image_path\n                break\n        except Exception:\n            continue\n    if not slide_2_image:\n        return 'Slide 2 screenshot not found.', 0.0\n\n    prompt = (\n        \"Look at this PowerPoint slide (slide 2) and read the bullet points.\\n\"\n        \"We expect exactly these two bullet sentences to appear as bullets:\\n\"\n        \"1) 'Obesity is defined as excess body fat'\\n\"\n        \"2) 'Because body fat is difficult to measure directly, obesity is often measured by body mass index (BMI)'\\n\"\n        \"Do both of these exact bullet sentences appear on the slide (ignore indentation issues)? Respond with:\\n\"\n        \"- YES if both appear,\\n\"\n        \"- PARTIAL if only one appears,\\n\"\n        \"- NONE if neither appears.\"\n    )\n\n    try:\n        response = vlm_call(images=[slide_2_image], prompt=prompt, temperature=0.1, max_tokens=200)\n        resp = str(response).strip()\n        if 'YES' in resp and 'PARTIAL' not in resp and 'NONE' not in resp:\n            return response, 1.0\n        elif 'PARTIAL' in resp or ('YES' in resp and 'NO' in resp):\n            return response, 0.5\n        elif 'NONE' in resp or 'NO' in resp:\n            return response, 0.0\n        else:\n            return f'Unclear response from VLM: {response}', 0.0\n    except Exception as e:\n        return f'Error during VLM check: {str(e)}', 0.0\n"
            }
          },
          {
            "name": "slide_2_second_bullet_indented",
            "description": "Checks if the second bullet is indented relative to the first bullet.",
            "is_critical": true,
            "metadata": {},
            "scorer": {
              "type": "function",
              "function_code": "def compute_score() -> tuple[str, float]:\n    # Use VLM to check whether the second bullet is indented under the first on slide 2\n    slide_2_image = None\n    if len(ppt_diff.modified_slides) == 0:\n        return 'No modifications detected on slide 2.', 0.0\n    for s in modified_ppt_screenshots:\n        try:\n            if getattr(s, 'slide_number', None) == 2:\n                slide_2_image = s.image_path\n                break\n        except Exception:\n            continue\n    if not slide_2_image:\n        return 'Slide 2 screenshot not found.', 0.0\n\n    prompt = (\n        \"Look at this PowerPoint slide (slide 2).\\n\"\n        \"We expect two bullet sentences:\\n\"\n        \"1) 'Obesity is defined as excess body fat'\\n\"\n        \"2) 'Because body fat is difficult to measure directly, obesity is often measured by body mass index (BMI)'\\n\"\n        \"Is the second sentence presented as an indented sub-bullet under the first (i.e., clearly at a deeper level)?\\n\"\n        \"Respond with 'YES' if it is indented as a sub-bullet, 'NO' if it is at the same or higher level, or 'NOT_FOUND' if these bullets are not visible.\"\n    )\n\n    try:\n        response = vlm_call(images=[slide_2_image], prompt=prompt, temperature=0.1, max_tokens=200)\n        resp = str(response).strip()\n        if 'YES' in resp and 'NO' not in resp:\n            return response, 1.0\n        elif 'NOT_FOUND' in resp:\n            return response, 0.0\n        elif 'NO' in resp or 'NONE' in resp:\n            return response, 0.0\n        else:\n            return f'Unclear response from VLM: {response}', 0.0\n    except Exception as e:\n        return f'Error during VLM check: {str(e)}', 0.0\n"
            }
          }
        ]
      },
      {
        "name": "slide_2_no_extraneous_changes",
        "description": "Checks for absence of unintended changes on slide 2 (e.g., unrelated text/formatting changes).",
        "is_critical": false,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score():\n    # Check for modifications to slide 2 other than bullet/text changes\n    extraneous = False\n    for s1, s2 in ppt_diff.modified_slides:\n        if s1.slide_number == 2 or s2.slide_number == 2:\n            # Compare layout_type, notes, element_count\n            # Ignore title, since that's often the paragraph.\n            if (s1.layout_type != s2.layout_type) or (s1.notes != s2.notes) or (s1.element_count != s2.element_count):\n                extraneous = True\n    if extraneous:\n        return 'Extraneous changes detected on slide 2.', 0.0\n    return 'No extraneous changes detected on slide 2.', 1.0\n"
        }
      }
    ]
  },
  "metadata": {
    "task": "On slide 2, break the paragraph into two bullet points:  'Obesity is defined as excess body fat' and 'Because body fat is difficult to measure directly, obesity is often measured by body mass index (BMI)', and indent the second bullet point"
  }
}