{
  "root": {
    "name": "Add Appropriate Emojis to Social Class Types on Slide 8",
    "description": "Evaluates whether appropriate emoji icons have been added next to each social class type on slide 8, without making unintended changes to other slides or content",
    "is_critical": false,
    "metadata": {},
    "children": [
      {
        "name": "Emojis Present on Slide 8",
        "description": "Checks if emoji characters or icons are present on slide 8",
        "is_critical": true,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score() -> tuple[str, float]:\n    from pptx import Presentation\n    import re\n    \n    try:\n        ppt = Presentation(modified_ppt_path)\n        \n        if len(ppt.slides) < 8:\n            return \"Slide 8 does not exist\", 0.0\n        \n        slide_8 = ppt.slides[7]\n        \n        # Extract all text from slide 8\n        slide_text = \"\"\n        for shape in slide_8.shapes:\n            if hasattr(shape, \"text\"):\n                slide_text += shape.text + \" \"\n        \n        # Check for emoji characters (Unicode ranges for emojis)\n        emoji_pattern = re.compile(\n            \"[\"\n            \"\\U0001F600-\\U0001F64F\"  # emoticons\n            \"\\U0001F300-\\U0001F5FF\"  # symbols & pictographs\n            \"\\U0001F680-\\U0001F6FF\"  # transport & map\n            \"\\U0001F1E0-\\U0001F1FF\"  # flags\n            \"\\U00002600-\\U000027BF\"  # misc symbols\n            \"\\U0001F900-\\U0001F9FF\"  # supplemental symbols\n            \"]+\"\n        )\n        \n        emojis_found = emoji_pattern.findall(slide_text)\n        \n        if not emojis_found:\n            return \"No emoji characters found on slide 8\", 0.0\n        \n        return f\"Found {len(emojis_found)} emoji(s) on slide 8: {', '.join(emojis_found)}\", 1.0\n        \n    except Exception as e:\n        return f\"Error checking for emojis: {str(e)}\", 0.0\n"
        }
      },
      {
        "name": "Emoji Appropriateness",
        "description": "Evaluates whether the chosen emojis are contextually appropriate for representing social class types",
        "is_critical": true,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score() -> tuple[str, float]:\n    import re\n    # Find slide 8 screenshot\n    slide_8_screenshot = None\n    for screenshot in modified_ppt_screenshots:\n        if screenshot.slide_number == 8:\n            slide_8_screenshot = screenshot\n            break\n    \n    if not slide_8_screenshot:\n        return \"No screenshot available for slide 8\", 0.0\n    \n    prompt = \"\"\"\n    Please analyze this PowerPoint slide containing social class types with emojis.\n    \n    Evaluate the appropriateness of the emoji choices:\n    - Do the emojis make logical sense for the social class they represent?\n    \n    \n    Rate the appropriateness:\n    - 1.0: Emojis are logical and contextually relevant\n    - 0.7: Emojis are generally relevant with minor issues\n    - 0.5: Emojis are somewhat relevant but could be better chosen\n    - 0.0: Emojis are completely irrelevant\n    \n    Respond with the score followed by your reasoning.\n    \"\"\"\n    \n    try:\n        response = vlm_call(prompt, [slide_8_screenshot.image_path], temperature=0.1)\n        \n        # Extract score from response\n        score_match = re.search(r'(0\\.0|0\\.3|0\\.5|0\\.7|1\\.0)', response)\n        if score_match:\n            score = float(score_match.group(1))\n            return f\"Emoji appropriateness assessment: {response}\", score\n        else:\n            return f\"Could not parse score from response: {response}\", 0.5\n            \n    except Exception as e:\n        return f\"Error in appropriateness analysis: {str(e)}\", 0.5\n"
        }
      },
      {
        "name": "Emojis Appropriately Positioned",
        "description": "Uses visual analysis to verify that emojis are positioned next to social class types rather than randomly placed",
        "is_critical": true,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score() -> tuple[str, float]:\n    import re\n    # Find slide 8 screenshot\n    slide_8_screenshot = None\n    for screenshot in modified_ppt_screenshots:\n        if screenshot.slide_number == 8:\n            slide_8_screenshot = screenshot\n            break\n    \n    if not slide_8_screenshot:\n        return \"No screenshot available for slide 8\", 0.0\n    \n    prompt = \"\"\"\n    Please analyze this PowerPoint slide that should contain social class types with emojis added next to them.\n    \n    Look for:\n    1. Text mentioning different social classes (upper class, middle class, lower class, working class, etc.)\n    2. Emoji icons positioned next to or near these social class terms\n    3. Whether the emojis appear to be intentionally placed next to the class types (not randomly scattered)\n    \n    Rate the positioning appropriateness:\n    - 1.0: Emojis are clearly positioned next to social class terms\n    - 0.7: Emojis are present and somewhat near social class terms but positioning could be better\n    - 0.3: Emojis are present but poorly positioned relative to social class terms\n    - 0.0: No emojis found or emojis are completely unrelated to social class content\n    \n    Respond with just the score (0.0, 0.3, 0.7, or 1.0) followed by a brief explanation.\n    \"\"\"\n    \n    try:\n        response = vlm_call(prompt, [slide_8_screenshot.image_path], temperature=0.1)\n        \n        # Extract score from response\n        score_match = re.search(r'(0\\.0|0\\.3|0\\.7|1\\.0)', response)\n        if score_match:\n            score = float(score_match.group(1))\n            return f\"VLM assessment: {response}\", score\n        else:\n            return f\"Could not parse score from VLM response: {response}\", 0.0\n            \n    except Exception as e:\n        return f\"Error in visual analysis: {str(e)}\", 0.0\n"
        }
      },
      {
        "name": "No Unintended Changes",
        "description": "Ensures that only slide 8 was modified and no other slides or presentation elements were unintentionally changed",
        "is_critical": false,
        "metadata": {},
        "children": [
          {
            "name": "Other Slides Unchanged",
            "description": "Verifies that slides other than slide 8 remain unchanged",
            "is_critical": false,
            "metadata": {},
            "scorer": {
              "type": "function",
              "function_code": "def compute_score() -> tuple[str, float]:\n    from pptx import Presentation\n    \n    try:\n        original_ppt = Presentation(original_ppt_path)\n        modified_ppt = Presentation(modified_ppt_path)\n        \n        # Check if number of slides changed\n        if len(original_ppt.slides) != len(modified_ppt.slides):\n            return f\"Number of slides changed from {len(original_ppt.slides)} to {len(modified_ppt.slides)}\", 0.0\n        \n        changes_found = []\n        \n        # Check each slide except slide 8 (index 7)\n        for i, (orig_slide, mod_slide) in enumerate(zip(original_ppt.slides, modified_ppt.slides)):\n            if i == 7:  # Skip slide 8\n                continue\n                \n            # Compare text content\n            orig_text = \"\"\n            mod_text = \"\"\n            \n            for shape in orig_slide.shapes:\n                if hasattr(shape, \"text\"):\n                    orig_text += shape.text\n            \n            for shape in mod_slide.shapes:\n                if hasattr(shape, \"text\"):\n                    mod_text += shape.text\n            \n            if orig_text != mod_text:\n                changes_found.append(f\"Slide {i+1} text changed\")\n        \n        # Check for animation/transition changes on other slides\n        other_slide_animations = [anim for anim in ppt_diff.added_animations + [old for old, new in ppt_diff.modified_animations] + ppt_diff.removed_animations if anim.slide_id != \"slide_8\"]\n        other_slide_transitions = [trans for trans in ppt_diff.added_transitions + [old for old, new in ppt_diff.modified_transitions] + ppt_diff.removed_transitions if trans.slide_id != \"slide_8\"]\n        \n        if other_slide_animations:\n            changes_found.append(f\"Animations changed on other slides: {len(other_slide_animations)} changes\")\n        \n        if other_slide_transitions:\n            changes_found.append(f\"Transitions changed on other slides: {len(other_slide_transitions)} changes\")\n        \n        if changes_found:\n            return f\"Unintended changes detected: {'; '.join(changes_found)}\", 0.3\n        \n        return \"No unintended changes detected on other slides\", 1.0\n        \n    except Exception as e:\n        return f\"Error checking for unintended changes: {str(e)}\", 0.5\n"
            }
          },
          {
            "name": "Slide 8 Content Preserved",
            "description": "Ensures that the original content of slide 8 is preserved and only emojis were added",
            "is_critical": false,
            "metadata": {},
            "scorer": {
              "type": "function",
              "function_code": "def compute_score() -> tuple[str, float]:\n    # Use VLM to check if only the border color changed\n    original_slide_8 = None\n    modified_slide_8 = None\n    \n    for screenshot in original_ppt_screenshots:\n        if screenshot.slide_number == 8:\n            original_slide_8 = screenshot.image_path\n            break\n    \n    for screenshot in modified_ppt_screenshots:\n        if screenshot.slide_number == 8:\n            modified_slide_8 = screenshot.image_path\n            break\n    \n    if not original_slide_8 or not modified_slide_8:\n        return \"Could not find slide 8 screenshots for comparison\", 0.0\n    \n    prompt = \"\"\"Compare these two PowerPoint slides carefully. The intended change was to add emojis to the slide.\n    \n    Analyze if there are any unintended changes:\n    1. Has anything other than the emojis changed?\n    \n    Respond with:\n    - 'MINIMAL_CHANGE' if only the emojis were added as intended\n    - 'EXCESSIVE_CHANGE' followed by a description if other unintended modifications were made\n    - 'NO_CHANGE' if no changes are visible\"\"\"\n    \n    try:\n        response = vlm_call(prompt, [original_slide_8, modified_slide_8], temperature=0.3)\n        \n        response_upper = response.strip()\n        if response_upper.startswith('MINIMAL_CHANGE'):\n            return \"Only the intended emojis were added\", 1.0\n        elif response_upper.startswith('NO_CHANGE'):\n            return \"No changes detected on slide 8\", 0.0\n        else:\n            return f\"Excessive changes detected: {response}\", 0.3\n    except Exception as e:\n        return f\"Error analyzing slide changes: {str(e)}\", 0.0\n"
            }
          }
        ]
      }
    ]
  },
  "metadata": {
    "task": "Add appropriate emojis icons next to each social class type on slide 8"
  }
}