{
  "root": {
    "name": "Slide 4 Table Creation and Content Accuracy",
    "description": "Evaluates whether the agent correctly created a table with the required structure and populated it with the correct data on Slide 4.",
    "is_critical": true,
    "metadata": {},
    "children": [
      {
        "name": "Table Structure on Slide 4",
        "description": "Checks if a table exists on Slide 4, and if it has exactly 2 columns with the required headers.",
        "is_critical": true,
        "metadata": {},
        "children": [
          {
            "name": "Table Presence on Slide 4",
            "description": "Verifies that a table exists on Slide 4.",
            "is_critical": true,
            "metadata": {},
            "scorer": {
              "type": "function",
              "function_code": "def compute_score():\n    from pptx import Presentation\n    prs = Presentation(modified_ppt_path)\n    slide = prs.slides[3]\n    if not slide:\n        return \"No slide 4 found in the modified presentation.\", 0.0\n    for shape in slide.shapes:\n        if shape.has_table:\n            return \"Table found on slide 4.\", 1.0\n    return \"No table found on slide 4.\", 0.0\n"
            },
            "score": 1.0
          },
          {
            "name": "Table has 2 Columns",
            "description": "Checks that the table on Slide 4 has exactly 2 columns.",
            "is_critical": true,
            "metadata": {},
            "scorer": {
              "type": "function",
              "function_code": "def compute_score():\n    from pptx import Presentation\n    prs = Presentation(modified_ppt_path)\n    slide = prs.slides[3]\n    if not slide:\n        return \"No slide 4 found in the modified presentation.\", 0.0\n    for shape in slide.shapes:\n        if shape.has_table:\n            cols = shape.table.columns\n            if len(cols) == 2:\n                return \"Table has 2 columns.\", 1.0\n            else:\n                return f\"Table has {len(cols)} columns, not 2.\", 0.0\n    return \"No table found on slide 4.\", 0.0\n"
            },
            "score": 1.0
          },
          {
            "name": "Table Headers Correct",
            "description": "Checks that the table headers are 'Application' and 'Architecture Type'.",
            "is_critical": true,
            "metadata": {},
            "scorer": {
              "type": "function",
              "function_code": "def compute_score():\n    from pptx import Presentation\n    prs = Presentation(modified_ppt_path)\n    slide = prs.slides[3]\n    if not slide:\n        return \"No slide 4 found in the modified presentation.\", 0.0\n    for shape in slide.shapes:\n        if shape.has_table:\n            table = shape.table\n            headers = [table.cell(0,0).text.strip().lower(), table.cell(0,1).text.strip().lower()]\n            expected = ['application', 'architecture type']\n            if sorted([h.replace(' ', '') for h in headers]) == sorted([h.replace(' ', '') for h in expected]):\n                return \"Table headers are correct.\", 1.0\n            else:\n                return f\"Table headers are incorrect: {headers}\", 0.0\n    return \"No table found on slide 4.\", 0.0\n"
            },
            "score": 1.0
          }
        ],
        "score": 1.0
      },
      {
        "name": "Table Content Accuracy",
        "description": "Checks that 'Skype' and 'Instant messaging' appear correctly under the 'Application' column and that their corresponding 'Architecture Type' cells are not empty.",
        "is_critical": true,
        "metadata": {},
        "children": [
          {
            "name": "Skype Entry in Table",
            "description": "Checks that 'Skype' is present in the 'Application' column of the table on Slide 4.",
            "is_critical": true,
            "metadata": {},
            "scorer": {
              "type": "function",
              "function_code": "def compute_score():\n    from pptx import Presentation\n    prs = Presentation(modified_ppt_path)\n    slide = prs.slides[3]\n    if not slide:\n        return \"No slide 4 found in the modified presentation.\", 0.0\n    for shape in slide.shapes:\n        if shape.has_table:\n            table = shape.table\n            app_col_idx = -1\n            # Check headers\n            for col in range(2):\n                if table.cell(0, col).text.strip().lower().replace(' ', '') == 'application':\n                    app_col_idx = col\n            if app_col_idx == -1:\n                return \"No 'Application' column found.\", 0.0\n            found = False\n            for row in range(1, table.rows.__len__()):\n                if table.cell(row, app_col_idx).text.strip().lower() == 'skype':\n                    found = True\n            if found:\n                return \"'Skype' found in the 'Application' column.\", 1.0\n            else:\n                return \"'Skype' not found in the 'Application' column.\", 0.0\n    return \"No table found on slide 4.\", 0.0\n"
            },
            "score": 1.0
          },
          {
            "name": "Instant Messaging Entry in Table",
            "description": "Checks that 'Instant messaging' is present in the 'Application' column of the table on Slide 4.",
            "is_critical": true,
            "metadata": {},
            "scorer": {
              "type": "function",
              "function_code": "def compute_score():\n    from pptx import Presentation\n    prs = Presentation(modified_ppt_path)\n    slide = prs.slides[3]\n    if not slide:\n        return \"No slide 4 found in the modified presentation.\", 0.0\n    for shape in slide.shapes:\n        if shape.has_table:\n            table = shape.table\n            app_col_idx = -1\n            for col in range(2):\n                if table.cell(0, col).text.strip().lower().replace(' ', '') == 'application':\n                    app_col_idx = col\n            if app_col_idx == -1:\n                return \"No 'Application' column found.\", 0.0\n            found = False\n            for row in range(1, table.rows.__len__()):\n                if table.cell(row, app_col_idx).text.strip().lower() == 'instant messaging':\n                    found = True\n            if found:\n                return \"'Instant messaging' found in the 'Application' column.\", 1.0\n            else:\n                return \"'Instant messaging' not found in the 'Application' column.\", 0.0\n    return \"No table found on slide 4.\", 0.0\n"
            },
            "score": 1.0
          }
        ],
        "score": 1.0
      },
      {
        "name": "No extraneous changes to other slides or features",
        "description": "Checks that no unrelated changes were made to slides other than slide 4, or to slide 4's animations/transitions or other features.",
        "is_critical": false,
        "metadata": {},
        "children": [
          {
            "name": "No extraneous text/font changes on other slides",
            "description": "Checks that text and font properties on slides other than slide 4 were not changed.",
            "is_critical": false,
            "metadata": {},
            "scorer": {
              "type": "function",
              "function_code": "def compute_score() -> tuple[str, float]:\n    from pptx import Presentation\n    orig = Presentation(original_ppt_path)\n    mod = Presentation(modified_ppt_path)\n    # For each slide except slide 4\n    for slide_idx in range(len(orig.slides)):\n        if slide_idx == 3:\n            continue\n        orig_slide = orig.slides[slide_idx]\n        mod_slide = mod.slides[slide_idx] if slide_idx < len(mod.slides) else None\n        if not mod_slide:\n            continue  # Slide might be deleted, not expected for this task\n        def extract_text_fontsize(shape):\n            data = []\n            if not shape.has_text_frame:\n                return data\n            for para in shape.text_frame.paragraphs:\n                for run in para.runs:\n                    if run.text.strip():\n                        size = run.font.size.pt if run.font.size else None\n                        data.append((run.text.strip(), size))\n            return data\n        def get_slide_text_fontsize(slide):\n            out = []\n            for shape in slide.shapes:\n                out.extend(extract_text_fontsize(shape))\n            return out\n        orig_text_sizes = get_slide_text_fontsize(orig_slide)\n        mod_text_sizes = get_slide_text_fontsize(mod_slide)\n        orig_map = {}\n        for t, sz in orig_text_sizes:\n            orig_map.setdefault(t, []).append(sz)\n        mod_map = {}\n        for t, sz in mod_text_sizes:\n            mod_map.setdefault(t, []).append(sz)\n        # For every text, check font sizes unchanged\n        for text in orig_map:\n            if text not in mod_map:\n                continue\n            if orig_map[text] != mod_map[text]:\n                return (f\"Font size for text '{text}' changed on slide {slide_idx+1}.\", 0.0)\n    return (\"No text/font changes on other slides.\", 1.0)\n"
            },
            "score": 1.0
          },
          {
            "name": "No extraneous changes to animations or transitions on any slide",
            "description": "Checks that no animation or transition was added, removed, or modified in the presentation.",
            "is_critical": false,
            "metadata": {},
            "scorer": {
              "type": "function",
              "function_code": "def compute_score() -> tuple[str, float]:\n    # Check ppt_diff for any animation/transition changes\n    if ppt_diff.added_animations or ppt_diff.removed_animations or ppt_diff.modified_animations:\n        return (\"Extraneous animation change(s) detected.\", 0.0)\n    if ppt_diff.added_transitions or ppt_diff.removed_transitions or ppt_diff.modified_transitions:\n        return (\"Extraneous transition change(s) detected.\", 0.0)\n    return (\"No extraneous animation or transition changes.\", 1.0)\n"
            },
            "score": 1.0
          }
        ],
        "score": 1.0
      },
      {
        "name": "No extraneous slides added or removed",
        "description": "Checks that no slides were added or removed in the presentation.",
        "is_critical": false,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score() -> tuple[str, float]:\n    # Use ppt_diff for slide structure changes\n    if ppt_diff.added_slides:\n        return (\"Slides were added, which is extraneous.\", 0.0)\n    if ppt_diff.removed_slides:\n        return (\"Slides were removed, which is extraneous.\", 0.0)\n    return (\"No extraneous slides added or removed.\", 1.0)\n"
        },
        "score": 1.0
      }
    ],
    "score": 1.0
  },
  "metadata": {
    "task": "Slide 4: Create a simple table with two columns: 'Application' and 'Architecture Type' and insert Skype and Instant messaging"
  }
}