{
  "root": {
    "name": "add_chart_based_on_table_data_on_slide_13",
    "description": "Evaluates whether a chart representing the age distribution from table data was correctly added to slide 13 without extraneous changes.",
    "is_critical": true,
    "metadata": {},
    "children": [
      {
        "name": "chart_presence_on_slide_13",
        "description": "Checks if a new chart was added to slide 13.",
        "is_critical": true,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score():\n    from pptx import Presentation\n    prs = Presentation(modified_ppt_path)\n    slide = None\n    for s in prs.slides:\n        if hasattr(s, 'slide_id') and s.slide_id == '13':\n            slide = s\n            break\n    if not slide:\n        try:\n            slide = list(prs.slides)[12]\n        except IndexError:\n            return 'Slide 13 not found in modified PPT.', 0.0\n    chart_count = 0\n    for shape in slide.shapes:\n        if shape.shape_type == 3:  # CHART\n            chart_count += 1\n    if chart_count == 0:\n        return 'No chart found on slide 13.', 0.0\n    return f'Found {chart_count} chart(s) on slide 13.', 1.0\n"
        }
      },
      {
        "name": "chart_represents_table_data",
        "description": "Checks if the chart visualizes the age distribution from the table data on slide 13.",
        "is_critical": true,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score():\n    def use_vlm_fallback():\n        \"\"\"Use vision-language model to verify chart-table correspondence\"\"\"\n        try:\n            # Get screenshot of slide 13\n            slide_image = modified_ppt_screenshots[12].image_path\n            \n            prompt = \"\"\"\n            Analyze this PowerPoint slide that contains both a table and a chart.\n            \n            Task: Determine if the chart accurately represents the data shown in the table.\n            \n            Please check:\n            1. Do the category labels in the chart match the categories in the table?\n            2. Do the values/proportions in the chart correspond to the numeric data in the table?\n            3. Is the chart type appropriate for representing this table data?\n            \n            Respond with:\n            - \"MATCH\" if the chart accurately represents the table data\n            - \"PARTIAL_MATCH\" if there are minor discrepancies but the chart generally represents the table\n            - \"NO_MATCH\" if the chart does not represent the table data accurately\n            \n            Also provide a brief explanation of your assessment.\n            \"\"\"\n            \n            response = vlm_call(prompt, [slide_image])\n            \n            if \"MATCH\" in response and \"NO_MATCH\" not in response:\n                if \"PARTIAL_MATCH\" in response:\n                    return response, 0.7\n                else:\n                    return response, 1.0\n            elif \"PARTIAL_MATCH\" in response:\n                return response, 0.6\n            else:\n                return response, 0.0\n                \n        except Exception as e:\n            return f\"Error in VLM fallback: {e}\", 0.0\n\n\n    from pptx import Presentation\n    from pptx.enum.shapes import MSO_SHAPE_TYPE\n    import difflib\n    \n    try:\n        prs = Presentation(modified_ppt_path)\n        \n        # Get slide 13 (index 12)\n        if len(prs.slides) < 13:\n            return 'Slide 13 not found in modified PPT.', 0.0\n        \n        slide = prs.slides[12]  # 0-based indexing\n        \n        # Find chart and table on slide 13\n        chart_shape = None\n        table_shape = None\n        \n        for shape in slide.shapes:\n            if shape.shape_type == MSO_SHAPE_TYPE.CHART:\n                chart_shape = shape\n            elif shape.shape_type == MSO_SHAPE_TYPE.TABLE:\n                table_shape = shape\n        \n        if not chart_shape:\n            return 'No chart present on slide 13.', 0.0\n        \n        if not table_shape:\n            return 'No table found on slide 13 to extract data.', 0.0\n        \n        # Extract table data\n        table = table_shape.table\n        table_data = []\n        \n        for row_idx in range(len(table.rows)):\n            row = []\n            for cell in table.rows[row_idx].cells:\n                row.append(cell.text.strip())\n            table_data.append(row)\n        \n        if len(table_data) < 2:\n            return 'Table has insufficient data (less than 2 rows).', 0.0\n        \n        # Extract chart data more robustly\n        try:\n            chart = chart_shape.chart\n            chart_data = None\n            chart_categories = None\n            \n            # Try to get data from chart plots\n            if chart.plots and len(chart.plots) > 0:\n                plot = chart.plots[0]\n                if plot.series and len(plot.series) > 0:\n                    series = plot.series[0]\n                    \n                    # Get values\n                    if hasattr(series, 'values') and series.values:\n                        chart_data = [float(v) if v is not None else 0.0 for v in series.values]\n                    \n                    # Get categories \n                    if hasattr(plot, 'categories') and plot.categories:\n                        chart_categories = [str(c) for c in plot.categories]\n                    elif hasattr(series, 'categories') and series.categories:\n                        chart_categories = [str(c) for c in series.categories]\n            \n            if not chart_data:\n                return use_vlm_fallback()\n                \n        except Exception as e:\n            return use_vlm_fallback()\n        \n        # Parse table data (assume first row is header)\n        headers = table_data[0]\n        data_rows = table_data[1:]\n        \n        # Extract categories and values from table\n        table_categories = []\n        table_values = []\n        \n        for row in data_rows:\n            if len(row) >= 2:\n                category = row[0].strip()\n                try:\n                    # Try to parse the value (could be in different columns)\n                    value = None\n                    for cell in row[1:]:\n                        try:\n                            # Remove any non-numeric characters except decimal point\n                            clean_cell = ''.join(c for c in cell if c.isdigit() or c == '.')\n                            if clean_cell:\n                                value = float(clean_cell)\n                                break\n                        except ValueError:\n                            continue\n                    \n                    if value is not None and category:\n                        table_categories.append(category)\n                        table_values.append(value)\n                        \n                except (ValueError, IndexError):\n                    continue\n        \n        if not table_values or not table_categories:\n            return use_vlm_fallback()\n        \n        \n        # Category matching (fuzzy)\n        matched_categories = 0\n        if chart_categories:\n            for table_cat in table_categories:\n                for chart_cat in chart_categories:\n                    # Check for substring match (case insensitive)\n                    if (table_cat.lower() in chart_cat.lower() or \n                        chart_cat.lower() in table_cat.lower() or\n                        difflib.SequenceMatcher(None, table_cat.lower(), chart_cat.lower()).ratio() > 0.7):\n                        matched_categories += 1\n                        break\n        \n        category_score = matched_categories / max(len(table_categories), 1) if table_categories else 0\n        \n        # Value matching\n        value_score = 0\n        if len(table_values) == len(chart_data):\n            # Check if values match within tolerance\n            total_diff = 0\n            total_magnitude = sum(abs(v) for v in table_values)\n            \n            for tv, cv in zip(table_values, chart_data):\n                total_diff += abs(tv - cv)\n            \n            if total_magnitude > 0:\n                relative_error = total_diff / total_magnitude\n                value_score = max(0, 1 - relative_error)\n            else:\n                value_score = 1 if total_diff == 0 else 0\n        \n        # Overall score (weight categories and values equally)\n        overall_score = 0.5 * category_score + 0.5 * value_score\n        \n        \n        if overall_score > 0.9:\n            return 'Chart data accurately matches table data.', 1.0\n        elif overall_score > 0.7:\n            return 'Chart data closely matches table data.', 0.8\n        elif overall_score > 0.5:\n            return 'Chart partially matches table data.', 0.6\n        else:\n            # If programmatic analysis fails, try VLM as fallback\n            return use_vlm_fallback()\n            \n    except Exception as e:\n        return use_vlm_fallback()\n"
        }
      },
      {
        "name": "no_unrelated_changes",
        "description": "Checks that no unrelated changes were made to other slides or extraneous objects added.",
        "is_critical": false,
        "metadata": {},
        "scorer": {
          "type": "function",
          "function_code": "def compute_score():\n    # Check for added slides\n    if ppt_diff.added_slides:\n        return 'Unrelated slides were added.', 0.0\n    # Check for removed slides\n    if ppt_diff.removed_slides:\n        return 'Slides were removed.', 0.0\n    # Check for changes to slides other than 13\n    unrelated_changes = False\n    for s in ppt_diff.modified_slides:\n        s1, s2 = s\n        if (s1.slide_number != 13):\n            unrelated_changes = True\n            break\n    for anim in ppt_diff.added_animations + ppt_diff.removed_animations:\n        if anim.slide_id != '13':\n            unrelated_changes = True\n            break\n    for trn in ppt_diff.added_transitions + ppt_diff.removed_transitions:\n        if trn.slide_id != '13':\n            unrelated_changes = True\n            break\n    if unrelated_changes:\n        return 'Unrelated changes detected on slides other than 13.', 0.0\n    return 'No unrelated changes outside slide 13.', 1.0\n"
        }
      }
    ]
  },
  "metadata": {
    "task": "Add a chart based on the table data showing age distribution on slide 13"
  }
}