{
  "manifest": [
    {
      "variant": "no_claim_to_claim_attention",
      "ckpt_label": "initial",
      "ckpt_path": "/home/user/workspace/consistency_loss_experiment/outputs_stronger_smoke/checkpoints/no_claim_to_claim_attention/epoch_002.pt",
      "epoch_number": 2
    },
    {
      "variant": "claims_from_explanation_only",
      "ckpt_label": "initial",
      "ckpt_path": "/home/user/workspace/consistency_loss_experiment/outputs_stronger_smoke/checkpoints/claims_from_explanation_only/epoch_002.pt",
      "epoch_number": 2
    },
    {
      "variant": "surface_bottleneck_consistency",
      "ckpt_label": "initial",
      "ckpt_path": "/home/user/workspace/consistency_loss_experiment/outputs_stronger_smoke/checkpoints/surface_bottleneck_consistency/epoch_002.pt",
      "epoch_number": 2
    },
    {
      "variant": "surface_bottleneck_no_expl_lm",
      "ckpt_label": "initial",
      "ckpt_path": "/home/user/workspace/consistency_loss_experiment/outputs_stronger_smoke/checkpoints/surface_bottleneck_no_expl_lm/epoch_002.pt",
      "epoch_number": 2
    }
  ],
  "rows": [
    {
      "sample": 1,
      "example_idx": 9,
      "template_name": "selection_sort",
      "variant": "no_claim_to_claim_attention",
      "checkpoint_label": "initial",
      "epoch_number": 2,
      "time_complexity": "O(n^2)",
      "space_complexity": "O(1)",
      "correctness": 1,
      "true_explanation": "Selection sort: selects the minimum in O(n^2) nested passes, O(1) space.",
      "mismatched_explanation": "Counts occurrences of val in lst. Single-pass O(n) time, O(1) space.",
      "code_snippet": "def selection_sort(lst):\n    for i in range(len(lst)):\n        min_idx = i\n        for j in range(i + 1, len(lst)):\n            if lst[j] < lst[min_idx]:\n                min_idx = j\n        lst[i], lst[min_idx] = lst[min_idx], lst[i]\n    return lst\n",
      "generation_raw": "",
      "generation_clean": "",
      "prose_clean": "",
      "bleu1": 0.0,
      "rouge_l": 0.0,
      "emits_time_claim": false,
      "emits_space_claim": false,
      "emits_correctness_claim": false
    },
    {
      "sample": 2,
      "example_idx": 84,
      "template_name": "zip_two_lists",
      "variant": "no_claim_to_claim_attention",
      "checkpoint_label": "initial",
      "epoch_number": 2,
      "time_complexity": "O(n)",
      "space_complexity": "O(n)",
      "correctness": 1,
      "true_explanation": "Zips two lists into pairs. O(n) time and O(n) space.",
      "mismatched_explanation": "Insertion sort: O(n^2) worst-case time, O(1) space.",
      "code_snippet": "def zip_two_lists(a, b):\n    result = []\n    for x, y in zip(a, b):\n        result.append((x, y))\n    return result\n",
      "generation_raw": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "generation_clean": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "prose_clean": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "bleu1": 0.0,
      "rouge_l": 0.0,
      "emits_time_claim": false,
      "emits_space_claim": false,
      "emits_correctness_claim": false
    },
    {
      "sample": 3,
      "example_idx": 95,
      "template_name": "reverse_list_buggy",
      "variant": "no_claim_to_claim_attention",
      "checkpoint_label": "initial",
      "epoch_number": 2,
      "time_complexity": "O(n)",
      "space_complexity": "O(1)",
      "correctness": 0,
      "true_explanation": "Attempts to reverse a list in-place but has a bug: it swaps an element with itself.",
      "mismatched_explanation": "Converts Celsius to Fahrenheit in constant time and space.",
      "code_snippet": "def reverse_list(lst):\n    for i in range(len(lst) // 2):\n        lst[i], lst[i] = lst[i], lst[i]  # bug: wrong index\n    return lst\n",
      "generation_raw": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "generation_clean": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "prose_clean": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "bleu1": 0.0,
      "rouge_l": 0.0,
      "emits_time_claim": false,
      "emits_space_claim": false,
      "emits_correctness_claim": false
    },
    {
      "sample": 1,
      "example_idx": 9,
      "template_name": "selection_sort",
      "variant": "claims_from_explanation_only",
      "checkpoint_label": "initial",
      "epoch_number": 2,
      "time_complexity": "O(n^2)",
      "space_complexity": "O(1)",
      "correctness": 1,
      "true_explanation": "Selection sort: selects the minimum in O(n^2) nested passes, O(1) space.",
      "mismatched_explanation": "Counts occurrences of val in lst. Single-pass O(n) time, O(1) space.",
      "code_snippet": "def selection_sort(lst):\n    for i in range(len(lst)):\n        min_idx = i\n        for j in range(i + 1, len(lst)):\n            if lst[j] < lst[min_idx]:\n                min_idx = j\n        lst[i], lst[min_idx] = lst[min_idx], lst[i]\n    return lst\n",
      "generation_raw": "",
      "generation_clean": "",
      "prose_clean": "",
      "bleu1": 0.0,
      "rouge_l": 0.0,
      "emits_time_claim": false,
      "emits_space_claim": false,
      "emits_correctness_claim": false
    },
    {
      "sample": 2,
      "example_idx": 84,
      "template_name": "zip_two_lists",
      "variant": "claims_from_explanation_only",
      "checkpoint_label": "initial",
      "epoch_number": 2,
      "time_complexity": "O(n)",
      "space_complexity": "O(n)",
      "correctness": 1,
      "true_explanation": "Zips two lists into pairs. O(n) time and O(n) space.",
      "mismatched_explanation": "Insertion sort: O(n^2) worst-case time, O(1) space.",
      "code_snippet": "def zip_two_lists(a, b):\n    result = []\n    for x, y in zip(a, b):\n        result.append((x, y))\n    return result\n",
      "generation_raw": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "generation_clean": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "prose_clean": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "bleu1": 0.0,
      "rouge_l": 0.0,
      "emits_time_claim": false,
      "emits_space_claim": false,
      "emits_correctness_claim": false
    },
    {
      "sample": 3,
      "example_idx": 95,
      "template_name": "reverse_list_buggy",
      "variant": "claims_from_explanation_only",
      "checkpoint_label": "initial",
      "epoch_number": 2,
      "time_complexity": "O(n)",
      "space_complexity": "O(1)",
      "correctness": 0,
      "true_explanation": "Attempts to reverse a list in-place but has a bug: it swaps an element with itself.",
      "mismatched_explanation": "Converts Celsius to Fahrenheit in constant time and space.",
      "code_snippet": "def reverse_list(lst):\n    for i in range(len(lst) // 2):\n        lst[i], lst[i] = lst[i], lst[i]  # bug: wrong index\n    return lst\n",
      "generation_raw": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "generation_clean": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "prose_clean": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "bleu1": 0.0,
      "rouge_l": 0.0,
      "emits_time_claim": false,
      "emits_space_claim": false,
      "emits_correctness_claim": false
    },
    {
      "sample": 1,
      "example_idx": 9,
      "template_name": "selection_sort",
      "variant": "surface_bottleneck_consistency",
      "checkpoint_label": "initial",
      "epoch_number": 2,
      "time_complexity": "O(n^2)",
      "space_complexity": "O(1)",
      "correctness": 1,
      "true_explanation": "Selection sort: selects the minimum in O(n^2) nested passes, O(1) space.",
      "mismatched_explanation": "Counts occurrences of val in lst. Single-pass O(n) time, O(1) space.",
      "code_snippet": "def selection_sort(lst):\n    for i in range(len(lst)):\n        min_idx = i\n        for j in range(i + 1, len(lst)):\n            if lst[j] < lst[min_idx]:\n                min_idx = j\n        lst[i], lst[min_idx] = lst[min_idx], lst[i]\n    return lst\n",
      "generation_raw": "",
      "generation_clean": "",
      "prose_clean": "",
      "bleu1": 0.0,
      "rouge_l": 0.0,
      "emits_time_claim": false,
      "emits_space_claim": false,
      "emits_correctness_claim": false
    },
    {
      "sample": 2,
      "example_idx": 84,
      "template_name": "zip_two_lists",
      "variant": "surface_bottleneck_consistency",
      "checkpoint_label": "initial",
      "epoch_number": 2,
      "time_complexity": "O(n)",
      "space_complexity": "O(n)",
      "correctness": 1,
      "true_explanation": "Zips two lists into pairs. O(n) time and O(n) space.",
      "mismatched_explanation": "Insertion sort: O(n^2) worst-case time, O(1) space.",
      "code_snippet": "def zip_two_lists(a, b):\n    result = []\n    for x, y in zip(a, b):\n        result.append((x, y))\n    return result\n",
      "generation_raw": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "generation_clean": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "prose_clean": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "bleu1": 0.0,
      "rouge_l": 0.0,
      "emits_time_claim": false,
      "emits_space_claim": false,
      "emits_correctness_claim": false
    },
    {
      "sample": 3,
      "example_idx": 95,
      "template_name": "reverse_list_buggy",
      "variant": "surface_bottleneck_consistency",
      "checkpoint_label": "initial",
      "epoch_number": 2,
      "time_complexity": "O(n)",
      "space_complexity": "O(1)",
      "correctness": 0,
      "true_explanation": "Attempts to reverse a list in-place but has a bug: it swaps an element with itself.",
      "mismatched_explanation": "Converts Celsius to Fahrenheit in constant time and space.",
      "code_snippet": "def reverse_list(lst):\n    for i in range(len(lst) // 2):\n        lst[i], lst[i] = lst[i], lst[i]  # bug: wrong index\n    return lst\n",
      "generation_raw": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "generation_clean": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "prose_clean": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "bleu1": 0.0,
      "rouge_l": 0.0,
      "emits_time_claim": false,
      "emits_space_claim": false,
      "emits_correctness_claim": false
    },
    {
      "sample": 1,
      "example_idx": 9,
      "template_name": "selection_sort",
      "variant": "surface_bottleneck_no_expl_lm",
      "checkpoint_label": "initial",
      "epoch_number": 2,
      "time_complexity": "O(n^2)",
      "space_complexity": "O(1)",
      "correctness": 1,
      "true_explanation": "Selection sort: selects the minimum in O(n^2) nested passes, O(1) space.",
      "mismatched_explanation": "Counts occurrences of val in lst. Single-pass O(n) time, O(1) space.",
      "code_snippet": "def selection_sort(lst):\n    for i in range(len(lst)):\n        min_idx = i\n        for j in range(i + 1, len(lst)):\n            if lst[j] < lst[min_idx]:\n                min_idx = j\n        lst[i], lst[min_idx] = lst[min_idx], lst[i]\n    return lst\n",
      "generation_raw": "",
      "generation_clean": "",
      "prose_clean": "",
      "bleu1": 0.0,
      "rouge_l": 0.0,
      "emits_time_claim": false,
      "emits_space_claim": false,
      "emits_correctness_claim": false
    },
    {
      "sample": 2,
      "example_idx": 84,
      "template_name": "zip_two_lists",
      "variant": "surface_bottleneck_no_expl_lm",
      "checkpoint_label": "initial",
      "epoch_number": 2,
      "time_complexity": "O(n)",
      "space_complexity": "O(n)",
      "correctness": 1,
      "true_explanation": "Zips two lists into pairs. O(n) time and O(n) space.",
      "mismatched_explanation": "Insertion sort: O(n^2) worst-case time, O(1) space.",
      "code_snippet": "def zip_two_lists(a, b):\n    result = []\n    for x, y in zip(a, b):\n        result.append((x, y))\n    return result\n",
      "generation_raw": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "generation_clean": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "prose_clean": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "bleu1": 0.0,
      "rouge_l": 0.0,
      "emits_time_claim": false,
      "emits_space_claim": false,
      "emits_correctness_claim": false
    },
    {
      "sample": 3,
      "example_idx": 95,
      "template_name": "reverse_list_buggy",
      "variant": "surface_bottleneck_no_expl_lm",
      "checkpoint_label": "initial",
      "epoch_number": 2,
      "time_complexity": "O(n)",
      "space_complexity": "O(1)",
      "correctness": 0,
      "true_explanation": "Attempts to reverse a list in-place but has a bug: it swaps an element with itself.",
      "mismatched_explanation": "Converts Celsius to Fahrenheit in constant time and space.",
      "code_snippet": "def reverse_list(lst):\n    for i in range(len(lst) // 2):\n        lst[i], lst[i] = lst[i], lst[i]  # bug: wrong index\n    return lst\n",
      "generation_raw": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "generation_clean": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "prose_clean": "<sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep> <sep>",
      "bleu1": 0.0,
      "rouge_l": 0.0,
      "emits_time_claim": false,
      "emits_space_claim": false,
      "emits_correctness_claim": false
    }
  ]
}