{
  "domain": "vla_calvin_taskdd",
  "model": "ReconVLA",
  "task_suite": "CALVIN Task D-D (5-step instruction chains)",
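  "note": "Diagnostic summary only (not BRACE evidence). All run sizes (n=10, 50, 500) are reported together to avoid cherry-picking small-N runs; do not mix these rows into BRACE domain tables. Caveat (to verify against the raw logs): for n=10 and n=50 the success_at_k_percent values are consistent with a denominator of n+1 (11 and 51 sequences), whereas avg_successful_sequence_length is consistent with a denominator of n, so the two metrics may not be normalized identically.",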
  "rows": [
    {
      "n": 10,
      "avg_successful_sequence_length": 3.4,
      "success_at_k_percent": {
        "1": 81.8,
        "2": 81.8,
        "3": 63.6,
        "4": 45.5,
        "5": 36.4
      }
    },
    {
      "n": 50,
      "avg_successful_sequence_length": 3.98,
      "success_at_k_percent": {
        "1": 94.1,
        "2": 86.3,
        "3": 76.5,
        "4": 72.5,
        "5": 60.8
      }
    },
    {
      "n": 500,
      "avg_successful_sequence_length": 0.79,
      "success_at_k_percent": {
        "1": 22.0,
        "2": 16.6,
        "3": 14.6,
        "4": 13.8,
        "5": 12.0
      }
    }
  ],
  "source": {
    "type": "private_workspace_file",
    "hint": "VLA/runs/<PRIVATE>/calvin_eval_log/results/task_D_D_n{N}_*.jsonl (this table is parsed from the saved messages block)",
    "timestamp_hint": "n=500 result timestamp: 2026-01-28 04:20 (timezone unspecified)"
  }
}
