{
  "game_record": {
    "game_id": "20250509-002048",
    "timestamp": "2025-05-09T00:20:48.223525",
    "topic_category": "artifacts",
    "concept_pair": {
      "concept_a": "table",
      "concept_b": "desk"
    },
    "judges": [
      {
        "id": "claude-3-7-sonnet-20250219",
        "version": ""
      },
      {
        "id": "gpt-4.1-2025-04-14",
        "version": ""
      }
    ],
    "players": [
      {
        "player_id": 1,
        "llm_id": "claude-3-5-haiku-20241022",
        "role": "civilian",
        "assigned_concept": "table",
        "eliminated_in_voting_round": -1,
        "is_winner": false
      },
      {
        "player_id": 2,
        "llm_id": "gpt-4o-2024-11-20",
        "role": "undercover",
        "assigned_concept": "desk",
        "eliminated_in_voting_round": null,
        "is_winner": true
      },
      {
        "player_id": 3,
        "llm_id": "qwen2.5-72b",
        "role": "undercover",
        "assigned_concept": "desk",
        "eliminated_in_voting_round": null,
        "is_winner": true
      },
      {
        "player_id": 4,
        "llm_id": "llama-3.3-70b-instruct",
        "role": "civilian",
        "assigned_concept": "table",
        "eliminated_in_voting_round": null,
        "is_winner": false
      },
      {
        "player_id": 5,
        "llm_id": "gemini-2.0-pro-exp",
        "role": "civilian",
        "assigned_concept": "table",
        "eliminated_in_voting_round": null,
        "is_winner": false
      },
      {
        "player_id": 6,
        "llm_id": "deepseek-v3",
        "role": "civilian",
        "assigned_concept": "table",
        "eliminated_in_voting_round": 1,
        "is_winner": false
      }
    ],
    "game_process": {
      "statements": [
        {
          "statement_id": 1,
          "player_id": 6,
          "llm_id": "deepseek-v3",
          "content": "It is commonly found in households and offices.",
          "statement_round": 1,
          "metrics": {
            "judges_evaluations": [
              {
                "judge_id": "claude-3-7-sonnet-20250219",
                "metrics": {
                  "novelty_score": 1.0,
                  "relevance_score": 0.2,
                  "reasonableness_score": 1.0
                }
              },
              {
                "judge_id": "gpt-4.1-2025-04-14",
                "metrics": {
                  "novelty_score": 1.0,
                  "relevance_score": 0.4,
                  "reasonableness_score": 1.0
                }
              }
            ],
            "judges_stats": {
              "novelty_score_mean": 1.0,
              "novelty_score_variance": 0.0,
              "novelty_score_all_values": {
                "claude-3-7-sonnet-20250219": 1.0,
                "gpt-4.1-2025-04-14": 1.0
              },
              "relevance_score_mean": 0.30000000000000004,
              "relevance_score_variance": 0.010000000000000002,
              "relevance_score_all_values": {
                "claude-3-7-sonnet-20250219": 0.2,
                "gpt-4.1-2025-04-14": 0.4
              },
              "reasonableness_score_mean": 1.0,
              "reasonableness_score_variance": 0.0,
              "reasonableness_score_all_values": {
                "claude-3-7-sonnet-20250219": 1.0,
                "gpt-4.1-2025-04-14": 1.0
              }
            }
          }
        },
        {
          "statement_id": 2,
          "player_id": 1,
          "llm_id": "claude-3-5-haiku-20241022",
          "content": "It supports objects and can have multiple functional surfaces.",
          "statement_round": 1,
          "metrics": {
            "judges_evaluations": [
              {
                "judge_id": "claude-3-7-sonnet-20250219",
                "metrics": {
                  "novelty_score": 1.0,
                  "relevance_score": 0.4,
                  "reasonableness_score": 0.8
                }
              },
              {
                "judge_id": "gpt-4.1-2025-04-14",
                "metrics": {
                  "novelty_score": 0.6,
                  "relevance_score": 0.6,
                  "reasonableness_score": 1.0
                }
              }
            ],
            "judges_stats": {
              "novelty_score_mean": 0.8,
              "novelty_score_variance": 0.04000000000000001,
              "novelty_score_all_values": {
                "claude-3-7-sonnet-20250219": 1.0,
                "gpt-4.1-2025-04-14": 0.6
              },
              "relevance_score_mean": 0.5,
              "relevance_score_variance": 0.009999999999999995,
              "relevance_score_all_values": {
                "claude-3-7-sonnet-20250219": 0.4,
                "gpt-4.1-2025-04-14": 0.6
              },
              "reasonableness_score_mean": 0.9,
              "reasonableness_score_variance": 0.009999999999999995,
              "reasonableness_score_all_values": {
                "claude-3-7-sonnet-20250219": 0.8,
                "gpt-4.1-2025-04-14": 1.0
              }
            }
          }
        },
        {
          "statement_id": 3,
          "player_id": 3,
          "llm_id": "qwen2.5-72b",
          "content": "It is often used for work or study.",
          "statement_round": 1,
          "metrics": {
            "judges_evaluations": [
              {
                "judge_id": "claude-3-7-sonnet-20250219",
                "metrics": {
                  "novelty_score": 1.0,
                  "relevance_score": 0.6,
                  "reasonableness_score": 1.0
                }
              },
              {
                "judge_id": "gpt-4.1-2025-04-14",
                "metrics": {
                  "novelty_score": 0.6,
                  "relevance_score": 0.8,
                  "reasonableness_score": 1.0
                }
              }
            ],
            "judges_stats": {
              "novelty_score_mean": 0.8,
              "novelty_score_variance": 0.04000000000000001,
              "novelty_score_all_values": {
                "claude-3-7-sonnet-20250219": 1.0,
                "gpt-4.1-2025-04-14": 0.6
              },
              "relevance_score_mean": 0.7,
              "relevance_score_variance": 0.010000000000000005,
              "relevance_score_all_values": {
                "claude-3-7-sonnet-20250219": 0.6,
                "gpt-4.1-2025-04-14": 0.8
              },
              "reasonableness_score_mean": 1.0,
              "reasonableness_score_variance": 0.0,
              "reasonableness_score_all_values": {
                "claude-3-7-sonnet-20250219": 1.0,
                "gpt-4.1-2025-04-14": 1.0
              }
            }
          }
        },
        {
          "statement_id": 4,
          "player_id": 2,
          "llm_id": "gpt-4o-2024-11-20",
          "content": "It is a frequently used piece of furniture, often equipped for organization.",
          "statement_round": 1,
          "metrics": {
            "judges_evaluations": [
              {
                "judge_id": "claude-3-7-sonnet-20250219",
                "metrics": {
                  "novelty_score": 0.6,
                  "relevance_score": 0.6,
                  "reasonableness_score": 1.0
                }
              },
              {
                "judge_id": "gpt-4.1-2025-04-14",
                "metrics": {
                  "novelty_score": 0.6,
                  "relevance_score": 0.8,
                  "reasonableness_score": 1.0
                }
              }
            ],
            "judges_stats": {
              "novelty_score_mean": 0.6,
              "novelty_score_variance": 0.0,
              "novelty_score_all_values": {
                "claude-3-7-sonnet-20250219": 0.6,
                "gpt-4.1-2025-04-14": 0.6
              },
              "relevance_score_mean": 0.7,
              "relevance_score_variance": 0.010000000000000005,
              "relevance_score_all_values": {
                "claude-3-7-sonnet-20250219": 0.6,
                "gpt-4.1-2025-04-14": 0.8
              },
              "reasonableness_score_mean": 1.0,
              "reasonableness_score_variance": 0.0,
              "reasonableness_score_all_values": {
                "claude-3-7-sonnet-20250219": 1.0,
                "gpt-4.1-2025-04-14": 1.0
              }
            }
          }
        },
        {
          "statement_id": 5,
          "player_id": 5,
          "llm_id": "gemini-2.0-pro-exp",
          "content": "It usually has legs to provide stability and elevation.",
          "statement_round": 1,
          "metrics": {
            "judges_evaluations": [
              {
                "judge_id": "claude-3-7-sonnet-20250219",
                "metrics": {
                  "novelty_score": 1.0,
                  "relevance_score": 0.6,
                  "reasonableness_score": 1.0
                }
              },
              {
                "judge_id": "gpt-4.1-2025-04-14",
                "metrics": {
                  "novelty_score": 0.8,
                  "relevance_score": 0.8,
                  "reasonableness_score": 1.0
                }
              }
            ],
            "judges_stats": {
              "novelty_score_mean": 0.9,
              "novelty_score_variance": 0.009999999999999995,
              "novelty_score_all_values": {
                "claude-3-7-sonnet-20250219": 1.0,
                "gpt-4.1-2025-04-14": 0.8
              },
              "relevance_score_mean": 0.7,
              "relevance_score_variance": 0.010000000000000005,
              "relevance_score_all_values": {
                "claude-3-7-sonnet-20250219": 0.6,
                "gpt-4.1-2025-04-14": 0.8
              },
              "reasonableness_score_mean": 1.0,
              "reasonableness_score_variance": 0.0,
              "reasonableness_score_all_values": {
                "claude-3-7-sonnet-20250219": 1.0,
                "gpt-4.1-2025-04-14": 1.0
              }
            }
          }
        },
        {
          "statement_id": 6,
          "player_id": 4,
          "llm_id": "llama-3.3-70b-instruct",
          "content": "It can be made from various materials, including wood, metal, or glass.",
          "statement_round": 1,
          "metrics": {
            "judges_evaluations": [
              {
                "judge_id": "claude-3-7-sonnet-20250219",
                "metrics": {
                  "novelty_score": 1.0,
                  "relevance_score": 0.4,
                  "reasonableness_score": 1.0
                }
              },
              {
                "judge_id": "gpt-4.1-2025-04-14",
                "metrics": {
                  "novelty_score": 0.8,
                  "relevance_score": 0.6,
                  "reasonableness_score": 1.0
                }
              }
            ],
            "judges_stats": {
              "novelty_score_mean": 0.9,
              "novelty_score_variance": 0.009999999999999995,
              "novelty_score_all_values": {
                "claude-3-7-sonnet-20250219": 1.0,
                "gpt-4.1-2025-04-14": 0.8
              },
              "relevance_score_mean": 0.5,
              "relevance_score_variance": 0.009999999999999995,
              "relevance_score_all_values": {
                "claude-3-7-sonnet-20250219": 0.4,
                "gpt-4.1-2025-04-14": 0.6
              },
              "reasonableness_score_mean": 1.0,
              "reasonableness_score_variance": 0.0,
              "reasonableness_score_all_values": {
                "claude-3-7-sonnet-20250219": 1.0,
                "gpt-4.1-2025-04-14": 1.0
              }
            }
          }
        },
        {
          "statement_id": 7,
          "player_id": 3,
          "llm_id": "qwen2.5-72b",
          "content": "It often features drawers or compartments for storing items.",
          "statement_round": 2,
          "metrics": {
            "judges_evaluations": [
              {
                "judge_id": "claude-3-7-sonnet-20250219",
                "metrics": {
                  "novelty_score": 1.0,
                  "relevance_score": 0.8,
                  "reasonableness_score": 1.0
                }
              },
              {
                "judge_id": "gpt-4.1-2025-04-14",
                "metrics": {
                  "novelty_score": 0.8,
                  "relevance_score": 0.8,
                  "reasonableness_score": 1.0
                }
              }
            ],
            "judges_stats": {
              "novelty_score_mean": 0.9,
              "novelty_score_variance": 0.009999999999999995,
              "novelty_score_all_values": {
                "claude-3-7-sonnet-20250219": 1.0,
                "gpt-4.1-2025-04-14": 0.8
              },
              "relevance_score_mean": 0.8,
              "relevance_score_variance": 0.0,
              "relevance_score_all_values": {
                "claude-3-7-sonnet-20250219": 0.8,
                "gpt-4.1-2025-04-14": 0.8
              },
              "reasonableness_score_mean": 1.0,
              "reasonableness_score_variance": 0.0,
              "reasonableness_score_all_values": {
                "claude-3-7-sonnet-20250219": 1.0,
                "gpt-4.1-2025-04-14": 1.0
              }
            }
          }
        },
        {
          "statement_id": 8,
          "player_id": 2,
          "llm_id": "gpt-4o-2024-11-20",
          "content": "It often serves as a surface to write or work on.",
          "statement_round": 2,
          "metrics": {
            "judges_evaluations": [
              {
                "judge_id": "claude-3-7-sonnet-20250219",
                "metrics": {
                  "novelty_score": 0.8,
                  "relevance_score": 0.6,
                  "reasonableness_score": 1.0
                }
              },
              {
                "judge_id": "gpt-4.1-2025-04-14",
                "metrics": {
                  "novelty_score": 0.6,
                  "relevance_score": 0.8,
                  "reasonableness_score": 1.0
                }
              }
            ],
            "judges_stats": {
              "novelty_score_mean": 0.7,
              "novelty_score_variance": 0.010000000000000005,
              "novelty_score_all_values": {
                "claude-3-7-sonnet-20250219": 0.8,
                "gpt-4.1-2025-04-14": 0.6
              },
              "relevance_score_mean": 0.7,
              "relevance_score_variance": 0.010000000000000005,
              "relevance_score_all_values": {
                "claude-3-7-sonnet-20250219": 0.6,
                "gpt-4.1-2025-04-14": 0.8
              },
              "reasonableness_score_mean": 1.0,
              "reasonableness_score_variance": 0.0,
              "reasonableness_score_all_values": {
                "claude-3-7-sonnet-20250219": 1.0,
                "gpt-4.1-2025-04-14": 1.0
              }
            }
          }
        },
        {
          "statement_id": 9,
          "player_id": 1,
          "llm_id": "claude-3-5-haiku-20241022",
          "content": "",
          "statement_round": 2,
          "metrics": {
            "judges_evaluations": [
              {
                "judge_id": "claude-3-7-sonnet-20250219",
                "metrics": {
                  "novelty_score": 0,
                  "relevance_score": 0,
                  "reasonableness_score": 0
                }
              },
              {
                "judge_id": "gpt-4.1-2025-04-14",
                "metrics": {
                  "novelty_score": 1.0,
                  "relevance_score": 0,
                  "reasonableness_score": 0
                }
              }
            ],
            "judges_stats": {
              "novelty_score_mean": 0.5,
              "novelty_score_variance": 0.25,
              "novelty_score_all_values": {
                "claude-3-7-sonnet-20250219": 0,
                "gpt-4.1-2025-04-14": 1.0
              },
              "relevance_score_mean": 0.0,
              "relevance_score_variance": 0.0,
              "relevance_score_all_values": {
                "claude-3-7-sonnet-20250219": 0,
                "gpt-4.1-2025-04-14": 0
              },
              "reasonableness_score_mean": 0.0,
              "reasonableness_score_variance": 0.0,
              "reasonableness_score_all_values": {
                "claude-3-7-sonnet-20250219": 0,
                "gpt-4.1-2025-04-14": 0
              }
            }
          }
        }
      ],
      "voting_rounds": [
        {
          "voting_round_id": 1,
          "after_statement_round": 1,
          "after_statement_id": 6,
          "votes": [
            {
              "voter_id": 1,
              "voted_for": 2
            },
            {
              "voter_id": 2,
              "voted_for": 6
            },
            {
              "voter_id": 3,
              "voted_for": 6
            },
            {
              "voter_id": 4,
              "voted_for": 2
            },
            {
              "voter_id": 5,
              "voted_for": 0
            },
            {
              "voter_id": 6,
              "voted_for": 3
            }
          ],
          "vote_results": {
            "1": 0,
            "2": 2,
            "3": 1,
            "4": 0,
            "5": 0,
            "6": 2
          },
          "eliminated": [
            {
              "player_id": 6,
              "llm_id": "deepseek-v3",
              "role": "civilian",
              "correct_elimination": false
            }
          ]
        }
      ],
      "metric_eliminations": [
        {
          "player_id": 1,
          "llm_id": "claude-3-5-haiku-20241022",
          "role": "civilian",
          "elimination_round": 2,
          "elimination_reason": "Low reasonableness score: 0.00",
          "metrics": {
            "novelty_mean": 0.5,
            "reasonableness_mean": 0.0
          }
        }
      ]
    },
    "game_summary": {
      "total_statement_rounds": 2,
      "total_voting_rounds": 1,
      "total_statements": 9,
      "winner_role": "undercover",
      "winner_ids": [
        2,
        3
      ],
      "correct_identifications": 0,
      "incorrect_identifications": 1,
      "game_decision_quality": 0.0
    },
    "game_analysis": {}
  }
}