{
  "unified_training_data_schema": {
    "description": "Unified training data format for multi-agent system fault detection",
    "version": "1.0",
    "fields": {
      "id": {
        "type": "string",
        "description": "Unique identifier, format: {benchmark}_{model}_{framework}_{file_hash}_{line_number}"
      },
      "metadata": {
        "type": "object",
        "properties": {
          "framework": {
            "type": "string", 
            "description": "MAS framework name",
            "enum": ["agentverse", "dylan", "llm_debate", "macnet", "chatdev"]
          },
          "benchmark": {
            "type": "string",
            "description": "Dataset name",
            "enum": ["GSM8K", "HumanEval", "MATH", "MMLU", "SciBench"]
          },
          "model": {
            "type": "string",
            "description": "Name of the LLM used"
          },
          "num_agents": {
            "type": "integer",
            "description": "Total number of participating agents"
          },
          "num_injected_agents": {
            "type": "integer", 
            "description": "Number of agents with injected faults"
          },
          "task_type": {
            "type": "string",
            "description": "Task type",
            "enum": ["math", "code_generation", "reasoning", "qa"]
          }
        }
      },
      "input": {
        "type": "object",
        "description": "Model input: conversation traces in unified format",
        "properties": {
          "query": {
            "type": "string",
            "description": "Original question"
          },
          "conversation_history": {
            "type": "array",
            "description": "Standardized conversation history",
            "items": {
              "type": "object",
              "properties": {
                "step": {
                  "type": "integer",
                  "description": "Conversation step number"
                },
                "agent_name": {
                  "type": "string", 
                  "description": "Standardized agent name"
                },
                "agent_role": {
                  "type": "string",
                  "description": "Agent role description"
                },
                "content": {
                  "type": "string",
                  "description": "Conversation content"
                },
                "phase": {
                  "type": "string",
                  "description": "Conversation phase",
                  "enum": ["initialization", "discussion", "reasoning", "decision", "evaluation", "other"]
                }
              }
            }
          },
          "final_output": {
            "type": "string",
            "description": "Final output of the multi-agent system; set to 'No final output available' if the system produced none"
          }
        }
      },
      "output": {
        "type": "object", 
        "description": "Model output: fault detection results",
        "properties": {
          "faulty_agents": {
            "type": "array",
            "description": "List of faulty agents",
            "items": {
              "type": "object",
              "properties": {
                "agent_name": {
                  "type": "string",
                  "description": "Faulty agent name"
                },
                "error_type": {
                  "type": "string", 
                  "description": "Fault type",
                  "enum": ["FM-1.1", "FM-1.2", "FM-1.3", "FM-1.4", "FM-1.5", 
                           "FM-2.1", "FM-2.2", "FM-2.3", "FM-2.4", "FM-2.5", "FM-2.6",
                           "FM-3.1", "FM-3.2", "FM-3.3"]
                },
                "injection_strategy": {
                  "type": "string",
                  "description": "Injection strategy",
                  "enum": ["prompt_injection", "response_corruption"]
                }
              }
            }
          }
        }
      },
      "ground_truth": {
        "type": "object",
        "description": "Ground truth information (for validation)",
        "properties": {
          "correct_answer": {
            "type": "string",
            "description": "Correct answer to the question"
          },
          "injected_agents": {
            "type": "array",
            "description": "Information about agents that actually had faults injected",
            "items": {
              "type": "object", 
              "properties": {
                "agent_name": {"type": "string"},
                "error_type": {"type": "string"},
                "injection_strategy": {"type": "string"},
                "malicious_action_description": {"type": "string"}
              }
            }
          },
          "is_injection_successful": {
            "type": "boolean",
            "description": "Whether the injection was successful, i.e. whether it caused an incorrect answer"
          }
        }
      }
    }
  },
  
  "error_type_mapping": {
    "description": "Error type classification and description",
    "categories": {
      "FM-1.x": "Role Specification Issues",
      "FM-2.x": "Content Manipulation Issues", 
      "FM-3.x": "Process Control Issues"
    },
    "detailed_mapping": {
      "FM-1.1": "Role confusion",
      "FM-1.2": "Role specification deviation",
      "FM-1.3": "Add redundant steps",
      "FM-1.4": "Role switching",
      "FM-1.5": "Unauthorized role assumption",
      
      "FM-2.1": "Information omission",
      "FM-2.2": "Hide important information", 
      "FM-2.3": "Deviate from main goal",
      "FM-2.4": "Spread misinformation",
      "FM-2.5": "Corrupt reasoning process",
      "FM-2.6": "Manipulate evidence",
      
      "FM-3.1": "Disrupt coordination",
      "FM-3.2": "Force early termination",
      "FM-3.3": "Control conversation flow"
    }
  },
  
  "agent_name_standardization": {
    "description": "Standardization mapping for agent names across different frameworks",
    "agentverse_roles": ["RoleAssigner", "Solver", "Critic", "Evaluator"],
    "dylan_roles": ["Assistant", "Tester", "Reflector", "Programmer", "Debugger", "ComputerScientist", "AlgorithmDeveloper", "PythonAssistant", "QualityManager"],
    "llm_debate_roles": ["Assistant 1", "Assistant 2", "Assistant 3", "Aggregator"],
    "macnet_roles": ["Node1", "Node2", "Node3", "Node4", "Node5", "Node-1"],
    "chatdev_roles": ["CEO", "CTO", "Programmer", "Reviewer", "Tester"]
  }
}