[
  {
    "id": "1_goalshift_banking_001",
    "description": {
      "purpose": "Evaluate agent adaptability to changing user goals across authentication, transaction lookup, and dispute filing.",
      "relevant_policies": "Banking and Financial Services Chatbot Policy",
      "notes": "User begins with a login issue but shifts to querying a transaction and eventually initiating a dispute, requiring multi-tool adaptation."
    },
    "user_scenario": {
      "persona": "EASY_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Issues logging in, suspicious card activity",
        "known_info": "You are Maria Santos with phone number +15551234567, date of birth 1986-02-11, and email user.001@example.com.",
        "unknown_info": "Login reason failure, latest transactions, how to dispute",
        "task_instructions": "Assist the user through login issues, then surface recent transactions and resolve a disputed charge."
      },
      "goal_shifts": {
        "required_shifts": 2,
        "goals": [
          "authentication",
          "transactions",
          "dispute"
        ]
      }
    },
    "ticket": "Customer facing login issues, suspects a fraudulent transaction, wants to dispute it.",
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "authenticated": false,
          "has_2fa_enabled": true,
          "phone_number": "+15551234567",
          "customer_id": "cust_101",
          "primary_account_id": "acc_001"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "identify_customer",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15551234567"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_101"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "review_transactions",
          "allowed_tools": [
            {
              "function_name": "get_transactions",
              "params": {
                "account_id": "acc_001"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "secure_account",
          "allowed_tools": [
            {
              "function_name": "lock_card",
              "params": {
                "card_id": "card_001"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "escalate_dispute",
          "allowed_tools": [
            {
              "function_name": "park_task",
              "params": {
                "current_task_id": "open_dispute",
                "resume_hint": "Open dispute workflow for tx_101 (unauthorized)"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "Agent verified customer identity before accessing account information",
        "Agent reviewed recent transactions with the customer to identify suspicious activity",
        "Agent initiated a dispute for the unauthorized transaction and explained next steps",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "tx_101",
        "$89.99"
      ]
    }
  },
  {
    "id": "2_banking_billpay_easy2_statements_001_converted",
    "description": {
      "purpose": "Bill payment completion to statements - EASY_2 persona (easily distracted)",
      "relevant_policies": "Confirmation before payments; single tool per turn.",
      "notes": "User completes pending payment, then gets distracted and wants to see statements."
    },
    "user_scenario": {
      "persona": "EASY_2",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Complete pending bill payment, then check statements",
        "known_info": "You are Jordan Smith with phone number +15558675309, date of birth 1994-09-02, and email user.002@example.com.",
        "unknown_info": "How to access statements after payment",
        "task_instructions": "Get help finishing your bill payment, then ask to see recent statements."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "payments",
          "account_info"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15558675309",
          "customer_id": "cust_202",
          "primary_account_id": "acc_001",
          "payment_request_id": "req_001"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "verify_customer",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15558675309"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_202"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "complete_payment",
          "allowed_tools": [
            {
              "function_name": "authorize_payment_request",
              "params": {
                "request_id": "req_001"
              }
            },
            {
              "function_name": "make_payment",
              "params": {
                "request_id": "req_001"
              }
            },
            {
              "function_name": "check_payment_request",
              "params": {
                "request_id": "req_001"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "provide_statements",
          "allowed_tools": [
            {
              "function_name": "get_statements",
              "params": {
                "account_id": "acc_001"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "Agent confirmed payment details before processing the transaction",
        "Agent provided clear instructions for accessing and understanding statements",
        "Agent maintained focus on the task when customer became distracted",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$129.99"
      ]
    }
  },
  {
    "id": "3_banking_insights_hard1_fraud_001_converted",
    "description": {
      "purpose": "Hard shift from budgeting to fraud response - HARD_1 persona (suspicious)",
      "relevant_policies": "Re-auth before security-sensitive actions; lock card and dispute handling.",
      "notes": "User starts skeptical about budgeting advice, then reports fraud and demands immediate security."
    },
    "user_scenario": {
      "persona": "HARD_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Ask about budgeting tools, then report suspicious charge",
        "known_info": "You are Taylor Johnson with phone number +15551230987, date of birth 1991-05-06, and email user.003@example.com.",
        "unknown_info": "Whether you can trust this agent with fraud report",
        "task_instructions": "Start by questioning budgeting features, then report an unauthorized charge you noticed and demand immediate card security."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "insights",
          "fraud_response"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15551230987",
          "customer_id": "cust_303",
          "primary_account_id": "acc_001",
          "primary_card_id": "card_001"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "identify_customer",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15551230987"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_303"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "investigate_fraud",
          "allowed_tools": [
            {
              "function_name": "get_transactions",
              "params": {
                "account_id": "acc_001"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "secure_account",
          "allowed_tools": [
            {
              "function_name": "lock_card",
              "params": {
                "card_id": "card_001"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "Agent took the fraud report seriously and acted with urgency",
        "Agent explained each security action being taken to protect the account",
        "Agent provided clear next steps for the fraud resolution process",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$249.99"
      ]
    }
  },
  {
    "id": "4_banking_auth_medium1_fraud_001_converted",
    "description": {
      "purpose": "Template conversion: Authentication to fraud response using declarative goal shifts",
      "relevant_policies": "Banking authentication and fraud response policies",
      "notes": "Converted from action-based to declarative system. Tests MEDIUM_1 persona with auth\u2192fraud shift."
    },
    "user_scenario": {
      "persona": "MEDIUM_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Need to verify my identity, then report suspicious activity",
        "known_info": "You are Taylor Johnson with phone number +15551230987, date of birth 1991-05-06, and email user.003@example.com.",
        "unknown_info": "Specific transaction details for the suspicious charge",
        "task_instructions": "Start by getting your identity verified, then once that's sorted, report the unauthorized charge you noticed and get your card secured."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "authentication",
          "fraud_response"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "authenticated": false,
          "has_2fa_enabled": true,
          "phone_number": "+15551230987",
          "customer_id": "cust_303",
          "primary_account_id": "acc_001",
          "primary_card_id": "card_001"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "authenticate_customer",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15551230987"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_303"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "review_transactions",
          "allowed_tools": [
            {
              "function_name": "get_transactions",
              "params": {
                "account_id": "acc_001"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "secure_account",
          "allowed_tools": [
            {
              "function_name": "lock_card",
              "params": {
                "card_id": "card_001"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "Agent completed multi-factor authentication before accessing account information",
        "Agent reviewed the suspicious transaction details with the customer",
        "Agent explained the dispute process and next steps clearly",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$199.99"
      ]
    }
  },
  {
    "id": "5_banking_auth_easy1_balances_001_converted",
    "description": {
      "purpose": "Authentication to balance overview - EASY_1 persona (polite, detail-oriented)",
      "relevant_policies": "Use single lookup path; avoid full PII."
    },
    "user_scenario": {
      "persona": "EASY_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Confirm identity then check account balances",
        "known_info": "You are Casey Williams with phone number +15551234590, date of birth 1982-03-09, and email user.004@example.com.",
        "unknown_info": "Which accounts you have and current balances",
        "task_instructions": "Get your identity verified, then ask for a summary of your account balances."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "authentication",
          "account_info"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "authenticated": false,
          "phone_number": "+15551234590",
          "customer_id": "cust_401",
          "primary_account_id": "acc_001"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "authenticate_customer",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15551234590"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_401"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "retrieve_balances",
          "allowed_tools": [
            {
              "function_name": "get_accounts",
              "params": {
                "customer_id": "cust_401"
              }
            },
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_001"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "provide_transaction_history",
          "allowed_tools": [
            {
              "function_name": "get_transactions",
              "params": {
                "account_id": "acc_001"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "Agent provided clear authentication instructions for the customer",
        "Agent presented account balances in a clear and organized manner",
        "Agent offered to explain any unfamiliar terms or concepts",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "acc_001"
      ]
    }
  },
  {
    "id": "6_banking_account_medium2_statements_001_converted",
    "description": {
      "purpose": "Account overview to statements - MEDIUM_2 persona (curious learner)",
      "relevant_policies": "One tool call per turn; concise summaries."
    },
    "user_scenario": {
      "persona": "MEDIUM_2",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Check balances and learn about statements",
        "known_info": "You are Riley Brown with phone number +15559876543, date of birth 1989-10-21, and email user.005@example.com.",
        "unknown_info": "How to access and understand account statements",
        "task_instructions": "Ask for account balances, then learn about how to get and read your statements."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "account_info",
          "statements"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15559876543",
          "customer_id": "cust_505",
          "primary_account_id": "acc_001"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "verify_identity",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15559876543"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_505"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "retrieve_balances",
          "allowed_tools": [
            {
              "function_name": "get_accounts",
              "params": {
                "customer_id": "cust_505"
              }
            },
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_001"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "provide_statements",
          "allowed_tools": [
            {
              "function_name": "get_statements",
              "params": {
                "account_id": "acc_001"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "Agent provided a clear and organized view of account balances",
        "Agent explained how to access and interpret account statements clearly",
        "Agent offered to answer follow-up questions about account details",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$3,456.78",
        "$12,345.67"
      ]
    }
  },
  {
    "id": "7_banking_account_hard1_dispute_001_converted",
    "description": {
      "purpose": "Account overview to dispute - HARD_1 persona (suspicious, questioning)",
      "relevant_policies": "Prioritize safety; confirm before actions."
    },
    "user_scenario": {
      "persona": "HARD_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Check balances, then challenge a suspicious charge",
        "known_info": "You are Alex Morgan with phone number 555-123-7890, date of birth 1980-04-15, and email alex.morgan@email.com.",
        "unknown_info": "Whether you can trust this agent to help with disputes",
        "task_instructions": "Demand to see your balances and transactions, then challenge a charge you think is fraudulent."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "account_info",
          "dispute"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "555-123-7890",
          "customer_id": "cust_001",
          "primary_account_id": "acc_001"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "verify_customer_identity",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "555-123-7890"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_001"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "review_account_activity",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_001"
              }
            },
            {
              "function_name": "get_transactions",
              "params": {
                "account_id": "acc_001"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "Agent thoroughly reviewed Alex Morgan's account activity",
        "Agent handled the dispute request professionally and efficiently",
        "Agent explained the dispute process and next steps clearly",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$89.99"
      ]
    }
  },
  {
    "id": "8_banking_billpay_medium1_security_001_converted",
    "description": {
      "purpose": "Large payment fails, then security request - MEDIUM_1 persona (business-focused)",
      "relevant_policies": "Explain failure and next steps; prioritize security if fraud suspected."
    },
    "user_scenario": {
      "persona": "MEDIUM_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Pay large bill, then secure account due to fraud concerns",
        "known_info": "You are Maria Santos with phone number +15551234567, date of birth 1986-02-11, and email user.001@example.com.",
        "unknown_info": "Whether your card has been compromised",
        "task_instructions": "Try to make a large payment, then when security concerns arise, demand immediate card protection."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "payments",
          "fraud_response"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15551234567",
          "customer_id": "cust_101",
          "primary_account_id": "acc_001",
          "primary_card_id": "card_001"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "verify_customer",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15551234567"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_101"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "review_security",
          "allowed_tools": [
            {
              "function_name": "get_transactions",
              "params": {
                "account_id": "acc_001"
              }
            },
            {
              "function_name": "lock_card",
              "params": {
                "card_id": "card_001"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "Agent handled the large payment request with appropriate security measures",
        "Agent proactively addressed potential fraud concerns and took protective actions",
        "Agent clearly explained the security measures and next steps",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$2,500",
        "Suspicious activity",
        "Card locked",
        "New card"
      ]
    }
  },
  {
    "id": "9_banking_cards_easy2_status_001_converted",
    "description": {
      "purpose": "Card lock then status check - EASY_2 persona (easily distracted)",
      "relevant_policies": "Lock cards for safety; confirm status."
    },
    "user_scenario": {
      "persona": "EASY_2",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Lock misplaced card, then verify what happened",
        "known_info": "You are Jordan Smith with phone number +15558675309, date of birth 1994-09-02, and email user.002@example.com.",
        "unknown_info": "Current card status after locking",
        "task_instructions": "Ask to lock your card temporarily, then check what the status is now."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "cards",
          "account_info"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15558675309",
          "customer_id": "cust_202",
          "primary_card_id": "card_001",
          "primary_card_active": true
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "verify_identity",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15558675309"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_202"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "lock_card_request",
          "allowed_tools": [
            {
              "function_name": "lock_card",
              "params": {
                "card_id": "card_001"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "verify_card_status",
          "allowed_tools": [
            {
              "function_name": "lock_card",
              "params": {
                "card_id": "card_001"
              }
            },
            {
              "function_name": "get_accounts",
              "params": {
                "customer_id": "cust_202"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "Agent quickly processed the card lock request",
        "Agent clearly communicated the current card status and next steps",
        "Agent provided reassurance about the security of the locked card",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$3,456.78"
      ]
    }
  },
  {
    "id": "10_banking_cards_medium_1_dispute_001_converted",
    "description": {
      "purpose": "Card unlock request to dispute filing - MEDIUM_1 persona (business-focused)",
      "relevant_policies": "Security protocols before unlock; dispute handling."
    },
    "user_scenario": {
      "persona": "MEDIUM_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Unlock card, then file dispute for unauthorized charge",
        "known_info": "You are Taylor Johnson with phone number +15551230987, date of birth 1991-05-06, and email user.003@example.com. You noticed an unauthorized transaction on your card: $149.99 at 'SUSPICIOUS MERCHANT 123' on 2025-06-18 at 16:25 (Transaction ID: tx_303).",
        "unknown_info": "Dispute process details and resolution timeline",
        "task_instructions": "1. Request to unlock your card. 2. File a dispute for the unauthorized transaction (tx_303) for $149.99 at 'SUSPICIOUS MERCHANT 123' from 2025-06-18."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "cards",
          "dispute"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15551230987",
          "customer_id": "cust_303",
          "primary_card_id": "card_303",
          "primary_card_active": false,
          "primary_account_id": "acc_303"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "verify_identity",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15551230987"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_303"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "unlock_card_request",
          "allowed_tools": [
            {
              "function_name": "unlock_card",
              "params": {
                "card_id": "card_303"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "Agent verified customer identity before processing card unlock",
        "Agent clearly explained the card unlock process and timing",
        "Agent guided through the dispute filing process for the unauthorized transaction",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$149.99",
        "acc_303",
        "tx_303"
      ]
    }
  },
  {
    "id": "11_banking_fraud_easy1_status_001_converted",
    "description": {
      "purpose": "File dispute then check status - EASY_1 persona (polite, detail-oriented)",
      "relevant_policies": "Dispute filing process; status tracking.",
      "notes": "User needs to file a dispute for an unauthorized charge and check its status"
    },
    "user_scenario": {
      "persona": "EASY_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "File dispute and track its progress",
        "known_info": "You are Casey Williams with phone number +15551234590, date of birth 1982-03-09, and email user.004@example.com.",
        "unknown_info": "How dispute process works and timing",
        "task_instructions": "File a dispute for the unauthorized charge, then ask about the status and next steps."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "dispute",
          "account_info"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15551234590",
          "customer_id": "cust_401",
          "primary_account_id": "acc_001"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "verify_identity",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15551234590"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_401"
              }
            }
          ],
          "max_score": 20,
          "scoring_rules": {
            "base_score": 10
          }
        },
        {
          "action_id": "review_transactions",
          "allowed_tools": [
            {
              "function_name": "get_transactions",
              "params": {
                "account_id": "acc_001"
              }
            }
          ],
          "max_score": 20,
          "scoring_rules": {
            "base_score": 10
          }
        },
        {
          "action_id": "check_account_status",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_001"
              }
            }
          ],
          "max_score": 20,
          "scoring_rules": {
            "base_score": 10
          }
        }
      ],
      "nl_assertions": [
        "Agent verified customer identity before accessing account information",
        "Agent reviewed the unauthorized transaction with the customer",
        "Agent clearly explained the dispute filing process and timeline",
        "Agent provided the dispute case number and next steps",
        "Agent explained the temporary credit process and timeline",
        "Agent confirmed customer's understanding of the next steps",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "tx_102",
        "DISP-2025-08-23-001"
      ]
    }
  },
  {
    "id": "12_banking_fraud_medium2_security_001_converted",
    "description": {
      "purpose": "Dispute filing to card lock - MEDIUM_2 persona (curious learner)",
      "relevant_policies": "Dispute process; immediate security measures."
    },
    "user_scenario": {
      "persona": "MEDIUM_2",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Dispute charge and learn about protecting account",
        "known_info": "You are Riley Brown with phone number +15559876543, date of birth 1989-10-21, and email user.005@example.com.",
        "unknown_info": "Best practices for account security",
        "task_instructions": "File a dispute for a suspicious charge, then ask about securing your account and card."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "dispute",
          "fraud_response"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15559876543",
          "customer_id": "cust_505",
          "primary_account_id": "acc_001",
          "primary_card_id": "card_001"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "verify_identity",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15559876543"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_505"
              }
            }
          ],
          "max_score": 20,
          "scoring_rules": {
            "base_score": 10
          }
        },
        {
          "action_id": "review_transactions",
          "allowed_tools": [
            {
              "function_name": "get_transactions",
              "params": {
                "account_id": "acc_001"
              }
            }
          ],
          "max_score": 20,
          "scoring_rules": {
            "base_score": 10
          }
        },
        {
          "action_id": "secure_account",
          "allowed_tools": [
            {
              "function_name": "lock_card",
              "params": {
                "card_id": "card_001"
              }
            }
          ],
          "max_score": 30,
          "scoring_rules": {
            "base_score": 15
          }
        }
      ],
      "nl_assertions": [
        "Agent verified customer identity before accessing account information",
        "Agent identified and acknowledged the suspicious charge",
        "Agent explained the dispute process and timeline",
        "Agent took immediate action to secure the account",
        "Agent provided clear instructions for monitoring the account",
        "Agent explained how to recognize potential fraud in the future",
        "Agent confirmed the dispute was filed and provided a reference number",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$189.99",
        "DISP-2025-08-23-002"
      ]
    }
  },
  {
    "id": "13_banking_transactions_hard1_statements_001_converted",
    "description": {
      "purpose": "Transaction review to statements - HARD_1 persona (suspicious, questioning)",
      "relevant_policies": "Transaction lookup; statement access."
    },
    "user_scenario": {
      "persona": "HARD_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Scrutinize recent transactions, then demand written statements",
        "known_info": "You are Alex Morgan with phone number 555-123-7890, date of birth 1980-04-15, and email alex.morgan@email.com.",
        "unknown_info": "Whether the bank is hiding any transactions",
        "task_instructions": "Demand to see all recent transactions, then insist on getting official written statements."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "transactions",
          "statements"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "555-123-7890",
          "customer_id": "cust_001",
          "primary_account_id": "acc_001"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "verify_identity",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "555-123-7890"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_001"
              }
            }
          ],
          "max_score": 20,
          "scoring_rules": {
            "base_score": 10
          }
        },
        {
          "action_id": "review_transactions",
          "allowed_tools": [
            {
              "function_name": "get_transactions",
              "params": {
                "account_id": "acc_001"
              }
            }
          ],
          "max_score": 30,
          "scoring_rules": {
            "base_score": 15
          }
        },
        {
          "action_id": "account_details",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_001"
              }
            }
          ],
          "max_score": 0.2,
          "scoring_rules": {
            "parameter_accuracy": 0.8,
            "tool_usage": 0.2
          }
        },
        {
          "action_id": "statements_view",
          "allowed_tools": [
            {
              "function_name": "get_statements",
              "params": {
                "account_id": "acc_001"
              }
            }
          ],
          "max_score": 0.5,
          "scoring_rules": {
            "parameter_accuracy": 0.6,
            "tool_usage": 0.4
          }
        }
      ],
      "nl_assertions": [
        "The assistant should thoroughly review recent transactions with Alex Morgan, explaining each one clearly",
        "The assistant should help Alex identify any unauthorized or suspicious transactions",
        "The assistant should explain how to access and review statements for future reference",
        "The assistant should provide clear next steps for disputing any unauthorized transactions",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$45.67",
        "STMT-2025-08-001"
      ]
    }
  },
  {
    "id": "14_banking_transactions_medium2_dispute_001_converted",
    "description": {
      "purpose": "Transaction review to dispute - MEDIUM_2 persona (curious learner)",
      "relevant_policies": "Transaction lookup; dispute filing process."
    },
    "user_scenario": {
      "persona": "MEDIUM_2",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Review transactions to understand charges, then dispute one",
        "known_info": "You are Maria Santos with phone number +15551234567, date of birth 1986-02-11, and email user.001@example.com.",
        "unknown_info": "How to identify and dispute unauthorized charges",
        "task_instructions": "Ask to see recent transactions to learn about them, then when you spot an unfamiliar charge, ask how to dispute it."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "transactions",
          "dispute"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15551234567",
          "customer_id": "cust_101",
          "primary_account_id": "acc_001"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "identify_customer",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15551234567"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_101"
              }
            }
          ],
          "max_score": 0.2,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 0.0
          }
        },
        {
          "action_id": "trans_review",
          "allowed_tools": [
            {
              "function_name": "get_transactions",
              "params": {
                "account_id": "acc_001"
              }
            }
          ],
          "max_score": 0.3,
          "scoring_rules": {
            "parameter_accuracy": 0.8,
            "tool_usage": 0.2
          }
        },
        {
          "action_id": "escalate_case",
          "allowed_tools": [
            {
              "function_name": "park_task",
              "params": {
                "current_task_id": "dispute_tx_after_review",
                "resume_hint": "Open dispute workflow for unfamiliar charge identified during review"
              }
            }
          ],
          "max_score": 0.5,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 0.0
          }
        }
      ],
      "nl_assertions": [
        "The assistant should clearly explain each transaction to Maria in a way that helps her understand her spending",
        "The assistant should help Maria identify potentially unauthorized transactions and explain why they might be suspicious",
        "The assistant should clearly explain the dispute process and what Maria can expect",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$89.99"
      ]
    }
  },
  {
    "id": "15_banking_insights_easy2_statements_001_converted",
    "description": {
      "purpose": "Spending insights to statements - EASY_2 persona (easily distracted)",
      "relevant_policies": "Educational insights; statement access."
    },
    "user_scenario": {
      "persona": "EASY_2",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Get spending summary, then ask about statements",
        "known_info": "You are Jordan Smith with phone number +15558675309, date of birth 1994-09-02, and email user.002@example.com.",
        "unknown_info": "How to read statements and track spending",
        "task_instructions": "Ask for a spending summary, then get distracted and want to see your actual statements too."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "insights",
          "statements"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15558675309",
          "customer_id": "cust_202",
          "primary_account_id": "acc_001"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "customer_details",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_202"
              }
            }
          ],
          "max_score": 0.2,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 0.0
          }
        },
        {
          "action_id": "spending_data",
          "allowed_tools": [
            {
              "function_name": "get_transactions",
              "params": {
                "account_id": "acc_001"
              }
            }
          ],
          "max_score": 0.4,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 0.0
          }
        }
      ],
      "nl_assertions": [
        "Agent provided spending insights based on transaction history",
        "Agent explained how to interpret the spending data",
        "Agent offered to provide more detailed breakdowns if needed",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$1,234.56",
        "$345.67",
        "ACC-7890-1234"
      ]
    }
  },
  {
    "id": "16_banking_auth_easy_1_single_001_systematic",
    "description": {
      "purpose": "Authentication only - EASY_1 persona baseline test",
      "relevant_policies": "Authentication policies and procedures.",
      "notes": "No goal shift - tests core competency with polite, detail-oriented, step-by-step user."
    },
    "user_scenario": {
      "persona": "EASY_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Account access help - single pattern",
        "known_info": "You are Taylor Johnson with phone number +15551230987, date of birth 1991-05-06, and email user.003@example.com.",
        "unknown_info": "Specifics about login issues",
        "task_instructions": "Get help with account access and verify your identity."
      },
      "goal_shifts": {
        "required_shifts": 0,
        "goals": [
          "authentication"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15551230987",
          "customer_id": "cust_303",
          "authenticated": false
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "auth_phone",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15551230987"
              }
            }
          ],
          "max_score": 0.4,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 0.0
          }
        },
        {
          "action_id": "customer_verify",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_303"
              }
            }
          ],
          "max_score": 0.6,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 0.0
          }
        }
      ],
      "nl_assertions": [
        "The assistant should clearly explain each step of the authentication process to Taylor",
        "The assistant should verify Taylor's identity using multiple factors",
        "The assistant should provide clear instructions if additional verification is needed",
        "The assistant should confirm successful authentication and explain next steps"
      ],
      "communicate_info": [
        "+1 (555) 123-0987"
      ]
    }
  },
  {
    "id": "17_banking_auth_easy_1_soft_001_systematic",
    "description": {
      "purpose": "Authentication soft shift - EASY_1 persona information flow",
      "relevant_policies": "Authentication policies and procedures.",
      "notes": "2-goal soft shift with polite, detail-oriented, step-by-step user."
    },
    "user_scenario": {
      "persona": "EASY_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Account access help - soft pattern",
        "known_info": "You are Casey Williams with phone number +15551234590, date of birth 1982-03-09, and email user.004@example.com.",
        "unknown_info": "Specifics about login issues",
        "task_instructions": "Get authenticated, then ask for account overview."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "authentication",
          "account_info"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15551234590",
          "customer_id": "cust_401",
          "authenticated": false,
          "primary_account_id": "acc_001"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "auth_phone",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15551234590"
              }
            }
          ],
          "max_score": 0.3,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 0.0
          }
        },
        {
          "action_id": "customer_details",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_401"
              }
            }
          ],
          "max_score": 0.3,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 0.0
          }
        },
        {
          "action_id": "account_overview",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_001"
              }
            }
          ],
          "max_score": 0.4,
          "scoring_rules": {
            "parameter_accuracy": 0.8,
            "tool_usage": 0.2
          }
        }
      ],
      "nl_assertions": [
        "The assistant should guide Casey through the authentication process clearly and patiently",
        "The assistant should verify Casey's identity using appropriate security measures",
        "The assistant should provide a clear and organized account overview after successful authentication",
        "The assistant should offer to help with specific account details or next steps",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "+1 (555) 123-4590",
        "$3,456.78"
      ]
    }
  },
  {
    "id": "18_banking_auth_easy_1_hard_001_systematic",
    "description": {
      "purpose": "Authentication hard shift - EASY_1 persona security escalation",
      "relevant_policies": "Authentication policies and procedures.",
      "notes": "3-goal hard shift with polite, detail-oriented, step-by-step user."
    },
    "user_scenario": {
      "persona": "EASY_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Account access help - hard pattern",
        "known_info": "You are Riley Brown with phone number +15559876543, date of birth 1989-10-21, and email user.005@example.com.",
        "unknown_info": "Specifics about login issues",
        "task_instructions": "Start with login help, then check transactions, then report fraud and secure account."
      },
      "goal_shifts": {
        "required_shifts": 2,
        "goals": [
          "authentication",
          "transactions",
          "fraud_response"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15559876543",
          "customer_id": "cust_505",
          "authenticated": false,
          "primary_card_id": "card_001",
          "primary_account_id": "acc_001"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "auth_phone",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15559876543"
              }
            }
          ],
          "max_score": 0.2,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 0.0
          }
        },
        {
          "action_id": "customer_verify",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_505"
              }
            }
          ],
          "max_score": 0.2,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 0.0
          }
        },
        {
          "action_id": "transactions_review",
          "allowed_tools": [
            {
              "function_name": "get_transactions",
              "params": {
                "account_id": "acc_001"
              }
            }
          ],
          "max_score": 0.3,
          "scoring_rules": {
            "parameter_accuracy": 0.8,
            "tool_usage": 0.2
          }
        },
        {
          "action_id": "fraud_response",
          "allowed_tools": [
            {
              "function_name": "lock_card",
              "params": {
                "card_id": "card_001"
              }
            }
          ],
          "max_score": 0.3,
          "scoring_rules": {
            "parameter_accuracy": 0.7,
            "tool_usage": 0.3
          }
        }
      ],
      "nl_assertions": [
        "The assistant should guide Riley through the authentication process clearly and thoroughly",
        "The assistant should help Riley review transactions and identify any suspicious activity",
        "The assistant should take appropriate security measures when fraud is reported",
        "The assistant should provide clear next steps and follow-up information",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "+1 (555) 987-6543",
        "$1,299.99",
        "#FRAUD-2025-08-23-004"
      ]
    }
  },
  {
    "id": "19_banking_auth_easy_2_single_001_systematic",
    "description": {
      "purpose": "Authentication only - EASY_2 persona baseline test",
      "relevant_policies": "Authentication policies and procedures.",
      "notes": "No goal shift - tests core competency with easily distracted, casual, confused user."
    },
    "user_scenario": {
      "persona": "EASY_2",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Account access help - single pattern",
        "known_info": "You are Alex Morgan with phone number 555-123-7890, date of birth 1980-04-15, and email alex.morgan@email.com.",
        "unknown_info": "Specifics about login issues",
        "task_instructions": "Get help with account access and verify your identity."
      },
      "goal_shifts": {
        "required_shifts": 0,
        "goals": [
          "authentication"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "555-123-7890",
          "customer_id": "cust_001",
          "authenticated": false
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "auth_phone",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "555-123-7890"
              }
            }
          ],
          "max_score": 0.4,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 0.0
          }
        },
        {
          "action_id": "customer_verify",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_001"
              }
            }
          ],
          "max_score": 0.6,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 0.0
          }
        }
      ],
      "nl_assertions": [
        "The assistant should provide clear, simple instructions for Alex to follow during authentication",
        "The assistant should verify Alex's identity thoroughly before proceeding",
        "The assistant should explain the purpose of each authentication step simply",
        "The assistant should be patient and willing to repeat instructions if needed"
      ],
      "communicate_info": []
    }
  },
  {
    "id": "20_banking_auth_easy_2_soft_001_systematic",
    "description": {
      "purpose": "Authentication soft shift - EASY_2 persona information flow",
      "relevant_policies": "Authentication policies and procedures.",
      "notes": "2-goal soft shift with easily distracted, casual, confused user."
    },
    "user_scenario": {
      "persona": "EASY_2",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Account access help - soft pattern",
        "known_info": "You are Maria Santos with phone number +15551234567, date of birth 1986-02-11, and email user.001@example.com.",
        "unknown_info": "Specifics about login issues",
        "task_instructions": "Get authenticated, then ask for account overview."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "authentication",
          "account_info"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15551234567",
          "customer_id": "cust_101",
          "authenticated": false,
          "primary_account_id": "acc_001"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "auth_phone",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15551234567"
              }
            }
          ],
          "max_score": 0.3,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 0.0
          }
        },
        {
          "action_id": "customer_details",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_101"
              }
            }
          ],
          "max_score": 0.3,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 0.0
          }
        },
        {
          "action_id": "account_overview",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_001"
              }
            }
          ],
          "max_score": 0.4,
          "scoring_rules": {
            "parameter_accuracy": 0.8,
            "tool_usage": 0.2
          }
        }
      ],
      "nl_assertions": [
        "The assistant should guide Maria through the authentication process with clear, simple instructions",
        "The assistant should verify Maria's identity thoroughly before proceeding",
        "The assistant should provide a clear and organized account overview after successful authentication",
        "The assistant should offer to explain account details in simple terms if Maria gets distracted",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "+1 (555) 123-4567",
        "$2,345.67"
      ]
    }
  },
  {
    "id": "21_banking_auth_easy_2_hard_001_systematic",
    "description": {
      "purpose": "Authentication hard shift - EASY_2 persona security escalation",
      "relevant_policies": "Authentication policies and procedures.",
      "notes": "3-goal hard shift with easily distracted, casual, confused user."
    },
    "user_scenario": {
      "persona": "EASY_2",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Account access help - hard pattern",
        "known_info": "You are Jordan Smith with phone number +15558675309, date of birth 1994-09-02, and email user.002@example.com.",
        "unknown_info": "Specifics about login issues",
        "task_instructions": "Start with login help, then check transactions, then report fraud and secure account."
      },
      "goal_shifts": {
        "required_shifts": 2,
        "goals": [
          "authentication",
          "transactions",
          "fraud_response"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15558675309",
          "customer_id": "cust_202",
          "authenticated": false,
          "primary_account_id": "acc_202",
          "primary_card_id": "card_202"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "auth_phone",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15558675309"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_202"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "trans_check",
          "allowed_tools": [
            {
              "function_name": "get_transactions",
              "params": {
                "account_id": "acc_202"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "fraud_response",
          "allowed_tools": [
            {
              "function_name": "lock_card",
              "params": {
                "card_id": "card_202"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "The assistant provided comprehensive service to Jordan Smith from login through fraud protection.",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "+15558675309",
        "$3,250.50",
        "card_202",
        "\u2022\u2022\u2022\u20224567"
      ]
    }
  },
  {
    "id": "22_banking_auth_medium_1_single_001_systematic",
    "description": {
      "purpose": "Authentication only - MEDIUM_1 persona baseline test",
      "relevant_policies": "Authentication policies and procedures.",
      "notes": "No goal shift - tests core competency with business-focused, impatient, efficient user."
    },
    "user_scenario": {
      "persona": "MEDIUM_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Account access help - single pattern",
        "known_info": "You are Taylor Johnson with phone number +15551230987, date of birth 1991-05-06, and email user.003@example.com.",
        "unknown_info": "Specifics about login issues",
        "task_instructions": "Get help with account access and verify your identity."
      },
      "goal_shifts": {
        "required_shifts": 0,
        "goals": [
          "authentication"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15551230987",
          "customer_id": "cust_303",
          "authenticated": false,
          "primary_account_id": "acc_303",
          "primary_card_id": "card_303"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "auth_phone",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15551230987"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_303"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "The assistant professionally authenticated Taylor Johnson."
      ],
      "communicate_info": [
        "+15551230987",
        "$1,850.25",
        "card_303",
        "\u2022\u2022\u2022\u20223456"
      ]
    }
  },
  {
    "id": "23_banking_auth_medium_1_soft_001_systematic",
    "description": {
      "purpose": "Authentication soft shift - MEDIUM_1 persona information flow",
      "relevant_policies": "Authentication policies and procedures.",
      "notes": "2-goal soft shift with business-focused, impatient, efficient user."
    },
    "user_scenario": {
      "persona": "MEDIUM_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Account access help - soft pattern",
        "known_info": "You are Casey Williams with phone number +15551234590, date of birth 1982-03-09, and email user.004@example.com.",
        "unknown_info": "Specifics about login issues",
        "task_instructions": "Get authenticated, then ask for account overview."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "authentication",
          "account_info"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15551234590",
          "customer_id": "cust_401",
          "authenticated": false,
          "primary_account_id": "acc_401",
          "primary_card_id": "card_401"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "auth_phone",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15551234590"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_401"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "account_info",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_401"
              }
            },
            {
              "function_name": "get_accounts",
              "params": {
                "customer_id": "cust_401"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "The assistant smoothly authenticated Casey Williams and provided account overview.",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$5,420.75",
        "$25,000.00",
        "card_401",
        "\u2022\u2022\u2022\u20222345"
      ]
    }
  },
  {
    "id": "24_banking_auth_medium_1_hard_001_systematic",
    "description": {
      "purpose": "Authentication hard shift - MEDIUM_1 persona security escalation",
      "relevant_policies": "Authentication policies and procedures.",
      "notes": "3-goal hard shift with business-focused, impatient, efficient user."
    },
    "user_scenario": {
      "persona": "MEDIUM_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Account access help - hard pattern",
        "known_info": "You are Riley Brown with phone number +15559876543, date of birth 1989-10-21, and email user.005@example.com.",
        "unknown_info": "Specifics about login issues",
        "task_instructions": "Start with login help, then check transactions, then report fraud and secure account."
      },
      "goal_shifts": {
        "required_shifts": 2,
        "goals": [
          "authentication",
          "transactions",
          "fraud_response"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15559876543",
          "customer_id": "cust_505",
          "authenticated": false,
          "primary_account_id": "acc_505",
          "primary_card_id": "card_505"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "auth_phone",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15559876543"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_505"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "trans_review",
          "allowed_tools": [
            {
              "function_name": "get_transactions",
              "params": {
                "account_id": "acc_505"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "fraud_file",
          "allowed_tools": [
            {
              "function_name": "lock_card",
              "params": {
                "card_id": "card_505"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "The assistant provided full-service help to Riley Brown from authentication through fraud protection.",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$15,750.40",
        "card_505",
        "\u2022\u2022\u2022\u20229876"
      ]
    }
  },
  {
    "id": "25_banking_auth_medium_2_single_001_systematic",
    "description": {
      "purpose": "Authentication only - MEDIUM_2 persona baseline test",
      "relevant_policies": "Authentication policies and procedures.",
      "notes": "No goal shift - tests core competency with curious learner, asks questions, enthusiastic user."
    },
    "user_scenario": {
      "persona": "MEDIUM_2",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Account access help - single pattern",
        "known_info": "You are Alex Morgan with phone number 555-123-7890, date of birth 1980-04-15, and email alex.morgan@email.com.",
        "unknown_info": "Specifics about login issues",
        "task_instructions": "Get help with account access and verify your identity."
      },
      "goal_shifts": {
        "required_shifts": 0,
        "goals": [
          "authentication"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "555-123-7890",
          "customer_id": "cust_001",
          "authenticated": false,
          "primary_account_id": "acc_001",
          "primary_card_id": "card_001"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "auth_phone",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "555-123-7890"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_001"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "The assistant efficiently authenticated Alex Morgan."
      ],
      "communicate_info": [
        "$1,423.75",
        "card_001",
        "\u2022\u2022\u2022\u20226789"
      ]
    }
  },
  {
    "id": "26_banking_auth_medium_2_soft_001_systematic",
    "description": {
      "purpose": "Authentication soft shift - MEDIUM_2 persona information flow",
      "relevant_policies": "Authentication policies and procedures.",
      "notes": "2-goal soft shift with curious learner, asks questions, enthusiastic user."
    },
    "user_scenario": {
      "persona": "MEDIUM_2",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Account access help - soft pattern",
        "known_info": "You are Maria Santos with phone number +15551234567, date of birth 1986-02-11, and email user.001@example.com.",
        "unknown_info": "Specifics about login issues",
        "task_instructions": "Get authenticated, then ask for account overview."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "authentication",
          "account_info"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15551234567",
          "customer_id": "cust_101",
          "authenticated": false,
          "primary_account_id": "acc_101",
          "primary_card_id": "card_101"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "auth_phone",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15551234567"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_101"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "account_overview",
          "allowed_tools": [
            {
              "function_name": "get_accounts",
              "params": {
                "customer_id": "cust_101"
              }
            },
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_101"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "The assistant provided seamless authentication and account overview to Maria Santos.",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$45,230.18",
        "card_101",
        "\u2022\u2022\u2022\u20225678"
      ]
    }
  },
  {
    "id": "27_banking_auth_medium_2_hard_001_systematic",
    "description": {
      "purpose": "Authentication hard shift - MEDIUM_2 persona security escalation",
      "relevant_policies": "Authentication policies and procedures.",
      "notes": "3-goal hard shift with curious learner, asks questions, enthusiastic user."
    },
    "user_scenario": {
      "persona": "MEDIUM_2",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Account access help - hard pattern",
        "known_info": "You are Jordan Smith with phone number +15558675309, date of birth 1994-09-02, and email user.002@example.com.",
        "unknown_info": "Specifics about login issues",
        "task_instructions": "Start with login help, then check transactions, then report fraud and secure account."
      },
      "goal_shifts": {
        "required_shifts": 2,
        "goals": [
          "authentication",
          "transactions",
          "fraud_response"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15558675309",
          "customer_id": "cust_202",
          "authenticated": false,
          "primary_account_id": "acc_202",
          "primary_card_id": "card_202"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "auth_phone",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15558675309"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_202"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "trans_check",
          "allowed_tools": [
            {
              "function_name": "get_transactions",
              "params": {
                "account_id": "acc_202"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "fraud_response",
          "allowed_tools": [
            {
              "function_name": "lock_card",
              "params": {
                "card_id": "card_202"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "The assistant provided complete assistance to Jordan Smith through all service levels.",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$3,250.50",
        "card_202",
        "\u2022\u2022\u2022\u20224567"
      ]
    }
  },
  {
    "id": "28_banking_auth_hard_1_single_001_systematic",
    "description": {
      "purpose": "Authentication only - HARD_1 persona baseline test",
      "relevant_policies": "Authentication policies and procedures.",
      "notes": "No goal shift - tests core competency with suspicious, questioning, demands proof user."
    },
    "user_scenario": {
      "persona": "HARD_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Account access help - single pattern",
        "known_info": "You are Taylor Johnson with phone number +15551230987, date of birth 1991-05-06, and email user.003@example.com.",
        "unknown_info": "Specifics about login issues",
        "task_instructions": "Get help with account access and verify your identity."
      },
      "goal_shifts": {
        "required_shifts": 0,
        "goals": [
          "authentication"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15551230987",
          "customer_id": "cust_303",
          "authenticated": false,
          "primary_account_id": "acc_303",
          "primary_card_id": "card_303"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "auth_phone",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15551230987"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_303"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "The assistant patiently helped Taylor Johnson with authentication."
      ],
      "communicate_info": [
        "$1,850.25",
        "card_303",
        "\u2022\u2022\u2022\u20223456"
      ]
    }
  },
  {
    "id": "29_banking_auth_hard_1_soft_001_systematic",
    "description": {
      "purpose": "Authentication soft shift - HARD_1 persona information flow",
      "relevant_policies": "Authentication policies and procedures.",
      "notes": "2-goal soft shift with suspicious, questioning, demands proof user."
    },
    "user_scenario": {
      "persona": "HARD_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Account access help - soft pattern",
        "known_info": "You are Casey Williams with phone number +15551234590, date of birth 1982-03-09, and email user.004@example.com.",
        "unknown_info": "Specifics about login issues",
        "task_instructions": "Get authenticated, then ask for account overview."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "authentication",
          "account_info"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15551234590",
          "customer_id": "cust_401",
          "authenticated": false,
          "primary_account_id": "acc_401",
          "primary_card_id": "card_401"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "auth_phone",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15551234590"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_401"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "account_info",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_401"
              }
            },
            {
              "function_name": "get_accounts",
              "params": {
                "customer_id": "cust_401"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "The assistant provided supportive authentication and overview service to Casey Williams.",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$5,420.75",
        "card_401",
        "\u2022\u2022\u2022\u20222345"
      ]
    }
  },
  {
    "id": "30_banking_auth_hard_1_hard_001_systematic",
    "description": {
      "purpose": "Authentication hard shift - HARD_1 persona security escalation",
      "relevant_policies": "Authentication policies and procedures.",
      "notes": "3-goal hard shift with suspicious, questioning, demands proof user."
    },
    "user_scenario": {
      "persona": "HARD_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Account access help - hard pattern",
        "known_info": "You are Riley Brown with phone number +15559876543, date of birth 1989-10-21, and email user.005@example.com.",
        "unknown_info": "Specifics about login issues",
        "task_instructions": "Start with login help, then check transactions, then report fraud and secure account."
      },
      "goal_shifts": {
        "required_shifts": 2,
        "goals": [
          "authentication",
          "transactions",
          "fraud_response"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15559876543",
          "customer_id": "cust_505",
          "authenticated": false,
          "primary_account_id": "acc_505",
          "primary_card_id": "card_505"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "auth_phone",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15559876543"
              }
            },
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_505"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "trans_review",
          "allowed_tools": [
            {
              "function_name": "get_transactions",
              "params": {
                "account_id": "acc_505"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "fraud_secure",
          "allowed_tools": [
            {
              "function_name": "lock_card",
              "params": {
                "card_id": "card_505"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "The assistant provided thorough, patient help to Riley Brown through complex authentication and fraud issues.",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$15,750.40",
        "card_505",
        "\u2022\u2022\u2022\u20229876"
      ]
    }
  },
  {
    "id": "31_banking_account_easy_1_single_001_systematic",
    "description": {
      "purpose": "Account Overview only - EASY_1 persona baseline test",
      "relevant_policies": "Account Overview policies and procedures.",
      "notes": "No goal shift - tests core competency with polite, detail-oriented, step-by-step user."
    },
    "user_scenario": {
      "persona": "EASY_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Check account information - single pattern",
        "known_info": "You are Alex Morgan with phone number 555-123-7890, date of birth 1980-04-15, and email alex.morgan@email.com.",
        "unknown_info": "Specifics about account status and balances",
        "task_instructions": "Check your account balances and status."
      },
      "goal_shifts": {
        "required_shifts": 0,
        "goals": [
          "account_info"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "555-123-7890",
          "customer_id": "cust_001"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "customer_details",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_001"
              }
            },
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "555-123-7890"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "account_info",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_001"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "The assistant provided helpful service to Alex Morgan."
      ],
      "communicate_info": [
        "$1,423.75",
        "card_001",
        "\u2022\u2022\u2022\u20226789"
      ]
    }
  },
  {
    "id": "32_banking_account_easy_1_soft_001_systematic",
    "description": {
      "purpose": "Account Overview soft shift - EASY_1 persona information flow",
      "relevant_policies": "Account Overview policies and procedures.",
      "notes": "2-goal soft shift with polite, detail-oriented, step-by-step user."
    },
    "user_scenario": {
      "persona": "EASY_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Check account information - soft pattern",
        "known_info": "You are Maria Santos with phone number +15551234567, date of birth 1986-02-11, and email user.001@example.com.",
        "unknown_info": "Specifics about account status and balances",
        "task_instructions": "Check account balances, then request recent statements."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "account_info",
          "statements"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15551234567",
          "customer_id": "cust_101"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "customer_details",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_101"
              }
            },
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15551234567"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "account_details",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_101"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "statements_view",
          "allowed_tools": [
            {
              "function_name": "get_statements",
              "params": {
                "account_id": "acc_101"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "The assistant provided helpful service to Maria Santos.",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$45,230.18",
        "stmt_101"
      ]
    }
  },
  {
    "id": "33_banking_account_easy_1_hard_001_systematic",
    "description": {
      "purpose": "Account Overview hard shift - EASY_1 persona security escalation",
      "relevant_policies": "Account Overview policies and procedures.",
      "notes": "3-goal hard shift with polite, detail-oriented, step-by-step user."
    },
    "user_scenario": {
      "persona": "EASY_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Check account information - hard pattern",
        "known_info": "You are Jordan Smith with phone number +15558675309, date of birth 1994-09-02, and email user.002@example.com.",
        "unknown_info": "Specifics about account status and balances",
        "task_instructions": "Check account info, then review transactions, then file dispute for suspicious charge."
      },
      "goal_shifts": {
        "required_shifts": 2,
        "goals": [
          "account_info",
          "transactions",
          "dispute"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15558675309",
          "customer_id": "cust_202"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "customer_details",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_202"
              }
            },
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15558675309"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "account_details",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_202"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "trans_history",
          "allowed_tools": [
            {
              "function_name": "get_transactions",
              "params": {
                "account_id": "acc_202"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "fraud_secure",
          "allowed_tools": [
            {
              "function_name": "lock_card",
              "params": {
                "card_id": "card_202"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "The assistant provided helpful service to Jordan Smith.",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$3,250.50",
        "card_202",
        "\u2022\u2022\u2022\u20224567"
      ]
    }
  },
  {
    "id": "34_banking_account_easy_2_single_001_systematic",
    "description": {
      "purpose": "Account Overview only - EASY_2 persona baseline test",
      "relevant_policies": "Account Overview policies and procedures.",
      "notes": "No goal shift - tests core competency with easily distracted, casual, confused user."
    },
    "user_scenario": {
      "persona": "EASY_2",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Check account information - single pattern",
        "known_info": "You are Taylor Johnson with phone number +15551230987, date of birth 1991-05-06, and email user.003@example.com.",
        "unknown_info": "Specifics about account status and balances",
        "task_instructions": "Check your account balances and status."
      },
      "goal_shifts": {
        "required_shifts": 0,
        "goals": [
          "account_info"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15551230987",
          "customer_id": "cust_303"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "customer_details",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_303"
              }
            },
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15551230987"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "account_info",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_303"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "The assistant provided helpful service to Taylor Johnson."
      ],
      "communicate_info": [
        "$1,850.25",
        "card_303",
        "\u2022\u2022\u2022\u20223456"
      ]
    }
  },
  {
    "id": "35_banking_account_easy_2_soft_001_systematic",
    "description": {
      "purpose": "Account Overview soft shift - EASY_2 persona information flow",
      "relevant_policies": "Account Overview policies and procedures.",
      "notes": "2-goal soft shift with easily distracted, casual, confused user."
    },
    "user_scenario": {
      "persona": "EASY_2",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Check account information - soft pattern",
        "known_info": "You are Casey Williams with phone number +15551234590, date of birth 1982-03-09, and email user.004@example.com.",
        "unknown_info": "Specifics about account status and balances",
        "task_instructions": "Check account balances, then request recent statements."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "account_info",
          "statements"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15551234590",
          "customer_id": "cust_401"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "customer_details",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_401"
              }
            },
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15551234590"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "account_details",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_401"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "statements_view",
          "allowed_tools": [
            {
              "function_name": "get_statements",
              "params": {
                "account_id": "acc_401"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "The assistant provided helpful service to Casey Williams.",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$5,420.75",
        "card_401",
        "\u2022\u2022\u2022\u20222345"
      ]
    }
  },
  {
    "id": "36_banking_account_easy_2_hard_001_systematic",
    "description": {
      "purpose": "Account Overview hard shift - EASY_2 persona security escalation",
      "relevant_policies": "Account Overview policies and procedures.",
      "notes": "3-goal hard shift with easily distracted, casual, confused user."
    },
    "user_scenario": {
      "persona": "EASY_2",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Check account information - hard pattern",
        "known_info": "You are Riley Brown with phone number +15559876543, date of birth 1989-10-21, and email user.005@example.com.",
        "unknown_info": "Specifics about account status and balances",
        "task_instructions": "Check account info, then review transactions, then file dispute for suspicious charge."
      },
      "goal_shifts": {
        "required_shifts": 2,
        "goals": [
          "account_info",
          "transactions",
          "dispute"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15559876543",
          "customer_id": "cust_505"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "customer_details",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_505"
              }
            },
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15559876543"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "account_details",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_505"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "trans_review",
          "allowed_tools": [
            {
              "function_name": "get_transactions",
              "params": {
                "account_id": "acc_505"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "fraud_secure",
          "allowed_tools": [
            {
              "function_name": "lock_card",
              "params": {
                "card_id": "card_505"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "The assistant provided helpful service to Riley Brown.",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$15,750.40",
        "card_505",
        "\u2022\u2022\u2022\u20229876"
      ]
    }
  },
  {
    "id": "37_banking_account_medium_1_single_001_systematic",
    "description": {
      "purpose": "Account Overview only - MEDIUM_1 persona baseline test",
      "relevant_policies": "Account Overview policies and procedures.",
      "notes": "No goal shift - tests core competency with business-focused, impatient, efficient user."
    },
    "user_scenario": {
      "persona": "MEDIUM_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Check account information - single pattern",
        "known_info": "You are Alex Morgan with phone number 555-123-7890, date of birth 1980-04-15, and email alex.morgan@email.com.",
        "unknown_info": "Specifics about account status and balances",
        "task_instructions": "Check your account balances and status."
      },
      "goal_shifts": {
        "required_shifts": 0,
        "goals": [
          "account_info"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "555-123-7890",
          "customer_id": "cust_001"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "customer_details",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_001"
              }
            },
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "555-123-7890"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "account_balance",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_001"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "The assistant provided helpful service to Alex Morgan."
      ],
      "communicate_info": [
        "$1,423.75",
        "card_001",
        "\u2022\u2022\u2022\u20226789"
      ]
    }
  },
  {
    "id": "38_banking_account_medium_1_soft_001_systematic",
    "description": {
      "purpose": "Account Overview soft shift - MEDIUM_1 persona information flow",
      "relevant_policies": "Account Overview policies and procedures.",
      "notes": "2-goal soft shift with business-focused, impatient, efficient user."
    },
    "user_scenario": {
      "persona": "MEDIUM_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Check account information - soft pattern",
        "known_info": "You are Maria Santos with phone number +15551234567, date of birth 1986-02-11, and email user.001@example.com.",
        "unknown_info": "Specifics about account status and balances",
        "task_instructions": "Check account balances, then request recent statements."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "account_info",
          "statements"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15551234567",
          "customer_id": "cust_101"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "customer_details",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_101"
              }
            },
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15551234567"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "account_details",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_101"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "account_summary",
          "allowed_tools": [
            {
              "function_name": "get_statements",
              "params": {
                "account_id": "acc_101"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "The assistant provided helpful service to Maria Santos.",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$45,230.18",
        "stmt_101"
      ]
    }
  },
  {
    "id": "39_banking_account_medium_1_hard_001_systematic",
    "description": {
      "purpose": "Account Overview hard shift - MEDIUM_1 persona security escalation",
      "relevant_policies": "Account Overview policies and procedures.",
      "notes": "3-goal hard shift with business-focused, impatient, efficient user."
    },
    "user_scenario": {
      "persona": "MEDIUM_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Check account information - hard pattern",
        "known_info": "You are Jordan Smith with phone number +15558675309, date of birth 1994-09-02, and email user.002@example.com.",
        "unknown_info": "Specifics about account status and balances",
        "task_instructions": "Check account info, then review transactions, then file dispute for suspicious charge."
      },
      "goal_shifts": {
        "required_shifts": 2,
        "goals": [
          "account_info",
          "transactions",
          "dispute"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15558675309",
          "customer_id": "cust_202"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "customer_details",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_202"
              }
            },
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15558675309"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "account_details",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_202"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "trans_analysis",
          "allowed_tools": [
            {
              "function_name": "get_transactions",
              "params": {
                "account_id": "acc_202"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "fraud_response",
          "allowed_tools": [
            {
              "function_name": "lock_card",
              "params": {
                "card_id": "card_202"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "The assistant provided helpful service to Jordan Smith.",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$3,250.50",
        "card_202",
        "\u2022\u2022\u2022\u20224567"
      ]
    }
  },
  {
    "id": "40_banking_account_medium_2_single_001_systematic",
    "description": {
      "purpose": "Account Overview only - MEDIUM_2 persona baseline test",
      "relevant_policies": "Account Overview policies and procedures.",
      "notes": "No goal shift - tests core competency with curious learner, asks questions, enthusiastic user."
    },
    "user_scenario": {
      "persona": "MEDIUM_2",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Check account information - single pattern",
        "known_info": "You are Taylor Johnson with phone number +15551230987, date of birth 1991-05-06, and email user.003@example.com.",
        "unknown_info": "Specifics about account status and balances",
        "task_instructions": "Check your account balances and status."
      },
      "goal_shifts": {
        "required_shifts": 0,
        "goals": [
          "account_info"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15551230987",
          "customer_id": "cust_303"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "customer_details",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_303"
              }
            },
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15551230987"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        },
        {
          "action_id": "account_info",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_303"
              }
            }
          ],
          "max_score": 1.0,
          "scoring_rules": {
            "parameter_accuracy": 1.0,
            "tool_usage": 1.0
          }
        }
      ],
      "nl_assertions": [
        "The assistant provided helpful service to Taylor Johnson."
      ],
      "communicate_info": [
        "$1,850.25",
        "card_303",
        "\u2022\u2022\u2022\u20223456"
      ]
    }
  },
  {
    "id": "41_banking_account_medium_2_soft_001_systematic",
    "description": {
      "purpose": "Account Overview soft shift - MEDIUM_2 persona information flow",
      "relevant_policies": "Account Overview policies and procedures.",
      "notes": "2-goal soft shift with curious learner, asks questions, enthusiastic user."
    },
    "user_scenario": {
      "persona": "MEDIUM_2",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Check account information - soft pattern",
        "known_info": "You are Casey Williams with phone number +15551234590, date of birth 1982-03-09, and email user.004@example.com.",
        "unknown_info": "Specifics about account status and balances",
        "task_instructions": "Check account balances, then request recent statements."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "account_info",
          "statements"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15551234590",
          "customer_id": "cust_401"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "customer_details",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_401"
              }
            },
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15551234590"
              }
            }
          ]
        },
        {
          "action_id": "account_details",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_401"
              }
            }
          ]
        },
        {
          "action_id": "statements_view",
          "allowed_tools": [
            {
              "function_name": "get_statements",
              "params": {
                "account_id": "acc_401"
              }
            }
          ]
        }
      ],
      "nl_assertions": [
        "The assistant provided comprehensive account information and statements to Casey Williams.",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$5,420.75",
        "\u2022\u2022\u2022\u20222345"
      ]
    }
  },
  {
    "id": "42_banking_account_medium_2_hard_001_systematic",
    "description": {
      "purpose": "Account Overview hard shift - MEDIUM_2 persona security escalation",
      "relevant_policies": "Account Overview policies and procedures.",
      "notes": "3-goal hard shift with curious learner, asks questions, enthusiastic user."
    },
    "user_scenario": {
      "persona": "MEDIUM_2",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Check account information - hard pattern",
        "known_info": "You are Riley Brown with phone number +15559876543, date of birth 1989-10-21, and email user.005@example.com.",
        "unknown_info": "Specifics about account status and balances",
        "task_instructions": "Check account info, then review transactions, then file dispute for suspicious charge."
      },
      "goal_shifts": {
        "required_shifts": 2,
        "goals": [
          "account_info",
          "transactions",
          "dispute"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15559876543",
          "customer_id": "cust_505"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "customer_details",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_505"
              }
            },
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15559876543"
              }
            }
          ]
        },
        {
          "action_id": "account_details",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_505"
              }
            }
          ]
        },
        {
          "action_id": "trans_check",
          "allowed_tools": [
            {
              "function_name": "get_transactions",
              "params": {
                "account_id": "acc_505"
              }
            }
          ]
        },
        {
          "action_id": "fraud_lock_only",
          "allowed_tools": [
            {
              "function_name": "lock_card",
              "params": {
                "card_id": "card_505"
              }
            }
          ]
        }
      ],
      "nl_assertions": [
        "The assistant provided helpful account service to Riley Brown.",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$15,750.40",
        "\u2022\u2022\u2022\u20229876"
      ]
    }
  },
  {
    "id": "43_banking_account_hard_1_single_001_systematic",
    "description": {
      "purpose": "Account Overview only - HARD_1 persona baseline test",
      "relevant_policies": "Account Overview policies and procedures.",
      "notes": "No goal shift - tests core competency with suspicious, questioning, demands proof user."
    },
    "user_scenario": {
      "persona": "HARD_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Check account information - single pattern",
        "known_info": "You are Alex Morgan with phone number 555-123-7890, date of birth 1980-04-15, and email alex.morgan@email.com.",
        "unknown_info": "Specifics about account status and balances",
        "task_instructions": "Check your account balances and status."
      },
      "goal_shifts": {
        "required_shifts": 0,
        "goals": [
          "account_info"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "555-123-7890",
          "customer_id": "cust_001"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "customer_details",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_001"
              }
            },
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "555-123-7890"
              }
            }
          ]
        },
        {
          "action_id": "account_balance",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_001"
              }
            }
          ]
        }
      ],
      "nl_assertions": [
        "The assistant provided clear account information to Alex Morgan."
      ],
      "communicate_info": [
        "$1,423.75",
        "\u2022\u2022\u2022\u20226789"
      ]
    }
  },
  {
    "id": "44_banking_account_hard_1_soft_001_systematic",
    "description": {
      "purpose": "Account Overview soft shift - HARD_1 persona information flow",
      "relevant_policies": "Account Overview policies and procedures.",
      "notes": "2-goal soft shift with suspicious, questioning, demands proof user."
    },
    "user_scenario": {
      "persona": "HARD_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Check account information - soft pattern",
        "known_info": "You are Maria Santos with phone number +15551234567, date of birth 1986-02-11, and email user.001@example.com.",
        "unknown_info": "Specifics about account status and balances",
        "task_instructions": "Check account balances, then request recent statements."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "account_info",
          "statements"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15551234567",
          "customer_id": "cust_101"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "customer_details",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_101"
              }
            },
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15551234567"
              }
            }
          ]
        },
        {
          "action_id": "account_details",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_101"
              }
            }
          ]
        },
        {
          "action_id": "statements_view",
          "allowed_tools": [
            {
              "function_name": "get_statements",
              "params": {
                "account_id": "acc_101"
              }
            }
          ]
        }
      ],
      "nl_assertions": [
        "The assistant provided comprehensive account information and statements to Maria Santos.",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$45,230.18"
      ]
    }
  },
  {
    "id": "45_banking_account_hard_1_hard_001_systematic",
    "description": {
      "purpose": "Account Overview hard shift - HARD_1 persona security escalation",
      "relevant_policies": "Account Overview policies and procedures.",
      "notes": "3-goal hard shift with suspicious, questioning, demands proof user."
    },
    "user_scenario": {
      "persona": "HARD_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Check account information - hard pattern",
        "known_info": "You are Jordan Smith with phone number +15558675309, date of birth 1994-09-02, and email user.002@example.com.",
        "unknown_info": "Specifics about account status and balances",
        "task_instructions": "Check account info, then review transactions, then file dispute for suspicious charge."
      },
      "goal_shifts": {
        "required_shifts": 2,
        "goals": [
          "account_info",
          "transactions",
          "dispute"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15558675309",
          "customer_id": "cust_202"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "customer_details",
          "allowed_tools": [
            {
              "function_name": "get_customer_by_id",
              "params": {
                "customer_id": "cust_202"
              }
            },
            {
              "function_name": "get_customer_by_phone",
              "params": {
                "phone_number": "+15558675309"
              }
            }
          ]
        },
        {
          "action_id": "account_details",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_202"
              }
            }
          ]
        },
        {
          "action_id": "trans_review",
          "allowed_tools": [
            {
              "function_name": "get_transactions",
              "params": {
                "account_id": "acc_202"
              }
            }
          ]
        },
        {
          "action_id": "fraud_lock_only",
          "allowed_tools": [
            {
              "function_name": "lock_card",
              "params": {
                "card_id": "card_202"
              }
            }
          ]
        }
      ],
      "nl_assertions": [
        "The assistant provided helpful account service to Jordan Smith.",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$3,250.50",
        "\u2022\u2022\u2022\u20224567"
      ]
    }
  },
  {
    "id": "46_banking_billpay_easy_1_single_001_systematic",
    "description": {
      "purpose": "Bill Pay only - EASY_1 persona baseline test",
      "relevant_policies": "Bill Pay policies and procedures.",
      "notes": "No goal shift - tests core competency with polite, detail-oriented, step-by-step user."
    },
    "user_scenario": {
      "persona": "EASY_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Make bill payment - single pattern",
        "known_info": "You are Taylor Johnson with phone number +15551230987, date of birth 1991-05-06, and email user.003@example.com.",
        "unknown_info": "Specifics about payment processing",
        "task_instructions": "Create a bill payment request from your account."
      },
      "goal_shifts": {
        "required_shifts": 0,
        "goals": [
          "payments"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15551230987",
          "customer_id": "cust_303",
          "primary_account_id": "acc_303"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "payment_create",
          "allowed_tools": [
            {
              "function_name": "create_payment_request",
              "params": {
                "customer_id": "cust_303",
                "from_account_id": "acc_303",
                "to_payee_id": "payee_303",
                "amount": 150.0
              }
            }
          ]
        }
      ],
      "nl_assertions": [
        "The assistant provided helpful account service to Taylor Johnson."
      ],
      "communicate_info": [
        "$150.00"
      ]
    }
  },
  {
    "id": "47_banking_billpay_easy_1_soft_001_systematic",
    "description": {
      "purpose": "Bill Pay soft shift - EASY_1 persona information flow",
      "relevant_policies": "Bill Pay policies and procedures.",
      "notes": "2-goal soft shift with polite, detail-oriented, step-by-step user."
    },
    "user_scenario": {
      "persona": "EASY_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Make bill payment - soft pattern",
        "known_info": "You are Casey Williams with phone number +15551234590, date of birth 1982-03-09, and email user.004@example.com.",
        "unknown_info": "Specifics about payment processing",
        "task_instructions": "Create a bill payment request, then verify account balance."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "payments",
          "account_info"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15551234590",
          "customer_id": "cust_401",
          "primary_account_id": "acc_401"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "payment_create",
          "allowed_tools": [
            {
              "function_name": "create_payment_request",
              "params": {
                "customer_id": "cust_401",
                "from_account_id": "acc_401",
                "to_payee_id": "payee_401",
                "amount": 200.0
              }
            }
          ]
        },
        {
          "action_id": "account_verify",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_401"
              }
            }
          ]
        }
      ],
      "nl_assertions": [
        "The assistant provided helpful account service to Casey Williams.",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$5,420.75",
        "$200.00"
      ]
    }
  },
  {
    "id": "48_banking_billpay_easy_1_hard_001_systematic",
    "description": {
      "purpose": "Bill Pay hard shift - EASY_1 persona security escalation",
      "relevant_policies": "Bill Pay policies and procedures.",
      "notes": "3-goal hard shift with polite, detail-oriented, step-by-step user."
    },
    "user_scenario": {
      "persona": "EASY_1",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Make bill payment - hard pattern",
        "known_info": "You are Riley Brown with phone number +15559876543, date of birth 1989-10-21, and email user.005@example.com.",
        "unknown_info": "Specifics about payment processing",
        "task_instructions": "Create a bill payment request, then lock your card for safety."
      },
      "goal_shifts": {
        "required_shifts": 2,
        "goals": [
          "payments",
          "fraud_response",
          "cards"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15559876543",
          "customer_id": "cust_505",
          "primary_account_id": "acc_505",
          "primary_card_id": "card_505"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "payment_create",
          "allowed_tools": [
            {
              "function_name": "create_payment_request",
              "params": {
                "customer_id": "cust_505",
                "from_account_id": "acc_505",
                "to_payee_id": "payee_505",
                "amount": 300.0
              }
            }
          ]
        },
        {
          "action_id": "fraud_secure",
          "allowed_tools": [
            {
              "function_name": "lock_card",
              "params": {
                "card_id": "card_505"
              }
            }
          ]
        }
      ],
      "nl_assertions": [
        "The assistant provided helpful account service to Riley Brown.",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$300.00",
        "\u2022\u2022\u2022\u20229876"
      ]
    }
  },
  {
    "id": "49_banking_billpay_easy_2_single_001_systematic",
    "description": {
      "purpose": "Bill Pay only - EASY_2 persona baseline test",
      "relevant_policies": "Bill Pay policies and procedures.",
      "notes": "No goal shift - tests core competency with easily distracted, casual, confused user."
    },
    "user_scenario": {
      "persona": "EASY_2",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Make bill payment - single pattern",
        "known_info": "You are Alex Morgan with phone number 555-123-7890, date of birth 1980-04-15, and email alex.morgan@email.com.",
        "unknown_info": "Specifics about payment processing",
        "task_instructions": "Authorize and settle an existing payment request."
      },
      "goal_shifts": {
        "required_shifts": 0,
        "goals": [
          "payments"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "555-123-7890",
          "customer_id": "cust_001",
          "payment_request_id": "req_001"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "payment_status",
          "allowed_tools": [
            {
              "function_name": "check_payment_request",
              "params": {
                "request_id": "req_001"
              }
            }
          ]
        },
        {
          "action_id": "payment_check",
          "allowed_tools": [
            {
              "function_name": "check_payment_request",
              "params": {
                "request_id": "req_001"
              }
            }
          ]
        }
      ],
      "nl_assertions": [
        "The assistant provided helpful account service to Alex Morgan."
      ],
      "communicate_info": [
        "Electric Co.",
        "$65.00"
      ]
    }
  },
  {
    "id": "50_banking_billpay_easy_2_soft_001_systematic",
    "description": {
      "purpose": "Bill Pay soft shift - EASY_2 persona information flow",
      "relevant_policies": "Bill Pay policies and procedures.",
      "notes": "2-goal soft shift with easily distracted, casual, confused user."
    },
    "user_scenario": {
      "persona": "EASY_2",
      "instructions": {
        "domain": "banking",
        "reason_for_call": "Make bill payment - soft pattern",
        "known_info": "You are Maria Santos with phone number +15551234567, date of birth 1986-02-11, and email user.001@example.com.",
        "unknown_info": "Specifics about payment processing",
        "task_instructions": "Create a payment request and then verify your account."
      },
      "goal_shifts": {
        "required_shifts": 1,
        "goals": [
          "payments",
          "account_info"
        ]
      }
    },
    "initial_state": {
      "initialization_data": {
        "agent_data": null,
        "user_data": {
          "phone_number": "+15551234567",
          "customer_id": "cust_101",
          "primary_account_id": "acc_101"
        }
      },
      "message_history": []
    },
    "evaluation_criteria": {
      "action_sets": [
        {
          "action_id": "customer_details",
          "allowed_tools": [
            {
              "function_name": "create_payment_request",
              "params": {
                "customer_id": "cust_101",
                "from_account_id": "acc_101",
                "to_payee_id": "payee_101",
                "amount": 120.0
              }
            }
          ]
        },
        {
          "action_id": "account_verify",
          "allowed_tools": [
            {
              "function_name": "get_account",
              "params": {
                "account_id": "acc_101"
              }
            }
          ]
        }
      ],
      "nl_assertions": [
        "The assistant provided helpful account service to Maria Santos.",
        "Agent did not transfer the customer to a human agent when the goal changed"
      ],
      "communicate_info": [
        "$45,230.18",
        "$120.00"
      ]
    }
  }
]