[
    {
        "problem_id": 2442,
        "domain": [
            "Mathematics -> Applied Mathematics -> Statistics -> Probability -> Counting Methods -> Combinations"
        ],
        "difficulty": 4.0,
        "problem_text": "2015 people sit down at a restaurant. Each person orders a soup with probability $\\frac{1}{2}$. Independently, each person orders a salad with probability $\\frac{1}{2}$. What is the probability that the number of people who ordered a soup is exactly one more than the number of people who ordered a salad?",
        "sample_id": 1,
        "final_answer": "$\\frac{\\binom{4030}{2016}}{2^{4030}}$",
        "steps": [
            {
                "step_id": 1,
                "edge": "We establish the total number of people as given in the problem statement, which is 2015. This foundational count sets the scale for all subsequent random variables and combinatorial calculations.",
                "direct_dependent_steps": null,
                "node": "There are $2015$ people."
            },
            {
                "step_id": 2,
                "edge": "The problem specifies that each person independently orders soup with probability $\\frac{1}{2}$. This independence and identical probability per person are critical for modeling soup orders as a sequence of Bernoulli trials.",
                "direct_dependent_steps": null,
                "node": "Each person orders soup with probability $\\tfrac{1}{2}$ independently."
            },
            {
                "step_id": 3,
                "edge": "Building on the total population count from Step 1, we define $S$ as the random variable representing the number of soup orders. This formalizes the quantity we need to analyze, where $S$ will aggregate outcomes across all 2015 individuals.",
                "direct_dependent_steps": [
                    1
                ],
                "node": "Define $S$ as the number of soups ordered among the $2015$ people."
            },
            {
                "step_id": 4,
                "edge": "Given the independent soup orders with fixed probability $\\frac{1}{2}$ per person (Step 2) and the definition of $S$ (Step 3), we recognize $S$ follows a binomial distribution. Specifically, $S \\sim \\mathrm{Binomial}(n=2015, p=\\frac{1}{2})$ because it counts successes in $n$ identical independent Bernoulli trials.",
                "direct_dependent_steps": [
                    2,
                    3
                ],
                "node": "Then $S\\sim\\mathrm{Binomial}(n=2015,p=\\tfrac{1}{2})$."
            },
            {
                "step_id": 5,
                "edge": "The problem states that salad orders also occur independently per person with probability $\\frac{1}{2}$. This mirrors the soup order setup and will enable symmetric treatment of both food items.",
                "direct_dependent_steps": null,
                "node": "Each person orders salad with probability $\\tfrac{1}{2}$ independently."
            },
            {
                "step_id": 6,
                "edge": "Using the population size from Step 1, we define $T$ as the count of salad orders. This parallels Step 3 for soups, creating a counterpart random variable for salads over the same 2015 people.",
                "direct_dependent_steps": [
                    1
                ],
                "node": "Define $T$ as the number of salads ordered among the $2015$ people."
            },
            {
                "step_id": 7,
                "edge": "Since salad orders are independent with probability $\\frac{1}{2}$ per person (Step 5) and $T$ represents the salad count (Step 6), $T$ must follow $\\mathrm{Binomial}(n=2015, p=\\frac{1}{2})$. This completes the probabilistic model for both food items.",
                "direct_dependent_steps": [
                    5,
                    6
                ],
                "node": "Then $T\\sim\\mathrm{Binomial}(n=2015,p=\\tfrac{1}{2})$."
            },
            {
                "step_id": 8,
                "edge": "The problem clarifies that soup and salad orders are independent for each individual. This per-person independence is a key structural assumption that will later justify independence between the aggregate counts $S$ and $T$.",
                "direct_dependent_steps": null,
                "node": "Soup orders and salad orders by each person are independent."
            },
            {
                "step_id": 9,
                "edge": "Because soup and salad orders are independent per person (Step 8), and all orders are independent across people, the collections defining $S$ (Step 4) and $T$ (Step 7) are independent. Thus, $S$ and $T$ are independent random variables, a crucial property for joint probability calculations.",
                "direct_dependent_steps": [
                    4,
                    7,
                    8
                ],
                "node": "Therefore $S$ and $T$ are independent random variables."
            },
            {
                "step_id": 10,
                "edge": "The problem asks for the probability that soup orders exceed salad orders by exactly one, which translates directly to the event $S = T + 1$. This defines our target probability expression.",
                "direct_dependent_steps": null,
                "node": "We seek $P(S = T + 1)$."
            },
            {
                "step_id": 11,
                "edge": "To compute $P(S = T + 1)$ from Step 10, we apply the law of total probability by conditioning on possible values of $S$. Specifically, we decompose the event into disjoint cases where $S = k$ and $T = k-1$ for some $k$, then sum the joint probabilities over all valid $k$.",
                "direct_dependent_steps": [
                    10
                ],
                "node": "By the law of total probability, $P(S = T + 1)=\\sum_{k}P(S=k\\text{ and }T=k-1)$."
            },
            {
                "step_id": 12,
                "edge": "Given the summation structure from Step 11, we identify valid $k$ values: $S$ must be between 0 and 2015, and $T = k-1$ must also be in [0,2015]. Thus $k$ ranges from 1 to 2015 (inclusive), as $k=0$ would make $T=-1$ (invalid) and $k=2016$ would exceed $S$'s maximum.",
                "direct_dependent_steps": [
                    11
                ],
                "node": "The nonzero terms occur for $k=1,2,\\dots,2015$."
            },
            {
                "step_id": 13,
                "edge": "For $k$ in [1,2015] (Step 12), the independence of $S$ and $T$ (Step 9) allows us to factor the joint probability $P(S=k \\text{ and } T=k-1)$ into the product $P(S=k)P(T=k-1)$. This simplifies the computation by separating the two binomial distributions.",
                "direct_dependent_steps": [
                    9,
                    12
                ],
                "node": "For $1\\le k\\le2015$, independence gives $P(S=k\\text{ and }T=k-1)=P(S=k)P(T=k-1)$."
            },
            {
                "step_id": 14,
                "edge": "Using the binomial distribution of $S$ (Step 4), the probability mass function gives $P(S=k) = \\binom{2015}{k} \\left(\\frac{1}{2}\\right)^k \\left(\\frac{1}{2}\\right)^{2015-k} = \\binom{2015}{k} \\left(\\frac{1}{2}\\right)^{2015}$. The exponents combine cleanly due to $p = 1-p = \\frac{1}{2}$.",
                "direct_dependent_steps": [
                    4
                ],
                "node": "The binomial PMF yields $P(S=k)=\\binom{2015}{k}(\\tfrac{1}{2})^{2015}$."
            },
            {
                "step_id": 15,
                "edge": "Similarly, for $T$ (Step 7), $P(T=k-1) = \\binom{2015}{k-1} \\left(\\frac{1}{2}\\right)^{k-1} \\left(\\frac{1}{2}\\right)^{2015-(k-1)} = \\binom{2015}{k-1} \\left(\\frac{1}{2}\\right)^{2015}$. This mirrors Step 14 but shifts the index to $k-1$ for the salad count.",
                "direct_dependent_steps": [
                    7
                ],
                "node": "Similarly, $P(T=k-1)=\\binom{2015}{k-1}(\\tfrac{1}{2})^{2015}$."
            },
            {
                "step_id": 16,
                "edge": "Combining the factorization from Step 13 with the marginal probabilities from Steps 14 and 15, we multiply the expressions: $\\binom{2015}{k} \\left(\\frac{1}{2}\\right)^{2015} \\times \\binom{2015}{k-1} \\left(\\frac{1}{2}\\right)^{2015} = \\binom{2015}{k} \\binom{2015}{k-1} \\left(\\frac{1}{2}\\right)^{4030}$. The exponents add since $2015 + 2015 = 4030$.",
                "direct_dependent_steps": [
                    13,
                    14,
                    15
                ],
                "node": "Therefore $P(S=k\\text{ and }T=k-1)=\\binom{2015}{k}\\binom{2015}{k-1}(\\tfrac{1}{2})^{4030}$."
            },
            {
                "step_id": 17,
                "edge": "Substituting the joint probability from Step 16 into the total probability sum from Step 11, and restricting to valid $k$ from Step 12, we obtain $P(S=T+1) = \\sum_{k=1}^{2015} \\binom{2015}{k} \\binom{2015}{k-1} \\left(\\frac{1}{2}\\right)^{4030}$. This consolidates all prior components into a single summation expression.",
                "direct_dependent_steps": [
                    11,
                    12,
                    16
                ],
                "node": "Hence $P(S=T+1)=\\sum_{k=1}^{2015}\\binom{2015}{k}\\binom{2015}{k-1}(\\tfrac{1}{2})^{4030}$."
            },
            {
                "step_id": 18,
                "edge": "To reindex the summation in Step 17 for combinatorial simplification, we set $i = k - 1$. This substitution shifts the index so $k = i + 1$, which will align the binomial coefficients with Vandermonde's identity later. The substitution is algebraically reversible and preserves the sum's value.",
                "direct_dependent_steps": [
                    17
                ],
                "node": "Let $i=k-1$, which implies $k=i+1$."
            },
            {
                "step_id": 19,
                "edge": "Applying the substitution $k = i + 1$ (Step 18) to Step 17's sum: when $k=1$, $i=0$; when $k=2015$, $i=2014$. The binomial coefficients become $\\binom{2015}{i+1}$ and $\\binom{2015}{i}$, yielding $\\sum_{i=0}^{2014} \\binom{2015}{i+1} \\binom{2015}{i} \\left(\\frac{1}{2}\\right)^{4030}$. The constant factor remains unchanged.",
                "direct_dependent_steps": [
                    17,
                    18
                ],
                "node": "Then the summation transforms to $\\sum_{i=0}^{2014}\\binom{2015}{i+1}\\binom{2015}{i}(\\tfrac{1}{2})^{4030}$."
            },
            {
                "step_id": 20,
                "edge": "We recall the fundamental binomial coefficient symmetry: $\\binom{n}{r} = \\binom{n}{n-r}$ for $0 \\leq r \\leq n$. This identity, derived from the definition $\\binom{n}{r} = \\frac{n!}{r!(n-r)!}$, will help rewrite terms to match Vandermonde's form.",
                "direct_dependent_steps": null,
                "node": "The binomial coefficient symmetry is $\\binom{n}{r}=\\binom{n}{n-r}$."
            },
            {
                "step_id": 21,
                "edge": "Applying the symmetry identity from Step 20 with $n=2015$ and $r=i+1$, we rewrite $\\binom{2015}{i+1} = \\binom{2015}{2015 - (i+1)}$. This transformation is exact and leverages the combinatorial property that choosing $i+1$ items is equivalent to choosing the remaining $2015 - (i+1)$ items.",
                "direct_dependent_steps": [
                    20
                ],
                "node": "Applying this with $n=2015$ and $r=i+1$ yields $\\binom{2015}{i+1}=\\binom{2015}{2015-(i+1)}$."
            },
            {
                "step_id": 22,
                "edge": "Simplifying the index from Step 21: $2015 - (i + 1) = 2015 - i - 1 = 2014 - i$. This basic algebraic step prepares the binomial coefficient for the upcoming identity application.",
                "direct_dependent_steps": [
                    21
                ],
                "node": "Simplifying gives $2015-(i+1)=2014-i$."
            },
            {
                "step_id": 23,
                "edge": "Combining Steps 21 and 22, we replace $\\binom{2015}{i+1}$ with $\\binom{2015}{2014 - i}$, so the product becomes $\\binom{2015}{2014 - i} \\binom{2015}{i}$. This rewrites the summand into a form where the indices sum to a constant (2014), matching Vandermonde's structure.",
                "direct_dependent_steps": [
                    21,
                    22
                ],
                "node": "Hence $\\binom{2015}{i+1}\\binom{2015}{i}=\\binom{2015}{2014-i}\\binom{2015}{i}$."
            },
            {
                "step_id": 24,
                "edge": "Substituting the transformed product from Step 23 into Step 19's sum, we get $\\sum_{i=0}^{2014} \\binom{2015}{2014 - i} \\binom{2015}{i} \\left(\\frac{1}{2}\\right)^{4030}$. The summation limits and constant factor are preserved, but the binomial indices now satisfy the condition for Vandermonde's identity.",
                "direct_dependent_steps": [
                    19,
                    23
                ],
                "node": "Therefore the sum becomes $\\sum_{i=0}^{2014}\\binom{2015}{2014-i}\\binom{2015}{i}(\\tfrac{1}{2})^{4030}$."
            },
            {
                "step_id": 25,
                "edge": "We invoke Vandermonde's identity, a standard combinatorial result: $\\sum_{i=0}^{m} \\binom{a}{i} \\binom{b}{m-i} = \\binom{a+b}{m}$ for non-negative integers $a, b, m$. This identity arises from expanding $(1+x)^{a+b}$ and equating coefficients, and will collapse our sum into a single binomial coefficient.",
                "direct_dependent_steps": null,
                "node": "Vandermonde's identity states $\\sum_{i=0}^{m}\\binom{a}{i}\\binom{b}{m-i}=\\binom{a+b}{m}$."
            },
            {
                "step_id": 26,
                "edge": "Applying Vandermonde's identity (Step 25) with $a = 2015$, $b = 2015$, and $m = 2014$, the sum $\\sum_{i=0}^{2014} \\binom{2015}{i} \\binom{2015}{2014 - i}$ equals $\\binom{2015 + 2015}{2014} = \\binom{4030}{2014}$. Note the upper limit $2014$ matches $m$, so all terms are valid (no out-of-range binomial coefficients).",
                "direct_dependent_steps": [
                    25
                ],
                "node": "Applying this with $a=b=2015$ and $m=2014$ gives $\\sum_{i=0}^{2014}\\binom{2015}{i}\\binom{2015}{2014-i}=\\binom{4030}{2014}$."
            },
            {
                "step_id": 27,
                "edge": "From Step 26, the summation in Step 24 evaluates to $\\binom{4030}{2014}$. This replaces the entire combinatorial sum with a single binomial coefficient, significantly simplifying the expression.",
                "direct_dependent_steps": [
                    26
                ],
                "node": "Hence the sum equals $\\binom{4030}{2014}$."
            },
            {
                "step_id": 28,
                "edge": "Multiplying the sum result from Step 27 by the constant factor $\\left(\\frac{1}{2}\\right)^{4030}$ (from Step 24), we obtain $P(S=T+1) = \\binom{4030}{2014} \\left(\\frac{1}{2}\\right)^{4030}$. This expresses the probability in closed form, though we will further simplify the binomial coefficient.",
                "direct_dependent_steps": [
                    24,
                    27
                ],
                "node": "Therefore $P(S=T+1)=\\binom{4030}{2014}(\\tfrac{1}{2})^{4030}$."
            },
            {
                "step_id": 29,
                "edge": "We compute $4030 - 2014 = 2016$ to prepare for binomial symmetry. Arithmetic verification: $4030 - 2000 = 2030$, then $2030 - 14 = 2016$. This difference is needed for the symmetry transformation in the next step.",
                "direct_dependent_steps": [
                    28
                ],
                "node": "Compute $4030-2014=2016$."
            },
            {
                "step_id": 30,
                "edge": "Using binomial symmetry (Step 20) with $n=4030$ and $r=2014$, we have $\\binom{4030}{2014} = \\binom{4030}{4030 - 2014}$. This identity holds because the binomial coefficient depends only on the distance from the endpoints, not the specific index.",
                "direct_dependent_steps": [
                    20,
                    28
                ],
                "node": "By symmetry, $\\binom{4030}{2014}=\\binom{4030}{4030-2014}$."
            },
            {
                "step_id": 31,
                "edge": "Substituting the computed difference $4030 - 2014 = 2016$ (Step 29) into the symmetry expression from Step 30, we conclude $\\binom{4030}{2014} = \\binom{4030}{2016}$. This reindexes the binomial coefficient to the form matching the final answer.",
                "direct_dependent_steps": [
                    29,
                    30
                ],
                "node": "Hence $\\binom{4030}{2014}=\\binom{4030}{2016}$."
            },
            {
                "step_id": 32,
                "edge": "Replacing $\\binom{4030}{2014}$ with $\\binom{4030}{2016}$ (Step 31) in the probability expression from Step 28 gives $\\binom{4030}{2016} \\left(\\frac{1}{2}\\right)^{4030} = \\frac{\\binom{4030}{2016}}{2^{4030}}$. This matches the required final answer format and completes the solution.",
                "direct_dependent_steps": [
                    28,
                    31
                ],
                "node": "The final answer is \\boxed{\\frac{\\binom{4030}{2016}}{2^{4030}}}."
            }
        ]
    }
]
