[
    {
        "problem_id": 2354,
        "domain": [
            "Mathematics -> Applied Mathematics -> Statistics -> Probability -> Counting Methods -> Combinations"
        ],
        "difficulty": 5.0,
        "problem_text": "Pick a random integer between 0 and 4095, inclusive. Write it in base 2 (without any leading zeroes). What is the expected number of consecutive digits that are not the same (that is, the expected number of occurrences of either 01 or 10 in the base 2 representation)?",
        "sample_id": 1,
        "final_answer": "\\boxed{20481/4096}",
        "steps": [
            {
                "step_id": 1,
                "edge": "The problem explicitly states that we select an integer uniformly at random from 0 to 4095 inclusive, so we begin by formalizing this uniform selection over the discrete set {0,1,…,4095} as the foundational probability space.",
                "direct_dependent_steps": null,
                "node": "We choose an integer uniformly at random from the set {0,1,…,4095}."
            },
            {
                "step_id": 2,
                "edge": "Since 4096 = 2^12, all integers in [0,4095] have unique 12-bit binary representations when padded with leading zeros to maintain fixed width; this is standard background knowledge in binary number systems for covering exactly 4096 distinct values.",
                "direct_dependent_steps": null,
                "node": "Every integer in this set has a unique 12-bit binary representation possibly including leading zeros."
            },
            {
                "step_id": 3,
                "edge": "Building on the 12-bit representation established in Step 2, we define an indicator random variable Ri for each adjacent bit position i from 1 to 11 to systematically track whether the i-th and (i+1)-th bits differ, creating a structured approach to count transitions.",
                "direct_dependent_steps": [
                    2
                ],
                "node": "We define for each i∈{1,2,…,11} a random variable Ri."
            },
            {
                "step_id": 4,
                "edge": "Following the definition of Ri in Step 3, we specify that Ri equals 1 precisely when the i-th and (i+1)-th bits in the 12-bit string are different (0 and 1 or 1 and 0), which corresponds to the patterns 01 or 10 at position i; this formalizes the transition condition for each pair.",
                "direct_dependent_steps": [
                    3
                ],
                "node": "The random variable Ri equals 1 if and only if the i-th and (i+1)-th bits of the 12-bit representation differ."
            },
            {
                "step_id": 5,
                "edge": "Using the random variables Ri defined in Step 3, we define Y as the sum R1 + R2 + … + R11 to aggregate the total count of adjacent differing bit pairs across the entire 12-bit string, establishing Y as the raw count before considering representation trimming.",
                "direct_dependent_steps": [
                    3
                ],
                "node": "We define Y = R1 + R2 + … + R11."
            },
            {
                "step_id": 6,
                "edge": "By the definition in Step 4 (where each Ri indicates a differing adjacent pair) and Step 5 (where Y is the sum of the Ri), Y directly counts the total number of adjacent differing bit pairs in the 12-bit representation, as each Ri contributes 1 for every transition and 0 otherwise, making Y the unadjusted transition count.",
                "direct_dependent_steps": [
                    4,
                    5
                ],
                "node": "By definition Y counts the number of adjacent differing bit pairs in the 12-bit representation."
            },
            {
                "step_id": 7,
                "edge": "Applying the linearity of expectation to the sum Y defined in Step 5, we express E[Y] as the sum of the individual expectations E[R1] + E[R2] + … + E[R11]; this holds regardless of dependence between the Ri and simplifies the computation by breaking it into identical components.",
                "direct_dependent_steps": [
                    5
                ],
                "node": "The linearity of expectation yields E[Y] = E[R1] + E[R2] + … + E[R11]."
            },
            {
                "step_id": 8,
                "edge": "Given the uniform random selection of the integer (Step 1) and the resulting uniform distribution over all 4096 possible 12-bit strings (Step 2), each pair of adjacent bits is equally likely to be 00, 01, 10, or 11 because the bits are independent and uniformly random in this fixed-length representation, providing symmetry for probability calculations.",
                "direct_dependent_steps": [
                    1,
                    2
                ],
                "node": "In a uniform random 12-bit string each adjacent bit pair is equally likely to be 00, 01, 10, or 11."
            },
            {
                "step_id": 9,
                "edge": "Combining Step 4 (which defines Ri=1 for the patterns 01 or 10) and Step 8 (which states each adjacent pair is equally likely to be one of four possibilities), the probability that Ri=1 is 2/4 = 1/2 for any i, as two favorable outcomes exist out of four equally probable bit pairs.",
                "direct_dependent_steps": [
                    4,
                    8
                ],
                "node": "For each i we have P(Ri = 1) = P(bit-pair is 01 or 10) = 2/4 = 1/2."
            },
            {
                "step_id": 10,
                "edge": "Since Ri is an indicator random variable (it takes only the values 0 and 1, by its definition in Step 4), its expectation E[Ri] equals the probability that Ri=1, which is 1/2 as established in Step 9, leveraging the fundamental property that E[I_A] = P(A) for any event A.",
                "direct_dependent_steps": [
                    9
                ],
                "node": "Hence E[Ri] = 1/2 for each i."
            },
            {
                "step_id": 11,
                "edge": "Substituting the result from Step 10 (E[Ri]=1/2 for each i) into the linearity expression from Step 7 (E[Y] = sum of E[Ri]), we compute E[Y] = 11 * (1/2) = 11/2, performing the arithmetic as 11 multiplied by 0.5 equals 5.5, which is consistent with the expectation for the padded representation.",
                "direct_dependent_steps": [
                    7,
                    10
                ],
                "node": "Consequently E[Y] = 11 * (1/2) = 11/2."
            },
            {
                "step_id": 12,
                "edge": "From Step 6, Y counts adjacent differing pairs in the full 12-bit string including leading zeros, and Step 11 computed E[Y] for this padded representation; however, the problem requires counting in the trimmed representation without leading zeros, so this expectation includes extraneous pairs that must be adjusted for accuracy.",
                "direct_dependent_steps": [
                    6,
                    11
                ],
                "node": "The value E[Y] includes counts of adjacent differing pairs that involve any leading zeros."
            },
            {
                "step_id": 13,
                "edge": "The problem statement explicitly requires writing the binary representation without leading zeros before counting transitions, so Step 12 highlights that our current expectation E[Y] does not match the problem's requirement because it uses the padded 12-bit string, necessitating a correction.",
                "direct_dependent_steps": [
                    12
                ],
                "node": "The problem requires writing the binary representation without leading zeros before counting adjacent differing pairs."
            },
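            {
                "step_id": 14,
                "edge": "Following Step 13's requirement to use the trimmed representation, we observe that if the leading bit (bit 1) of the 12-bit string is zero, then the first adjacent pair (between bit 1 and bit 2) is absent in the trimmed string because leading zeros are removed entirely, regardless of the specific bits in that pair. What matters for the count is how many differing pairs are lost: the removed run of leading zeros contains no transitions internally, so for a nonzero integer exactly one differing pair disappears, namely the 01 at the boundary between the last leading zero and the first 1.",
                "direct_dependent_steps": [
                    13
                ],
                "node": "If the leading bit of the 12-bit string is zero then the first adjacent pair in the 12-bit representation does not appear in the trimmed representation; for a nonzero integer, trimming removes exactly one differing pair, namely the 01 where the leading zeros meet the first 1."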
            },
            {
                "step_id": 15,
                "edge": "From Step 8, the entire 12-bit string is uniformly random, so the first bit is equally likely to be 0 or 1; thus, the probability of a leading zero is 1/2, as there are 2048 strings starting with 0 out of 4096 total strings.",
                "direct_dependent_steps": [
                    8
                ],
                "node": "In a uniform 12-bit string the probability of a leading zero is 1/2."
            },
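            {
                "step_id": 16,
                "edge": "Combining Step 14 (which states that a leading zero causes the first adjacent pair to be structurally absent in the trimmed representation) and Step 15 (which gives P(leading zero)=1/2), we find that the expected number of times the first adjacent pair is removed is 1 * (1/2) = 1/2. Subtracting this 1/2 treats every string with a leading zero as losing exactly one differing pair to trimming (the 01 where the run of leading zeros meets the first 1); that holds for every nonzero integer but not for zero, whose all-zero string contains no such 01, so the zero case is corrected separately in the following steps.",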
                "direct_dependent_steps": [
                    14,
                    15
                ],
                "node": "Therefore the expected number of first adjacent pairs removed equals 1 * (1/2) = 1/2."
            },
            {
                "step_id": 17,
                "edge": "Step 16 introduces a removal adjustment based on leading zeros, but we must consider the edge case where the integer is zero because its representation behaves exceptionally when trimming leading zeros, as zero has no non-zero bits to define the trimmed length.",
                "direct_dependent_steps": [
                    16
                ],
                "node": "An important edge case occurs when the chosen integer is zero."
            },
            {
                "step_id": 18,
                "edge": "As identified in Step 17, when the integer is zero, its 12-bit representation is all zeros (000000000000), so Y=0 (no differing pairs) as per Step 6's definition, meaning there are no transitions to count in either representation.",
                "direct_dependent_steps": [
                    17
                ],
                "node": "If the chosen integer is zero then its 12-bit representation is 000000000000 and Y = 0 yields no adjacent differing pairs."
            },
            {
                "step_id": 19,
                "edge": "In the zero case (Step 18), Step 16's adjustment subtracted 1 for the removal of the first adjacent pair (since the leading bit is zero), but because Y=0 there were no differing pairs to lose; thus, this subtraction was invalid as it incorrectly reduced the count by 1 for a case with no differing pairs, requiring a correction.",
                "direct_dependent_steps": [
                    16,
                    18
                ],
                "node": "In that edge case subtracting a removal of the first pair is incorrect because no differing pairs existed."
            },
            {
                "step_id": 20,
                "edge": "Given the uniform selection over 4096 integers (Step 1), the probability of selecting zero is exactly 1/4096, as there is only one zero in the set {0,1,…,4095}.",
                "direct_dependent_steps": [
                    1
                ],
                "node": "The probability that the chosen integer equals zero is 1/4096."
            },
            {
                "step_id": 21,
                "edge": "To correct the over-subtraction identified in Step 19 (where we subtracted 1 for zero but should not have), we add back 1 specifically for the zero-integer case, ensuring the expectation accurately reflects the absence of transitions in this edge scenario.",
                "direct_dependent_steps": [
                    19
                ],
                "node": "We must therefore add back 1 for this zero-integer case."
            },
            {
                "step_id": 22,
                "edge": "Multiplying the correction from Step 21 (adding 1 for zero) by the probability from Step 20 (P(zero)=1/4096), the expected contribution of this correction is 1 * (1/4096) = 1/4096, performing the multiplication as a straightforward probability-weighted adjustment.",
                "direct_dependent_steps": [
                    20,
                    21
                ],
                "node": "That added value contributes 1 * (1/4096) = 1/4096 to the expectation."
            },
            {
                "step_id": 23,
                "edge": "Combining the original expectation from Step 11 (E[Y]=11/2), the removal adjustment from Step 16 (subtracting 1/2), and the zero-case correction from Step 22 (adding 1/4096), we form the adjusted expectation as E[Y] - 1/2 + 1/4096 to account for trimming leading zeros correctly, as the net adjustment captures the true expected loss of transitions.",
                "direct_dependent_steps": [
                    11,
                    16,
                    22
                ],
                "node": "Combining these adjustments yields the desired expectation E[Y] − 1/2 + 1/4096."
            },
            {
                "step_id": 24,
                "edge": "Substituting the value E[Y]=11/2 from Step 11 into the adjusted expression from Step 23 yields 11/2 - 1/2 + 1/4096, simplifying the subtraction of the first two terms while preserving the fractional correction term.",
                "direct_dependent_steps": [
                    11,
                    23
                ],
                "node": "Substituting E[Y] = 11/2 gives 11/2 − 1/2 + 1/4096."
            },
            {
                "step_id": 25,
                "edge": "Simplifying the arithmetic: 11/2 - 1/2 = 10/2 = 5, then 5 + 1/4096 = (5 * 4096 + 1)/4096 = 20480/4096 + 1/4096 = 20481/4096; a quick sanity check confirms 20481 ÷ 4096 ≈ 5.000244, which is consistent with the problem's context of counting transitions in a 12-bit system after trimming.",
                "direct_dependent_steps": [
                    24
                ],
                "node": "Simplifying yields 5 + 1/4096 = 20481/4096."
            },
            {
                "step_id": 26,
                "edge": "The simplified fraction 20481/4096 from Step 25 is the final expected value for the number of consecutive differing digits in the trimmed binary representation, so we present it as the boxed answer per the problem's requirement.",
                "direct_dependent_steps": [
                    25
                ],
                "node": "The final answer is \\boxed{20481/4096}."
            }
        ]
    }
]
