# Hand-embedded question samples, keyed by dataset name.
#
#   'aqua'   - multiple-choice math word problems. Each entry has "question",
#              "options" (five strings labelled A-E), "rationale" (worked
#              solution text) and "correct" (the option letter).
#   'hotpot' - short-answer questions. Each entry has "question", "answer"
#              and "type" ("bridge" or "comparison").
#
# Presumably drawn from the AQuA-RAT and HotpotQA datasets - confirm the source.
# A third key, "gsm8k", is added at the bottom of this module at import time.
#
# NOTE(review): some entries are internally inconsistent, e.g. the
# "C19, E21, __, I25" item is labelled "B" although its rationale names G23
# (option D). Presumably inherited from the upstream data - verify before
# treating "correct" as ground truth.
data = {'aqua' :[
{"question": "160 is what percent of 50 ?", "options": ["A) 5%", "B) 20%", "C) 320%", "D) 200%", "E) 500%"], "rationale": "50*x=160 --> x=3.2 --> 3.2 expressed as percent is 320%.\nAnswer: C.", "correct": "C"},
{"question": "What will come in place of the x in the following Number series? 46080, 3840, ?, 48, 8, 2, 1", "options": ["A)1", "B)384", "C)5", "D)7", "E)9"], "rationale": "46080 /12 = 3840\n3840 /10 = 384\n384 /8 = 48\n48 /6 = 8\n8/4 = 2\n2 /2 = 1\nB", "correct": "B"},
{"question": "The length of a rectangle is reduced by 20%. By what % would the width have to be increased to maintainthe original area?", "options": ["A)10%", "B)20%", "C)25%", "D)30%", "E)45%"], "rationale": "Sol. Required change = (20*100)/(100-20)=25%\nC", "correct": "C"},
{"question": "Find the average of first 20 natural numbers?", "options": ["A)5.5", "B)7.2", "C)10.5", "D)12.3", "E)15.5"], "rationale": "Sum of first n natural numbers = n(n+1)/2\nsum of first 20 natural numbers = 20*21/2 =210\naverage = 210/20 = 10.5\nAnswer is C", "correct": "C"},
{"question": "The inverse ratio of 4: 2: 1 is?", "options": ["A)2:4:8", "B)2:3:9", "C)2:3:2", "D)2:3:6", "E)2:3:1"], "rationale": "1/4: 1/2: 1/1 = 2:4:8\nAnswer:A", "correct": "A"},
{"question": "A password of a computer used two digits where they are from 0 and 9. What is the probability that the password solely consists of prime numbers and zero?", "options": ["A)1/32", "B)1/16", "C)1/8", "D)2/5", "E)1/4"], "rationale": "We have two digits can be used for password -0,2,3,5,7.\nAssuming that the numbers can be repeated any number of times in the password, probability of selecting any one of them is 5/10 (out of 10 digits from 0-9)\nSo, 5/10 * 5/10=1/4(E)", "correct": "E"},
{"question": "Three times the first of three consecutive odd integers is 8 more than twice the third. The third integer is:", "options": ["A)9", "B)11", "C)13", "D)15", "E)20"], "rationale": "Let the three integers be x, x + 2 and x+ 4.\nThen,\n3x = 2(x + 4) + 8\nx = 16\nThird integer = x + 4 = 20.\nANSWER:E", "correct": "E"},
{"question": "NHAI employs 100 men to build a highway of 2km in 50 days working 8 hours a day. If in 25 days they completed 1/3 part of work .than how many more employees should NHAI hire to finish it in time working 10 hours a day?", "options": ["A)22", "B)60", "C)28", "D)11", "E)218"], "rationale": "Here 2km is immaterial. The given problem can be written in a tabular form like below.\nWe can apply chain rule now.\nTotal men required to complete the remaining work = 100\u00d72525\u00d7810\u00d72313100\u00d72525\u00d7810\u00d72313 = 160\nSo additional men required = 160 - 100 = 60\nAnswer:B", "correct": "B"},
{"question": "Two trains 111 meters and 165 meters in length respectively are running in opposite directions, one at the rate of 60 km and the other at the rate of 90 kmph. In what time will they be completely clear of each other from the moment they meet?", "options": ["A)4.85", "B)7.85", "C)6.85", "D)5.85", "E)6.62"], "rationale": "T = (111 + 165)/ (60 + 90) * 18/5\nT = 6.62\nANSWER:E", "correct": "E"},
{"question": "A train 500 m long is running at a speed of 78 km/hr. If it crosses a tunnel in 1 min, then the length of the tunnel is?", "options": ["A)277 m", "B)700 m", "C)800 m", "D)187 m", "E)1678 m"], "rationale": "Speed = 78 * 5/18 = 65/3 m/sec.\nTime = 1 min = 60 sec.\nLet the length of the train be x meters.\nThen, (500 + x)/60 = 65/3\nx = 800 m.\nAnswer:C", "correct": "C"},
{"question": "The price of a radio was increased by 25 percent. The new price was then increased by 40 percent. A single increase of what percent is equivalent to these two successive increases?", "options": ["A)80%", "B)75%", "C)65%", "D)50%", "E)45%"], "rationale": "consider base price - $100\n25% increase = 1.25*100 = $125\nanother 40% increase on new price = 1.4* 125 = $175\nso final price of radio - $175\ntherefore a 75% increase\ncorrect option - B", "correct": "B"},
{"question": "Two trains start from P and Q respectively and travel towards each other at a speed of 50 km/hr and 40 km/hr respectively. By the time they meet, the first train has travelled 100 km more than the second. The distance between P and Q is :", "options": ["A)500 km", "B)630 km", "C)900 km", "D)660 km", "E)None"], "rationale": "Sol.\nAt the time of meeting, let the distane travelled byb the second train be x km. Then,\ndistance covered by the first train is (x + 100) km\n\u2234 x/40 = (x+100)/50 \u21d4 50x = 40x 4000 \u21d4 x = 400.\nSo, distance between P and Q = (x+x+100) km = 900 km.\nAnswer C", "correct": "C"},
{"question": "What is the investment made if one invests in 15% stock at 50 and earns Rs.2000?", "options": ["A)5000", "B)2767", "C)2697", "D)126967", "E)19771"], "rationale": "Explanation:\nTo earn Rs.15, investment = Rs.50.\nHence, to earn Rs.1500, investment = (1500*50)/15\n= Rs.5000\nANSWER: A", "correct": "A"},
{"question": "The seating chart of an airplane shows 30 rows of seats. Each row has 3 seats on each side of the center aisle, and one of the seats on each side is a window saet. The view from the window seats in 25 of the rows is obscured by the wings of the airplane. If the first person to be assigned a seat is assigned a window seat and thw window seat is assigned randomly, what is the probability that the person will get a seat with an unobscured view?", "options": ["A)1/6", "B)1/3", "C)2/3", "D)5/6", "E)17/18"], "rationale": "priyalr\n6 seats per row, think of a boeing 737. We have 30 rows, therefore window 30 seats one one side and 30 window seats on the other, totaling 60 window seats on the whole plane.\nthe view of the window of 25 rows is blocked. two wings, therefore 50 window seats are blocked.\nTotal window seats = 60\nTotal blocked window seats = 50\nTotal unblocked seats = 10\nWe know that a window seat was given, therefore probability for not window seat is 10/60 =1/6\nANS A", "correct": "A"},
{"question": "Krishan and Nandan jointly started a business. Krishan invested three times as Nandan did and invested his money for double time as compared to Nandan. If the gain is proportional to the money invested and the time for which the money is invested and the total gain was Rs. 28000, find the earning of Nandan.", "options": ["A)Rs.7000", "B)Rs.5000", "C)Rs.6000", "D)Rs.Rs.4000", "E)Rs.6500"], "rationale": "3:1\n2:1\n------\n6:1\n7 ----- Rs.28000\n1 ----- ? => Rs.28,000/7=Rs. 4000\nAnswer: D", "correct": "D"},
{"question": "A certain bakery sells six different-sized wedding cakes. Each cake costs x dollars more than the next one below it in size, and the price of the largest cake is $24.50. If the sum of the prices of the six different cakes is $109.50, what is the value of x?", "options": ["A) 1.50", "B) 1.75", "C) 2.00", "D) 2.50", "E) 3.00"], "rationale": "Since the price of the largest cake (6th) is $24.50, then the price of the smallest cake (1st) is $(24.50-5x). Now, the prices of the cakes are evenly spaced so the sum of the prices is (average price)*(# of cakes)=(first+last)/2*(# of cakes). So, (24.50-5x+24.50)/2*6= 109.50 --> x=2.5.\nAnswer: D.", "correct": "D"},
{"question": "Three bells chime at intervals of 18 min., 24 min. and 32 min. respectively. At a certain time they begin together. What length Z of time will elapse before they chime together again?", "options": ["A)2 hr. and 24 min.", "B)4 hr. and 48 min.", "C)1 hr. and 36 min.", "D)5 hr.", "E)2 hr."], "rationale": "It should be simple. All the three bells will chime again together whenver their time intervals intersect eachother.\nSo the LCM of the three time intervals (18, 24,32) would be the answer.\nLCM (18, 24, 32) Z= 288 => 4 hours 48 mins.B", "correct": "B"},
{"question": "A man can row downstream at 25 kmph and upstream at 15 kmph. Find the time to reach a destination point at a distance of 50km along the downstream.", "options": ["A)4 hrs.", "B)1 hrs.", "C)3 hrs.", "D)2 hrs.", "E)2 1/2 hrs."], "rationale": "Let the speed of the man in downstream=25 kmph. distance to be covered along the stream=50kmph\n=>time taken =D/S =50/25 =2 Hrs.\nAnswer:D", "correct": "D"},
{"question": "Find the number that fits somewhere into the middle of the series. Some of the items involve both numbers and letters\nLook at this series: C19, E21, __, I25, K27, ... What number should fill the blank?", "options": ["A)D20", "B)E21", "C)F22", "D)G23", "E)H24"], "rationale": "B\nG23\nIn this series, the letters progress by 2, and the numbers increase by 2.", "correct": "B"},
{"question": "A train crosses a platform of 120 m in 15 sec, same train crosses another platform of length 180 m in 18 sec. then find the length of the train?", "options": ["A)276m", "B)180m", "C)286m", "D)288m", "E)277m"], "rationale": "Length of the train be \u2018X\u2019\nX + 120/15 = X + 180/18\n6X + 720 = 5X + 900\nX = 180m\nAnswer:B", "correct": "B"},
{"question": "The ratio of three numbers is 2:3:5 and their sum is 150. The second number of the three numbers is?", "options": ["A)24", "B)26", "C)27", "D)29", "E)45"], "rationale": "2:3:5\nTotal parts = 10\n10 parts --> 150\n1 part ---->15\nThe second number of the three numbers is = 3*15= 45\nAnswer : E", "correct": "E"},
{"question": "For any real number x, the operatoris defined as:\n(x) = x(2 \u2212 x)\nIf p + 2 =(p + 2), then p =", "options": ["A)1", "B)0", "C)1", "D)-2", "E)3"], "rationale": "(x) = x(2 \u2212 x)\n(p + 2) = (p + 2)(2 - p - 2) = -p(p+1)\nWe are given that p + 2 =(p + 2)\nTherefore -p(p+2) = (p + 2)\nOr (p + 2) + p(p+2) = 0\n(p + 2)(p+1) = 0\np = -1,p=-2\nOption D", "correct": "D"},
{"question": "Calculate the circumference of a circular field whose radius is 5 centimeters.", "options": ["A)2", "B)4", "C)6", "D)8", "E)10"], "rationale": "Circumference C is given by\nC = 2\u03c0r = 2\u03c0*5 = 10 \u03c0 cm\ncorrect answer E", "correct": "E"},
{"question": "The average age of five persons is 40 years while the average age of some other 10 persons is 25 years. The average age of all the 15 persons is:", "options": ["A)27 Years", "B)32 Years", "C)37 Years", "D)30 Years", "E)35 Years"], "rationale": "x/5==40\nx==200\nafter 10 person\nx/10==25\nx==250\nso avg btwn 15 person is,,\n(250+200) / 15==30 ans\nANSWER:D", "correct": "D"},
{"question": "A slot machine in a Las Vegas casino has an average profit of $600 for each 8-hour shift for the five days Sunday through Thursday, inclusive. If the average per-shift profit on Friday and Saturday is 25% greater than on the other days of the week and the slot machine is in operation every hour of every day, what is the total weekly profit that the casino makes from the slot machine?", "options": ["A)a - 4500", "B)b - 9000", "C)c - 13,500", "D)d - 15,500", "E)e - 27,000"], "rationale": "Correct answer is C - 13500.\nTotal profit per weekday = $600 X 3 (shifts)= $1800\nTotal profit per week (apart from SaturdaySunday) = $1800 X 5 = $9000\nTotal profit per shift on weekends = $600 X 125/100 = $750\nTotal profit on weekends = $750 X 3 (shifts) X 2 (Saturday, Sunday) = $4500.\nHence the answer is - $4500 + $9000 = $13,500. (C)", "correct": "C"},
{"question": "What is the greatest prime factor of 2^10 - 1?", "options": ["A)17", "B)19", "C)23", "D)29", "E)31"], "rationale": "2^10-1 = (2^5-1)(2^5+1) = 31*33\nThe answer is E.", "correct": "E"},
{"question": "A train overtakes two persons walking along a railway track. The first person walks at 4.5 km/hr and the other walks at 5.4 km/hr. The train needs 8.4 and 8.5 seconds respectively to overtake them. What is the speed of the train if both the persons are walking in the same direction as the train?", "options": ["A)81 km/hr", "B)88 km/hr", "C)62 km/hr", "D)46 km/hr", "E)34 km/hr"], "rationale": "Explanation:\nLet x is the length of the train in meter and y is its speed in kmph\nx/8.4 = (y-4.5)(10/36) ---(1)\nx/8.5 = (y-5.4)(10/36) ---(2)\nDividing 1 by 2\n8.5/8.4 = (y-4.5)/ (y-5.4)\n=> 8.4y - 8.4 \u00d7 4.5 = 8.5y - 8.5\u00d75.4\n.1y = 8.5\u00d75.4 - 8.4\u00d74.5\n=> .1y = 45.9-37.8 = 8.1\n=> y = 81 km/hr\nAnswer: Option A", "correct": "A"},
{"question": "Jones covered a distance of 50 miles on his first trip. On a later trip he traveled 300 miles while going three times as fast. His new time compared with the old time was:", "options": ["A)three times as much", "B)twice as much", "C)the same", "D)half as much", "E)a third as much"], "rationale": "Let speed of the 1st trip x miles / hr. and speed of the 2nd trip 3x / hr.\nWe know that\nSpeed = Distance/Time.\nOr, Time = Distance/Speed.\nSo, times taken to covered a distance of 50 miles on his first trip = 50/x hr.\nAnd times taken to covered a distance of 300 miles on his later trip = 300/3x hr.\n= 100/x hr.\nSo we can clearly see that his new time compared with the old time was: twice as much.\ncorrect answer B", "correct": "B"},
{"question": "There are 32 stations between Ernakulam and Chennai. How many second class tickets have to be printed, so that a passenger can travel from one station to any other station?", "options": ["A)1800", "B)1820", "C)1150", "D)1122", "E)1900"], "rationale": "The total number of stations= 34\nFrom 34 Stations we have to choose any two stations and the direction of travel (Ernakulam to Chennai is different from Chennai to Ernakulam) in 34P2 ways.\n34P2= 34*33= 1122\nANSWER:D", "correct": "D"},
{"question": "A sum of money at simple interest amounts to Rs. 815 in 3 years and to Rs. 854 in 4 years. The sum is?", "options": ["A)650", "B)690", "C)698", "D)700", "E)710"], "rationale": "S.I. for 1 year = Rs. (854 - 815) = Rs. 39.\nS.I. for 3 years = Rs.(39 x 3) = Rs. 117.\nPrincipal = Rs. (815 - 117) = Rs. 698.\nAnswer: Option C", "correct": "C"},
{"question": "A can do a particular work in 6 days . B can do the same work in 8 days. A and B signed to do it for Rs. 3200. They completed the work in 3 days with the help of C. How much is to be paid to C?", "options": ["A)100", "B)400", "C)300", "D)500", "E)700"], "rationale": "Explanation :\nAmount of work A can do in 1 day = 1/6\nAmount of work B can do in 1 day = 1/8\nAmount of work A + B can do in 1 day = 1/6 + 1/8 = 7/24\nAmount of work A + B + C can do = 1/3\nAmount of work C can do in 1 day = 1/3 - 7/24 = 1/24\nwork A can do in 1 day: work B can do in 1 day: work C can do in 1 day\n= 1/6 : 1/8 : 1/24 = 4 : 3 : 1\nAmount to be paid to C = 3200 \u00d7 (1/8) = 400\nANSWER:B", "correct": "B"},
{"question": "A man has Rs.355 in the denominations of one-rupee notes, 20-rupee notes and 50-rupee notes. The number of notes of each denomination is equal. What is the total number of notes that he has ?", "options": ["A)20", "B)15", "C)71", "D)40", "E)60"], "rationale": "Let number of notes of each denomination be x.\nThen x + 20x + 50x = 355\n71x = 355\nx = 5\nHence, total number of notes = 3x = 15.\nAnswer is B.", "correct": "B"}
],
# Short-answer samples; "type" is either "bridge" or "comparison".
'hotpot' :[
    {
        "question": "Who is older Danny Green or James Worthy?",
        "answer": "James Worthy",
        "type": "bridge"
    },
    {
        "question": "Author David Chanoff has collaborated with a U.S. Navy admiral who served as the ambassador to the United Kingdom under which President?",
        "answer": "Bill Clinton",
        "type": "bridge"
    },
    {
        "question": "What was the first year a scientific journal published by an organization located in the Bronx was published?",
        "answer": "1909",
        "type": "bridge"
    },
    {
        "question": "Geoff LaTulippe is an American writer whose best-known work was directed by whom?",
        "answer": "Nanette Burstein",
        "type": "bridge"
    },
    {
        "question": "Are Hoodoo Gurus and Pierre Bouvier of the same nationality?",
        "answer": "no",
        "type": "comparison"
    },
    {
        "question": "Hardley Flood is an area of lagoons that support populations of the waterfowl that are a medium sized version of what animal?",
        "answer": "duck",
        "type": "bridge"
    },
    {
        "question": "The Twelfth United States Army Group commander was the first chairman of what?",
        "answer": "Joint Chiefs of Staff",
        "type": "bridge"
    },
    {
        "question": "Michael Braz completed a libretto for what Georgia college, founded in 1906?",
        "answer": "A Scholar Under Siege",
        "type": "bridge"
    },
    {
        "question": "The 2000 British film Snatch was later adapted into a television series for what streaming service?",
        "answer": "Crackle",
        "type": "bridge"
    },
    {
        "question": "Kurt Fuller from Stockton, CA appeared in which American Detective Comedy Drama television series created by Steve Franks?",
        "answer": "Psych is an American detective comedy-drama",
        "type": "bridge"
    },
    {
        "question": "The central figure used in the corporate branding of Singapore Airlines has been an element of it's marketing since what year?",
        "answer": "1972",
        "type": "bridge"
    },
    {
        "question": "Who was older, Andrew Preston or James Taylor?",
        "answer": "James Taylor",
        "type": "bridge"
    },
    {
        "question": "How many households does the network that Di-Gata Defenders plays on in South Africa reach?",
        "answer": "1.5 million households",
        "type": "bridge"
    },
    {
        "question": "What star of Parks and Recreation appeared in November?",
        "answer": "Nick Offerman",
        "type": "bridge"
    },
    {
        "question": "\"Tunak\", is a bhangra/pop love song by an artist born in which year ?",
        "answer": "1967",
        "type": "bridge"
    },
    {
        "question": "Which peak is flanked by Manaslu, Shispare or Ngadi Chuli?",
        "answer": "Ngadi Chuli",
        "type": "comparison"
    },
    {
        "question": "What was the middle name of the actress who was cast alongside Harvey Fierstein, Linda Hart, Dick Latessa, Clarke Thorell, Mary Bond Davis, Laura Bell Bundy, Matthew Morrison, Corey Reynolds, and Marissa Jaret Winokur in Hairspray?",
        "answer": "Marie",
        "type": "bridge"
    },
    {
        "question": "According to the 2011 census what is the population of the city where Royal Wahingdoh F.C. are based ?",
        "answer": "143,007",
        "type": "bridge"
    },
    {
        "question": "The Ranters were a loose collection of radical so-called heretics whose main objection was with what major division of Christendom?",
        "answer": "Roman Catholicism",
        "type": "bridge"
    },
    {
        "question": "Ruth Vollmer begins work designing window displays for which American luxury jewelry and specialty retailer, headquartered in New York City",
        "answer": "Tiffany's",
        "type": "bridge"
    },
    {
        "question": "What city does the company that owns Bumble and bumble have its headquarters in?",
        "answer": "New York City",
        "type": "bridge"
    },
    {
        "question": "What languages did the son of Sacagawea speak?",
        "answer": "French and English",
        "type": "bridge"
    },
    {
        "question": "Ferdinand Zvonimir von Habsburg is the eldest son of the head of which House",
        "answer": "House of Habsburg-Lorraine",
        "type": "bridge"
    },
    {
        "question": "What schools of thought are drawn from in the academic discipline of Hafiz Rashid Khan?",
        "answer": "postmodern schools of thought",
        "type": "bridge"
    },
    {
        "question": "Alfie Allen played Theon Greyjoy on which show?",
        "answer": "Game of Thrones",
        "type": "bridge"
    },
    {
        "question": "Was Vanderbilt University or Emory University founded first?",
        "answer": "Emory University.",
        "type": "comparison"
    },
    {
        "question": "Hivange is a village in a country that has how many official languages ?",
        "answer": "three official languages",
        "type": "bridge"
    },
    {
        "question": "South Dade High School is located between what two national parks?",
        "answer": "Biscayne National Park to the east and Everglades National Park to the west",
        "type": "bridge"
    },
    {
        "question": "What does the organization associated with Carl Wieland believe about anything other than the young earth view? ",
        "answer": "a compromise on biblical inerrancy",
        "type": "bridge"
    },
    {
        "question": "What award was an actor born in 1955 that acted in the movie Ransom nominated for?",
        "answer": "Academy Award",
        "type": "bridge"
    },
    {
        "question": "Is Northeast Florida Regional Airport farther from St. Augustine than Glacier Park International Airport is to Kalispell?",
        "answer": "no",
        "type": "comparison"
    },
    {
        "question": "Are both Delmer Daves and Jean-Pierre Jeunet film directors?",
        "answer": "yes",
        "type": "comparison"
    },]
}

# --- GSM8K: sample a subset of the dataset and register it in `data` ---

from datasets import load_dataset


def _parse_gsm8k_answer(answer_str: str) -> str:
    """
    Pull the final answer out of a GSM8K solution string.

    GSM8K solutions usually close with a marker line such as '#### 72'.
    The last line beginning with '####' wins; the text after the marker is
    returned with surrounding whitespace removed. If no line carries the
    marker, the last non-blank line is returned instead, and input with no
    non-blank lines yields "".
    """
    marker = "####"

    # Normalise once: trim every line and drop the blank ones.
    trimmed = (raw.strip() for raw in answer_str.strip().splitlines())
    non_blank = [text for text in trimmed if text]

    # Scan bottom-up so a later marker line takes precedence over earlier ones.
    marked = next(
        (text for text in reversed(non_blank) if text.startswith(marker)),
        None,
    )
    if marked is not None:
        return marked[len(marker):].strip()

    return non_blank[-1] if non_blank else ""


def load_gsm8k_subset(n_samples: int = 200, seed: int | None = 0):
    """
    Build a list of GSM8K training examples in this module's record format.

    The "openai/gsm8k" dataset ("main" config, "train" split) is fetched via
    `load_dataset`. When `seed` is not None the split is shuffled with that
    seed first; with `seed=None` the dataset's own order is kept. At most
    `n_samples` leading rows are then taken (fewer if the split is smaller).

    Each returned item is a dict:
        {"question": ..., "rationale": ..., "answer": ...}
    where "rationale" is the dataset's full "answer" text and "answer" is
    the final value extracted from it by `_parse_gsm8k_answer`.
    """
    dataset = load_dataset("openai/gsm8k", "main", split="train")
    if seed is not None:
        dataset = dataset.shuffle(seed=seed)

    # Never ask for more rows than the split actually holds.
    keep = min(n_samples, len(dataset))
    subset = dataset.select(range(keep))

    return [
        {
            "question": row["question"],
            "rationale": row["answer"],
            "answer": _parse_gsm8k_answer(row["answer"]),
        }
        for row in subset
    ]


# Runs at import time: importing this module calls load_gsm8k_subset(), which
# goes through datasets.load_dataset. The 200 rows (shuffle seed 0) are kept
# both as the module-level name `gsm8k_subset` and under data["gsm8k"].
# NOTE(review): this presumably needs network access or a populated local
# dataset cache on first import - confirm that is acceptable for importers.
gsm8k_subset = data["gsm8k"] = load_gsm8k_subset(n_samples=200, seed=0)
