from statistics import mean, stdev

# DistRL (Qwen3-0.6B)
# time_usage = [
#     566.8, 534.2, 527.4, 528.6, 520.5,      504.7, 480.0, 474.6, 460.2, 467.2,
#     472.3, 482.1, 494.3, 460.4, 453.0,      464.7, 453.8, 459.0, 440.9, 449.0,
#     454.0, 445.1, 435.9, 429.2, 430.7,      447.3, 413.4, 437.5, 421.8, 422.7,
#     444.6,        466.6, 431.9, 453.6,      467.1, 445.4, 475.6, 436.3, 446.0,
#     447.1, 433.4, 462.4, 454.7, 414.1,      444.8, 418.7, 447.9, 420.4, 435.3,

# ]

# GRPO (Qwen3-0.6B)
# time_usage = [
#     538.3, 540.8, 537.4, 526.3, 521.5,      491.5, 491.7, 491.8, 481.0, 476.9,
#     468.5, 502.8, 474.4, 510.8, 478.7,      469.4, 444.2, 461.5, 465.9, 496.4,
#     453.0, 468.9, 458.5, 449.1, 472.5,      457.9, 429.8, 470.4, 469.3, 453.2,
#     466.6,        503.4, 488.0, 480.7,      492.2, 495.4, 523.2, 466.5, 483.9,
#     474.4, 485.7, 514.5, 495.5, 478.1,      509.3, 497.3, 512.3, 552.3, 513.8,
# ]


# DistRL (Llama3.2-1B)
# time_usage = [
#     356.3, 351.1, 349.4, 347.0, 349.4,      343.9, 335.2, 333.0, 334.7, 320.8,
#     316.9, 321.1, 319.5, 323.5, 311.4,      318.2, 315.3, 308.8, 315.5, 308.4,
#     309.3, 309.3, 307.7, 318.0, 319.2,      317.8, 312.3, 310.0, 309.9, 308.7,
#     315.5,        313.3, 313.7, 323.2,      316.8, 320.0, 316.6, 314.4, 316.1,
#     312.1, 309.5, 310.2, 307.4, 313.5,      314.0, 310.1, 314.1, 312.3, 307.3
# ]

# GRPO (Llama3.2-1B)
# Active dataset: 49 timing samples, kept in their recorded order.
# NOTE(review): the unit of these values is not stated in this file — confirm.
time_usage = [
    372.3, 367.2, 365.5, 363.1, 364.0, 357.7, 358.6, 357.7, 359.2, 366.2,
    355.3, 358.5, 357.6, 345.5, 354.6, 354.1, 334.8, 332.1, 351.8, 325.2,
    333.6, 349.1, 338.6, 329.4, 333.4, 344.1, 340.2, 324.8, 328.3, 331.2,
    # This row holds nine values instead of ten.
    351.8, 333.1, 350.6, 339.2, 340.9, 339.0, 365.0, 357.8, 352.2,
    365.5, 348.6, 352.6, 355.2, 353.4, 359.5, 347.6, 358.5, 363.8, 351.6,
]

# Print the mean and then the sample standard deviation, space-separated.
print(*(statistic(time_usage) for statistic in (mean, stdev)))
