model_baseline,model_variation,alternative_hypo,p_value,effect_size,reject_null_95,reject_null_99,reject_null_999,effect_size_small,effect_size_middle,effect_size_large
llama-3.1-8b,llama_far,llama < llama_far,0.7444857469749591,0.06978239699533395,False,False,False,False,False,False
llama-3.1-8b,llama_pt,llama < llama_pt,0.6305119085371806,0.02358615870397829,False,False,False,False,False,False
llama-3.1-8b,llama_sft,llama < llama_sft,0.7928063986305165,0.09244191088096976,False,False,False,False,False,False
llama-3.1-8b,llama_rl,llama < llama_rl,0.4999999999999999,-0.023948690601140132,False,False,False,False,False,False
gpt-4o,gpt_far,gpt < gpt_far,0.7580713984498729,0.07435690320130961,False,False,False,False,False,False
gpt-4o,gpt_pt,gpt < gpt_pt,0.7018671691042075,0.0500140125301205,False,False,False,False,False,False
gpt-4o,gpt_sft,gpt < gpt_sft,0.7580713984498729,0.07435690320130961,False,False,False,False,False,False
llama-3.1-8b,llama_far,llama > llama_far,0.371262371003717,0.06978239699533395,False,False,False,False,False,False
llama-3.1-8b,llama_pt,llama > llama_pt,0.5,0.02358615870397829,False,False,False,False,False,False
llama-3.1-8b,llama_sft,llama > llama_sft,0.3122384962728688,0.09244191088096976,False,False,False,False,False,False
llama-3.1-8b,llama_rl,llama > llama_rl,0.63243434254182,-0.023948690601140132,False,False,False,False,False,False
gpt-4o,gpt_far,gpt > gpt_far,0.3632114122434048,0.07435690320130961,False,False,False,False,False,False
gpt-4o,gpt_pt,gpt > gpt_pt,0.42993755261247585,0.0500140125301205,False,False,False,False,False,False
gpt-4o,gpt_sft,gpt > gpt_sft,0.3632114122434048,0.07435690320130961,False,False,False,False,False,False
