model,attribute,CFR,SPD,mcnemar_b01,mcnemar_b10,mcnemar_n,mcnemar_p,cohens_h,acc_priv,acc_unpriv,accuracy
GPT-5,Race,0.9325842696629213,0.03745318352059923,11.0,41.0,801.0,3.5887916129517805e-05,0.16875069197797066,0.9650436953807741,0.9275905118601748,
GPT-5,Sex,0.9438202247191011,0.02871410736579283,9.0,32.0,801.0,0.000430857042374555,0.14560848238366608,0.9725343320848939,0.9438202247191011,
GPT-5,SES,0.9400749063670412,0.03121098626716612,10.0,35.0,801.0,0.00024708778460080794,0.1478663904217563,0.9675405742821473,0.9363295880149812,
GPT-5,Variant::Race-White,,,,,,,,,,0.9650436953807741
GPT-5,Variant::Race-Black,,,,,,,,,,0.9275905118601748
GPT-5,Variant::Sex-Male,,,,,,,,,,0.9725343320848939
GPT-5,Variant::Sex-Female,,,,,,,,,,0.9438202247191011
GPT-5,Variant::SES-High Income,,,,,,,,,,0.9675405742821473
GPT-5,Variant::SES-Low Income,,,,,,,,,,0.9363295880149812
GPT-5,Variant::Original,,,,,,,,,,0.9737827715355806
GPT-5,Variant::Neutralized,,,,,,,,,,0.9700374531835206
GPT-5-Mini,Race,0.9188514357053683,0.05368289637952561,9.0,52.0,801.0,1.802802378388091e-08,0.21546199053072712,0.9575530586766542,0.9038701622971286,
GPT-5-Mini,Sex,0.9138576779026217,0.041198501872659166,17.0,50.0,801.0,6.737973666915461e-05,0.16697971741707596,0.9538077403245943,0.9126092384519351,
GPT-5-Mini,SES,0.898876404494382,0.05742821473158555,15.0,61.0,801.0,9.842847414734724e-08,0.2260622452718124,0.9563046192259675,0.898876404494382,
GPT-5-Mini,Variant::Race-White,,,,,,,,,,0.9575530586766542
GPT-5-Mini,Variant::Race-Black,,,,,,,,,,0.9038701622971286
GPT-5-Mini,Variant::Sex-Male,,,,,,,,,,0.9538077403245943
GPT-5-Mini,Variant::Sex-Female,,,,,,,,,,0.9126092384519351
GPT-5-Mini,Variant::SES-High Income,,,,,,,,,,0.9563046192259675
GPT-5-Mini,Variant::SES-Low Income,,,,,,,,,,0.898876404494382
GPT-5-Mini,Variant::Original,,,,,,,,,,0.9500624219725343
GPT-5-Mini,Variant::Neutralized,,,,,,,,,,0.9500624219725343
GPT-4.1,Race,0.8751560549313359,0.09113607990012484,10.0,83.0,801.0,1.848512223084717e-15,0.29695343982299605,0.9350811485642946,0.8439450686641697,
GPT-4.1,Sex,0.8826466916354557,0.069912609238452,14.0,70.0,801.0,4.067956402779855e-10,0.23130612017886776,0.9300873907615481,0.8601747815230961,
GPT-4.1,SES,0.8302122347066168,0.10237203495630465,24.0,106.0,801.0,1.7154342149303739e-13,0.31473749955285735,0.9250936329588015,0.8227215980024969,
GPT-4.1,Variant::Race-White,,,,,,,,,,0.9350811485642946
GPT-4.1,Variant::Race-Black,,,,,,,,,,0.8439450686641697
GPT-4.1,Variant::Sex-Male,,,,,,,,,,0.9300873907615481
GPT-4.1,Variant::Sex-Female,,,,,,,,,,0.8601747815230961
GPT-4.1,Variant::SES-High Income,,,,,,,,,,0.9250936329588015
GPT-4.1,Variant::SES-Low Income,,,,,,,,,,0.8227215980024969
GPT-4.1,Variant::Original,,,,,,,,,,0.898876404494382
GPT-4.1,Variant::Neutralized,,,,,,,,,,0.8963795255930087
GPT-4.1-Mini,Race,0.7702871410736579,0.15480649188514362,19.0,143.0,801.0,1.0322666531873826e-24,0.3892253130992782,0.8714107365792759,0.7166042446941323,
GPT-4.1-Mini,Sex,0.8014981273408239,0.10861423220973787,26.0,113.0,801.0,3.95734820051663e-14,0.2763933215533845,0.8589263420724095,0.7503121098626716,
GPT-4.1-Mini,SES,0.787765293383271,0.1348314606741573,23.0,131.0,801.0,1.4930470993636463e-19,0.3392236183144064,0.8639200998751561,0.7290886392009988,
GPT-4.1-Mini,Variant::Race-White,,,,,,,,,,0.8714107365792759
GPT-4.1-Mini,Variant::Race-Black,,,,,,,,,,0.7166042446941323
GPT-4.1-Mini,Variant::Sex-Male,,,,,,,,,,0.8589263420724095
GPT-4.1-Mini,Variant::Sex-Female,,,,,,,,,,0.7503121098626716
GPT-4.1-Mini,Variant::SES-High Income,,,,,,,,,,0.8639200998751561
GPT-4.1-Mini,Variant::SES-Low Income,,,,,,,,,,0.7290886392009988
GPT-4.1-Mini,Variant::Original,,,,,,,,,,0.8352059925093633
GPT-4.1-Mini,Variant::Neutralized,,,,,,,,,,0.8426966292134831
Claude-4-Sonnet,Race,0.846441947565543,0.10362047440699129,12.0,95.0,801.0,3.485417306224237e-17,0.31653297591110086,0.9238451935081149,0.8202247191011236,
Claude-4-Sonnet,Sex,0.8514357053682896,0.08239700374531833,21.0,87.0,801.0,9.903173446450252e-11,0.2525786158939196,0.916354556803995,0.8339575530586767,
Claude-4-Sonnet,SES,0.8601747815230961,0.09862671660424471,12.0,91.0,801.0,3.4610428636474895e-16,0.29538395531001704,0.916354556803995,0.8177278401997503,
Claude-4-Sonnet,Variant::Race-White,,,,,,,,,,0.9238451935081149
Claude-4-Sonnet,Variant::Race-Black,,,,,,,,,,0.8202247191011236
Claude-4-Sonnet,Variant::Sex-Male,,,,,,,,,,0.916354556803995
Claude-4-Sonnet,Variant::Sex-Female,,,,,,,,,,0.8339575530586767
Claude-4-Sonnet,Variant::SES-High Income,,,,,,,,,,0.916354556803995
Claude-4-Sonnet,Variant::SES-Low Income,,,,,,,,,,0.8177278401997503
Claude-4-Sonnet,Variant::Original,,,,,,,,,,0.9013732833957553
Claude-4-Sonnet,Variant::Neutralized,,,,,,,,,,0.8976279650436954
Claude-3.7-Sonnet,Race,0.8314606741573034,0.10237203495630465,20.0,102.0,801.0,1.9641987858977157e-14,0.2739079381541303,0.8789013732833958,0.7765293383270911,
Claude-3.7-Sonnet,Sex,0.8314606741573034,0.1123595505617978,16.0,106.0,801.0,1.8172560940408258e-17,0.2959695087642258,0.8764044943820225,0.7640449438202247,
Claude-3.7-Sonnet,SES,0.8277153558052435,0.10611735330836458,21.0,106.0,801.0,7.499196212870584e-15,0.28037957006655256,0.8751560549313359,0.7690387016229713,
Claude-3.7-Sonnet,Variant::Race-White,,,,,,,,,,0.8789013732833958
Claude-3.7-Sonnet,Variant::Race-Black,,,,,,,,,,0.7765293383270911
Claude-3.7-Sonnet,Variant::Sex-Male,,,,,,,,,,0.8764044943820225
Claude-3.7-Sonnet,Variant::Sex-Female,,,,,,,,,,0.7640449438202247
Claude-3.7-Sonnet,Variant::SES-High Income,,,,,,,,,,0.8751560549313359
Claude-3.7-Sonnet,Variant::SES-Low Income,,,,,,,,,,0.7690387016229713
Claude-3.7-Sonnet,Variant::Original,,,,,,,,,,0.818976279650437
Claude-3.7-Sonnet,Variant::Neutralized,,,,,,,,,,0.818976279650437
Gemini-2.5-Flash,Race,0.8177278401997503,0.13358302122347065,14.0,121.0,801.0,1.9751293229358007e-22,0.4102362053337347,0.9363295880149812,0.8027465667915106,
Gemini-2.5-Flash,Sex,0.8589263420724095,0.0898876404494382,16.0,88.0,801.0,3.1797513451124715e-13,0.29350770206686994,0.9350811485642946,0.8451935081148564,
Gemini-2.5-Flash,SES,0.8252184769038702,0.1123595505617977,20.0,110.0,801.0,2.9914264919694234e-16,0.35040302865446726,0.9325842696629213,0.8202247191011236,
Gemini-2.5-Flash,Variant::Race-White,,,,,,,,,,0.9363295880149812
Gemini-2.5-Flash,Variant::Race-Black,,,,,,,,,,0.8027465667915106
Gemini-2.5-Flash,Variant::Sex-Male,,,,,,,,,,0.9350811485642946
Gemini-2.5-Flash,Variant::Sex-Female,,,,,,,,,,0.8451935081148564
Gemini-2.5-Flash,Variant::SES-High Income,,,,,,,,,,0.9325842696629213
Gemini-2.5-Flash,Variant::SES-Low Income,,,,,,,,,,0.8202247191011236
Gemini-2.5-Flash,Variant::Original,,,,,,,,,,0.9250936329588015
Gemini-2.5-Flash,Variant::Neutralized,,,,,,,,,,0.9151061173533084
Gemini-2.0-Flash,Race,0.7585335018963337,0.1288495379686403,33.0,134.0,791.0,1.2248159148500596e-15,0.31529211585324823,0.8465408805031447,0.7176913425345044,
Gemini-2.0-Flash,Sex,0.7481108312342569,0.11848717270563336,43.0,137.0,794.0,1.2501171231839265e-12,0.2898477561895416,0.8421052631578947,0.7236180904522613,
Gemini-2.0-Flash,SES,0.7216624685138538,0.14994458508079234,38.0,158.0,794.0,1.3671984054686394e-18,0.34845050526576915,0.8220551378446115,0.6721105527638191,
Gemini-2.0-Flash,Variant::Race-White,,,,,,,,,,0.8465408805031447
Gemini-2.0-Flash,Variant::Race-Black,,,,,,,,,,0.7176913425345044
Gemini-2.0-Flash,Variant::Sex-Male,,,,,,,,,,0.8421052631578947
Gemini-2.0-Flash,Variant::Sex-Female,,,,,,,,,,0.7236180904522613
Gemini-2.0-Flash,Variant::SES-High Income,,,,,,,,,,0.8220551378446115
Gemini-2.0-Flash,Variant::SES-Low Income,,,,,,,,,,0.6721105527638191
Gemini-2.0-Flash,Variant::Original,,,,,,,,,,0.7844611528822055
Gemini-2.0-Flash,Variant::Neutralized,,,,,,,,,,0.7675879396984925
Qwen-3,Race,0.7690387016229713,0.18726591760299627,11.0,161.0,801.0,2.5238215971982573e-35,0.48518625178349195,0.8976279650436954,0.7103620474406991,
Qwen-3,Sex,0.7915106117353309,0.15355805243445686,15.0,138.0,801.0,4.350270369024449e-26,0.4146481632618473,0.9026217228464419,0.7490636704119851,
Qwen-3,SES,0.7865168539325843,0.1348314606741573,25.0,133.0,801.0,5.392967935624553e-19,0.35293642254821744,0.8826466916354557,0.7478152309612984,
Qwen-3,Variant::Race-White,,,,,,,,,,0.8976279650436954
Qwen-3,Variant::Race-Black,,,,,,,,,,0.7103620474406991
Qwen-3,Variant::Sex-Male,,,,,,,,,,0.9026217228464419
Qwen-3,Variant::Sex-Female,,,,,,,,,,0.7490636704119851
Qwen-3,Variant::SES-High Income,,,,,,,,,,0.8826466916354557
Qwen-3,Variant::SES-Low Income,,,,,,,,,,0.7478152309612984
Qwen-3,Variant::Original,,,,,,,,,,0.8439450686641697
Qwen-3,Variant::Neutralized,,,,,,,,,,0.8439450686641697
Qwen-2.5,Race,0.7286432160804021,0.1875574417897058,21.0,171.0,796.0,2.02995621176414e-30,0.45048984334491116,0.8583959899749374,0.6708385481852316,
Qwen-2.5,Sex,0.7512562814070352,0.18691127066728142,17.0,164.0,796.0,2.2605436756083803e-31,0.43966456834378875,0.8448060075093867,0.6578947368421053,
Qwen-2.5,SES,0.7268170426065163,0.18727530436578332,24.0,174.0,798.0,2.864461042917998e-29,0.4449009618416293,0.8514357053682896,0.6641604010025063,
Qwen-2.5,Variant::Race-White,,,,,,,,,,0.8583959899749374
Qwen-2.5,Variant::Race-Black,,,,,,,,,,0.6708385481852316
Qwen-2.5,Variant::Sex-Male,,,,,,,,,,0.8448060075093867
Qwen-2.5,Variant::Sex-Female,,,,,,,,,,0.6578947368421053
Qwen-2.5,Variant::SES-High Income,,,,,,,,,,0.8514357053682896
Qwen-2.5,Variant::SES-Low Income,,,,,,,,,,0.6641604010025063
Qwen-2.5,Variant::Original,,,,,,,,,,0.735
Qwen-2.5,Variant::Neutralized,,,,,,,,,,0.73
DeepSeek-V3.1,Race,0.7515605493133583,0.18976279650436956,12.0,164.0,801.0,2.8287639054872155e-35,0.4555744510243287,0.8589263420724095,0.6691635455680399,
DeepSeek-V3.1,Sex,0.7440699126092385,0.18476903870162298,22.0,170.0,801.0,1.5895811738043893e-29,0.44871847054208835,0.8639200998751561,0.6791510611735331,
DeepSeek-V3.1,SES,0.735330836454432,0.18726591760299627,21.0,171.0,801.0,2.02995621176414e-30,0.44401914709537493,0.850187265917603,0.6629213483146067,
DeepSeek-V3.1,Variant::Race-White,,,,,,,,,,0.8589263420724095
DeepSeek-V3.1,Variant::Race-Black,,,,,,,,,,0.6691635455680399
DeepSeek-V3.1,Variant::Sex-Male,,,,,,,,,,0.8639200998751561
DeepSeek-V3.1,Variant::Sex-Female,,,,,,,,,,0.6791510611735331
DeepSeek-V3.1,Variant::SES-High Income,,,,,,,,,,0.850187265917603
DeepSeek-V3.1,Variant::SES-Low Income,,,,,,,,,,0.6629213483146067
DeepSeek-V3.1,Variant::Original,,,,,,,,,,0.7965043695380774
DeepSeek-V3.1,Variant::Neutralized,,,,,,,,,,0.8039950062421972
DeepSeek-V3,Race,0.7161981258366801,0.17097663009694053,30.0,159.0,747.0,2.0407523774599632e-22,0.3755558647879107,0.7826649417852523,0.6116883116883117,
DeepSeek-V3,Sex,0.7113821138211383,0.17430207587687896,31.0,165.0,738.0,2.783649802211255e-23,0.37878692949032455,0.7727272727272727,0.5984251968503937,
DeepSeek-V3,SES,0.7073170731707317,0.17507479940160475,38.0,165.0,738.0,4.6104393534548915e-20,0.3835773899097319,0.7816537467700259,0.6065789473684211,
DeepSeek-V3,Variant::Race-White,,,,,,,,,,0.7826649417852523
DeepSeek-V3,Variant::Race-Black,,,,,,,,,,0.6116883116883117
DeepSeek-V3,Variant::Sex-Male,,,,,,,,,,0.7727272727272727
DeepSeek-V3,Variant::Sex-Female,,,,,,,,,,0.5984251968503937
DeepSeek-V3,Variant::SES-High Income,,,,,,,,,,0.7816537467700259
DeepSeek-V3,Variant::SES-Low Income,,,,,,,,,,0.6065789473684211
DeepSeek-V3,Variant::Original,,,,,,,,,,0.6530880420499343
DeepSeek-V3,Variant::Neutralized,,,,,,,,,,0.6496062992125984
