[
    {
        "model": "bge-m3",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.7878544330596924,
        "spearman_correlation": 0.7543961601342547,
        "mse_loss": 0.17216134071350098,
        "mae": 0.3627490699291229,
        "baseline_pearson": 0.1369253396987915,
        "baseline_spearman": 0.1879581421769938,
        "baseline_mse": 0.5585750341415405,
        "baseline_mae": 0.5949968695640564,
        "improvement_pearson": 0.6509290933609009,
        "improvement_spearman": 0.5664380179572609,
        "improvement_mse": 0.38641369342803955,
        "improvement_mae": 0.23224779963493347
    },
    {
        "model": "bge-m3",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.8349303007125854,
        "spearman_correlation": 0.7945293638789871,
        "mse_loss": 0.1768345981836319,
        "mae": 0.3836427927017212,
        "baseline_pearson": 0.19434280693531036,
        "baseline_spearman": 0.24139741735584885,
        "baseline_mse": 0.5662572383880615,
        "baseline_mae": 0.6023175120353699,
        "improvement_pearson": 0.6405874937772751,
        "improvement_spearman": 0.5531319465231382,
        "improvement_mse": 0.3894226402044296,
        "improvement_mae": 0.21867471933364868
    },
    {
        "model": "bge-m3",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.6339865922927856,
        "spearman_correlation": 0.5858641045473694,
        "mse_loss": 0.020672688260674477,
        "mae": 0.11130212247371674,
        "baseline_pearson": 0.522790253162384,
        "baseline_spearman": 0.4645520194382577,
        "baseline_mse": 0.02561061829328537,
        "baseline_mae": 0.12287967652082443,
        "improvement_pearson": 0.11119633913040161,
        "improvement_spearman": 0.12131208510911168,
        "improvement_mse": 0.004937930032610893,
        "improvement_mae": 0.011577554047107697
    },
    {
        "model": "bge-m3",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.7528175115585327,
        "spearman_correlation": 0.6260901682555584,
        "mse_loss": 0.03381844982504845,
        "mae": 0.14318707585334778,
        "baseline_pearson": 0.5660955905914307,
        "baseline_spearman": 0.49117351636769296,
        "baseline_mse": 0.25588467717170715,
        "baseline_mae": 0.47704368829727173,
        "improvement_pearson": 0.18672192096710205,
        "improvement_spearman": 0.13491665188786545,
        "improvement_mse": 0.2220662273466587,
        "improvement_mae": 0.33385661244392395
    },
    {
        "model": "bge-m3",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.8344340324401855,
        "spearman_correlation": 0.6655367595699058,
        "mse_loss": 0.26997730135917664,
        "mae": 0.40559378266334534,
        "baseline_pearson": 0.5859602093696594,
        "baseline_spearman": 0.5579253824890382,
        "baseline_mse": 0.7526915669441223,
        "baseline_mae": 0.6014391779899597,
        "improvement_pearson": 0.24847382307052612,
        "improvement_spearman": 0.10761137708086754,
        "improvement_mse": 0.4827142655849457,
        "improvement_mae": 0.19584539532661438
    },
    {
        "model": "bge-m3",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.8010587692260742,
        "spearman_correlation": 0.6154916202835405,
        "mse_loss": 0.38905099034309387,
        "mae": 0.5237476825714111,
        "baseline_pearson": 0.4892534911632538,
        "baseline_spearman": 0.4473216254290259,
        "baseline_mse": 0.9372732639312744,
        "baseline_mae": 0.7346985936164856,
        "improvement_pearson": 0.31180527806282043,
        "improvement_spearman": 0.16816999485451462,
        "improvement_mse": 0.5482222735881805,
        "improvement_mae": 0.21095091104507446
    },
    {
        "model": "bge-m3",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.6060261130332947,
        "spearman_correlation": 0.6312887920976898,
        "mse_loss": 0.004919460974633694,
        "mae": 0.05487659573554993,
        "baseline_pearson": 0.6254838705062866,
        "baseline_spearman": 0.6152419471327459,
        "baseline_mse": 0.00713055906817317,
        "baseline_mae": 0.0656806230545044,
        "improvement_pearson": -0.019457757472991943,
        "improvement_spearman": 0.016046844964943907,
        "improvement_mse": 0.0022110980935394764,
        "improvement_mae": 0.010804027318954468
    },
    {
        "model": "bge-m3",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.7786622047424316,
        "spearman_correlation": 0.763300663145236,
        "mse_loss": 0.010667126625776291,
        "mae": 0.08388462662696838,
        "baseline_pearson": 0.760079026222229,
        "baseline_spearman": 0.750672885029825,
        "baseline_mse": 0.02188076637685299,
        "baseline_mae": 0.1293335258960724,
        "improvement_pearson": 0.018583178520202637,
        "improvement_spearman": 0.012627778115411048,
        "improvement_mse": 0.011213639751076698,
        "improvement_mae": 0.045448899269104004
    },
    {
        "model": "snowflake-arctic-embed-l-v2.0",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.7551729083061218,
        "spearman_correlation": 0.7556168993350396,
        "mse_loss": 0.19515091180801392,
        "mae": 0.38062337040901184,
        "baseline_pearson": 0.15410667657852173,
        "baseline_spearman": 0.2822503974099985,
        "baseline_mse": 0.5542832016944885,
        "baseline_mae": 0.5983566641807556,
        "improvement_pearson": 0.6010662317276001,
        "improvement_spearman": 0.4733665019250411,
        "improvement_mse": 0.3591322898864746,
        "improvement_mae": 0.21773329377174377
    },
    {
        "model": "snowflake-arctic-embed-l-v2.0",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.8120492696762085,
        "spearman_correlation": 0.8026585699155417,
        "mse_loss": 0.20149953663349152,
        "mae": 0.3930036723613739,
        "baseline_pearson": 0.2834065854549408,
        "baseline_spearman": 0.3522057091203521,
        "baseline_mse": 0.5192927122116089,
        "baseline_mae": 0.5712752938270569,
        "improvement_pearson": 0.5286426842212677,
        "improvement_spearman": 0.45045286079518965,
        "improvement_mse": 0.31779317557811737,
        "improvement_mae": 0.17827162146568298
    },
    {
        "model": "snowflake-arctic-embed-l-v2.0",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.6899670958518982,
        "spearman_correlation": 0.6367656258535181,
        "mse_loss": 0.015276269055902958,
        "mae": 0.09382165223360062,
        "baseline_pearson": 0.5688055157661438,
        "baseline_spearman": 0.5112976173272475,
        "baseline_mse": 0.024452416226267815,
        "baseline_mae": 0.12087169289588928,
        "improvement_pearson": 0.1211615800857544,
        "improvement_spearman": 0.1254680085262706,
        "improvement_mse": 0.009176147170364857,
        "improvement_mae": 0.027050040662288666
    },
    {
        "model": "snowflake-arctic-embed-l-v2.0",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.7424056529998779,
        "spearman_correlation": 0.6052256906082247,
        "mse_loss": 0.03785615786910057,
        "mae": 0.14720584452152252,
        "baseline_pearson": 0.6344751119613647,
        "baseline_spearman": 0.5507238507937425,
        "baseline_mse": 0.21676893532276154,
        "baseline_mae": 0.4377840459346771,
        "improvement_pearson": 0.10793054103851318,
        "improvement_spearman": 0.0545018398144822,
        "improvement_mse": 0.17891277745366096,
        "improvement_mae": 0.2905782014131546
    },
    {
        "model": "snowflake-arctic-embed-l-v2.0",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.7276942729949951,
        "spearman_correlation": 0.5975694727575159,
        "mse_loss": 0.4447619616985321,
        "mae": 0.5073715448379517,
        "baseline_pearson": 0.2964806854724884,
        "baseline_spearman": 0.31383153000159686,
        "baseline_mse": 0.7356319427490234,
        "baseline_mae": 0.594689667224884,
        "improvement_pearson": 0.4312135875225067,
        "improvement_spearman": 0.28373794275591907,
        "improvement_mse": 0.29086998105049133,
        "improvement_mae": 0.08731812238693237
    },
    {
        "model": "snowflake-arctic-embed-l-v2.0",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.6357685327529907,
        "spearman_correlation": 0.5359049554968467,
        "mse_loss": 0.5952085852622986,
        "mae": 0.6219803094863892,
        "baseline_pearson": 0.20780715346336365,
        "baseline_spearman": 0.2383830798937171,
        "baseline_mse": 0.9059097170829773,
        "baseline_mae": 0.7093422412872314,
        "improvement_pearson": 0.4279613792896271,
        "improvement_spearman": 0.2975218756031296,
        "improvement_mse": 0.3107011318206787,
        "improvement_mae": 0.08736193180084229
    },
    {
        "model": "snowflake-arctic-embed-l-v2.0",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.5119025707244873,
        "spearman_correlation": 0.48590362115134605,
        "mse_loss": 0.0053964839316904545,
        "mae": 0.06020312011241913,
        "baseline_pearson": 0.5396547913551331,
        "baseline_spearman": 0.5272751919465771,
        "baseline_mse": 0.011953599750995636,
        "baseline_mae": 0.08633793890476227,
        "improvement_pearson": -0.027752220630645752,
        "improvement_spearman": -0.04137157079523107,
        "improvement_mse": 0.0065571158193051815,
        "improvement_mae": 0.02613481879234314
    },
    {
        "model": "snowflake-arctic-embed-l-v2.0",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.7426567077636719,
        "spearman_correlation": 0.7482519519327383,
        "mse_loss": 0.011972521431744099,
        "mae": 0.08651026338338852,
        "baseline_pearson": 0.7233819365501404,
        "baseline_spearman": 0.7216921089468069,
        "baseline_mse": 0.020307404920458794,
        "baseline_mae": 0.11912278831005096,
        "improvement_pearson": 0.019274771213531494,
        "improvement_spearman": 0.026559842985931392,
        "improvement_mse": 0.008334883488714695,
        "improvement_mae": 0.032612524926662445
    },
    {
        "model": "text-embedding-3-large",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.8777076005935669,
        "spearman_correlation": 0.8643990454562551,
        "mse_loss": 0.11885278671979904,
        "mae": 0.2950340509414673,
        "baseline_pearson": 0.4163680672645569,
        "baseline_spearman": 0.5432736055686197,
        "baseline_mse": 0.4616161286830902,
        "baseline_mae": 0.5406297445297241,
        "improvement_pearson": 0.46133953332901,
        "improvement_spearman": 0.3211254398876354,
        "improvement_mse": 0.34276334196329117,
        "improvement_mae": 0.24559569358825684
    },
    {
        "model": "text-embedding-3-large",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.9136272072792053,
        "spearman_correlation": 0.8876150753906337,
        "mse_loss": 0.1199968084692955,
        "mae": 0.29267191886901855,
        "baseline_pearson": 0.5243231654167175,
        "baseline_spearman": 0.5987330520238902,
        "baseline_mse": 0.49014800786972046,
        "baseline_mae": 0.5528956055641174,
        "improvement_pearson": 0.3893040418624878,
        "improvement_spearman": 0.2888820233667435,
        "improvement_mse": 0.37015119940042496,
        "improvement_mae": 0.2602236866950989
    },
    {
        "model": "text-embedding-3-large",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.6465219855308533,
        "spearman_correlation": 0.6224778621854278,
        "mse_loss": 0.01981373131275177,
        "mae": 0.10592655837535858,
        "baseline_pearson": 0.5368365049362183,
        "baseline_spearman": 0.509599906312962,
        "baseline_mse": 0.04638472571969032,
        "baseline_mae": 0.17725123465061188,
        "improvement_pearson": 0.10968548059463501,
        "improvement_spearman": 0.11287795587246574,
        "improvement_mse": 0.026570994406938553,
        "improvement_mae": 0.0713246762752533
    },
    {
        "model": "text-embedding-3-large",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.7056251764297485,
        "spearman_correlation": 0.5765291324777772,
        "mse_loss": 0.04091168940067291,
        "mae": 0.1537952572107315,
        "baseline_pearson": 0.6150497198104858,
        "baseline_spearman": 0.5715964042787275,
        "baseline_mse": 0.15905116498470306,
        "baseline_mae": 0.36223718523979187,
        "improvement_pearson": 0.0905754566192627,
        "improvement_spearman": 0.004932728199049663,
        "improvement_mse": 0.11813947558403015,
        "improvement_mae": 0.20844192802906036
    },
    {
        "model": "text-embedding-3-large",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.8258661031723022,
        "spearman_correlation": 0.6978581523508371,
        "mse_loss": 0.253279447555542,
        "mae": 0.3714354336261749,
        "baseline_pearson": 0.5234269499778748,
        "baseline_spearman": 0.5864759981881295,
        "baseline_mse": 0.6183682084083557,
        "baseline_mae": 0.5109743475914001,
        "improvement_pearson": 0.3024391531944275,
        "improvement_spearman": 0.11138215416270769,
        "improvement_mse": 0.3650887608528137,
        "improvement_mae": 0.13953891396522522
    },
    {
        "model": "text-embedding-3-large",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.7649705410003662,
        "spearman_correlation": 0.6014489621389167,
        "mse_loss": 0.3746911287307739,
        "mae": 0.4983021020889282,
        "baseline_pearson": 0.432989239692688,
        "baseline_spearman": 0.4368091815720614,
        "baseline_mse": 0.8056158423423767,
        "baseline_mae": 0.6695317029953003,
        "improvement_pearson": 0.3319813013076782,
        "improvement_spearman": 0.16463978056685535,
        "improvement_mse": 0.4309247136116028,
        "improvement_mae": 0.17122960090637207
    },
    {
        "model": "text-embedding-3-large",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.48266592621803284,
        "spearman_correlation": 0.5435455949510549,
        "mse_loss": 0.007368025835603476,
        "mae": 0.07009919732809067,
        "baseline_pearson": 0.5525341033935547,
        "baseline_spearman": 0.5639582662029577,
        "baseline_mse": 0.008408023975789547,
        "baseline_mae": 0.07173997163772583,
        "improvement_pearson": -0.06986817717552185,
        "improvement_spearman": -0.020412671251902825,
        "improvement_mse": 0.0010399981401860714,
        "improvement_mae": 0.0016407743096351624
    },
    {
        "model": "text-embedding-3-large",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.6551828384399414,
        "spearman_correlation": 0.6829750690033419,
        "mse_loss": 0.01584281586110592,
        "mae": 0.09991515427827835,
        "baseline_pearson": 0.5883725881576538,
        "baseline_spearman": 0.6480148733153028,
        "baseline_mse": 0.025501079857349396,
        "baseline_mae": 0.13185398280620575,
        "improvement_pearson": 0.0668102502822876,
        "improvement_spearman": 0.0349601956880391,
        "improvement_mse": 0.009658263996243477,
        "improvement_mae": 0.0319388285279274
    },
    {
        "model": "e5-mistral-7b-instruct",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.8594282865524292,
        "spearman_correlation": 0.8538727404576648,
        "mse_loss": 0.13385331630706787,
        "mae": 0.31019875407218933,
        "baseline_pearson": 0.4976809620857239,
        "baseline_spearman": 0.6156559137276979,
        "baseline_mse": 0.7888655066490173,
        "baseline_mae": 0.6898810863494873,
        "improvement_pearson": 0.3617473244667053,
        "improvement_spearman": 0.2382168267299669,
        "improvement_mse": 0.6550121903419495,
        "improvement_mae": 0.379682332277298
    },
    {
        "model": "e5-mistral-7b-instruct",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.8992952704429626,
        "spearman_correlation": 0.8615558840931518,
        "mse_loss": 0.12002211064100266,
        "mae": 0.2864231467247009,
        "baseline_pearson": 0.6277625560760498,
        "baseline_spearman": 0.7019842619521564,
        "baseline_mse": 0.6773322820663452,
        "baseline_mae": 0.5756174325942993,
        "improvement_pearson": 0.27153271436691284,
        "improvement_spearman": 0.1595716221409954,
        "improvement_mse": 0.5573101714253426,
        "improvement_mae": 0.2891942858695984
    },
    {
        "model": "e5-mistral-7b-instruct",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.5400815606117249,
        "spearman_correlation": 0.49985130627415486,
        "mse_loss": 0.027304736897349358,
        "mae": 0.12807168066501617,
        "baseline_pearson": 0.37987083196640015,
        "baseline_spearman": 0.35132273589146856,
        "baseline_mse": 0.08493253588676453,
        "baseline_mae": 0.24908985197544098,
        "improvement_pearson": 0.1602107286453247,
        "improvement_spearman": 0.1485285703826863,
        "improvement_mse": 0.05762779898941517,
        "improvement_mae": 0.1210181713104248
    },
    {
        "model": "e5-mistral-7b-instruct",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.5925794839859009,
        "spearman_correlation": 0.5497968496840806,
        "mse_loss": 0.07335476577281952,
        "mae": 0.19527225196361542,
        "baseline_pearson": 0.4823821187019348,
        "baseline_spearman": 0.4816329804237789,
        "baseline_mse": 0.5332337617874146,
        "baseline_mae": 0.7104365229606628,
        "improvement_pearson": 0.11019736528396606,
        "improvement_spearman": 0.06816386926030171,
        "improvement_mse": 0.45987899601459503,
        "improvement_mae": 0.5151642709970474
    },
    {
        "model": "e5-mistral-7b-instruct",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.8570863008499146,
        "spearman_correlation": 0.7198318589506133,
        "mse_loss": 0.22251948714256287,
        "mae": 0.3427633047103882,
        "baseline_pearson": 0.7716249823570251,
        "baseline_spearman": 0.7200223642926882,
        "baseline_mse": 0.7771866917610168,
        "baseline_mae": 0.566684901714325,
        "improvement_pearson": 0.0854613184928894,
        "improvement_spearman": -0.0001905053420748759,
        "improvement_mse": 0.554667204618454,
        "improvement_mae": 0.22392159700393677
    },
    {
        "model": "e5-mistral-7b-instruct",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.782118022441864,
        "spearman_correlation": 0.6489993300262328,
        "mse_loss": 0.3278059959411621,
        "mae": 0.45458343625068665,
        "baseline_pearson": 0.701436460018158,
        "baseline_spearman": 0.6187674946816014,
        "baseline_mse": 0.8923483490943909,
        "baseline_mae": 0.6829137206077576,
        "improvement_pearson": 0.08068156242370605,
        "improvement_spearman": 0.030231835344631364,
        "improvement_mse": 0.5645423531532288,
        "improvement_mae": 0.22833028435707092
    },
    {
        "model": "e5-mistral-7b-instruct",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.38312816619873047,
        "spearman_correlation": 0.4630011444571606,
        "mse_loss": 0.009905961342155933,
        "mae": 0.08297523856163025,
        "baseline_pearson": 0.26931232213974,
        "baseline_spearman": 0.34380115334614825,
        "baseline_mse": 0.007926326245069504,
        "baseline_mae": 0.07401411980390549,
        "improvement_pearson": 0.11381584405899048,
        "improvement_spearman": 0.11919999111101237,
        "improvement_mse": -0.0019796350970864296,
        "improvement_mae": -0.008961118757724762
    },
    {
        "model": "e5-mistral-7b-instruct",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.7003799676895142,
        "spearman_correlation": 0.712931301783626,
        "mse_loss": 0.02349545992910862,
        "mae": 0.12829819321632385,
        "baseline_pearson": 0.5901201367378235,
        "baseline_spearman": 0.6602471835947109,
        "baseline_mse": 0.04947347193956375,
        "baseline_mae": 0.19630166888237,
        "improvement_pearson": 0.11025983095169067,
        "improvement_spearman": 0.05268411818891505,
        "improvement_mse": 0.02597801201045513,
        "improvement_mae": 0.06800347566604614
    },
    {
        "model": "gte-Qwen2-7B-instruct",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.8590815663337708,
        "spearman_correlation": 0.8601419434088466,
        "mse_loss": 0.13181819021701813,
        "mae": 0.30235427618026733,
        "baseline_pearson": 0.27423495054244995,
        "baseline_spearman": 0.399863267427577,
        "baseline_mse": 0.5485295057296753,
        "baseline_mae": 0.5816904902458191,
        "improvement_pearson": 0.5848466157913208,
        "improvement_spearman": 0.46027867598126965,
        "improvement_mse": 0.41671131551265717,
        "improvement_mae": 0.27933621406555176
    },
    {
        "model": "gte-Qwen2-7B-instruct",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.9125617146492004,
        "spearman_correlation": 0.8765667784686424,
        "mse_loss": 0.112386055290699,
        "mae": 0.2783728539943695,
        "baseline_pearson": 0.455720990896225,
        "baseline_spearman": 0.5347046421790798,
        "baseline_mse": 0.517350971698761,
        "baseline_mae": 0.556111216545105,
        "improvement_pearson": 0.45684072375297546,
        "improvement_spearman": 0.34186213628956263,
        "improvement_mse": 0.404964916408062,
        "improvement_mae": 0.2777383625507355
    },
    {
        "model": "gte-Qwen2-7B-instruct",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.6059024930000305,
        "spearman_correlation": 0.550020614048313,
        "mse_loss": 0.02248263917863369,
        "mae": 0.11351320147514343,
        "baseline_pearson": 0.5106189250946045,
        "baseline_spearman": 0.4993518198480432,
        "baseline_mse": 0.03302350640296936,
        "baseline_mae": 0.1428980827331543,
        "improvement_pearson": 0.09528356790542603,
        "improvement_spearman": 0.05066879420026982,
        "improvement_mse": 0.01054086722433567,
        "improvement_mae": 0.029384881258010864
    },
    {
        "model": "gte-Qwen2-7B-instruct",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.6891536712646484,
        "spearman_correlation": 0.5853158877802812,
        "mse_loss": 0.04254316911101341,
        "mae": 0.15477752685546875,
        "baseline_pearson": 0.610828161239624,
        "baseline_spearman": 0.54753524302367,
        "baseline_mse": 0.20536838471889496,
        "baseline_mae": 0.4215392470359802,
        "improvement_pearson": 0.07832551002502441,
        "improvement_spearman": 0.03778064475661125,
        "improvement_mse": 0.16282521560788155,
        "improvement_mae": 0.2667617201805115
    },
    {
        "model": "gte-Qwen2-7B-instruct",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.8008086085319519,
        "spearman_correlation": 0.7040256549003703,
        "mse_loss": 0.3687315881252289,
        "mae": 0.45897185802459717,
        "baseline_pearson": 0.43017083406448364,
        "baseline_spearman": 0.47153640262470703,
        "baseline_mse": 0.8090472221374512,
        "baseline_mae": 0.6062833666801453,
        "improvement_pearson": 0.37063777446746826,
        "improvement_spearman": 0.23248925227566325,
        "improvement_mse": 0.4403156340122223,
        "improvement_mae": 0.1473115086555481
    },
    {
        "model": "gte-Qwen2-7B-instruct",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.6662585139274597,
        "spearman_correlation": 0.4687185989901955,
        "mse_loss": 0.4226611256599426,
        "mae": 0.5228760242462158,
        "baseline_pearson": 0.3109879493713379,
        "baseline_spearman": 0.30700615625369004,
        "baseline_mse": 0.7535920143127441,
        "baseline_mae": 0.6142871379852295,
        "improvement_pearson": 0.3552705645561218,
        "improvement_spearman": 0.16171244273650548,
        "improvement_mse": 0.3309308886528015,
        "improvement_mae": 0.09141111373901367
    },
    {
        "model": "gte-Qwen2-7B-instruct",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.4793967008590698,
        "spearman_correlation": 0.5343326036955965,
        "mse_loss": 0.007684791926294565,
        "mae": 0.07259005308151245,
        "baseline_pearson": 0.507156491279602,
        "baseline_spearman": 0.5328441427126968,
        "baseline_mse": 0.006578793749213219,
        "baseline_mae": 0.06252744048833847,
        "improvement_pearson": -0.027759790420532227,
        "improvement_spearman": 0.0014884609828997863,
        "improvement_mse": -0.0011059981770813465,
        "improvement_mae": -0.01006261259317398
    },
    {
        "model": "gte-Qwen2-7B-instruct",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.7231854200363159,
        "spearman_correlation": 0.7244225446690274,
        "mse_loss": 0.018668396398425102,
        "mae": 0.11309074610471725,
        "baseline_pearson": 0.6602195501327515,
        "baseline_spearman": 0.6783163340616626,
        "baseline_mse": 0.030490506440401077,
        "baseline_mae": 0.14886574447155,
        "improvement_pearson": 0.06296586990356445,
        "improvement_spearman": 0.04610621060736486,
        "improvement_mse": 0.011822110041975975,
        "improvement_mae": 0.03577499836683273
    },
    {
        "model": "text-embedding-3-small",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.832750141620636,
        "spearman_correlation": 0.8261213123752821,
        "mse_loss": 0.14581722021102905,
        "mae": 0.3267531096935272,
        "baseline_pearson": 0.3544366955757141,
        "baseline_spearman": 0.4849287299060889,
        "baseline_mse": 0.4522722661495209,
        "baseline_mae": 0.5203538537025452,
        "improvement_pearson": 0.4783134460449219,
        "improvement_spearman": 0.3411925824691932,
        "improvement_mse": 0.3064550459384918,
        "improvement_mae": 0.19360074400901794
    },
    {
        "model": "text-embedding-3-small",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.8814281821250916,
        "spearman_correlation": 0.8448582931821239,
        "mse_loss": 0.12945516407489777,
        "mae": 0.3154312074184418,
        "baseline_pearson": 0.5131227970123291,
        "baseline_spearman": 0.5954285078527701,
        "baseline_mse": 0.42912471294403076,
        "baseline_mae": 0.5194165110588074,
        "improvement_pearson": 0.36830538511276245,
        "improvement_spearman": 0.24942978532935378,
        "improvement_mse": 0.299669548869133,
        "improvement_mae": 0.2039853036403656
    },
    {
        "model": "text-embedding-3-small",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.5880706310272217,
        "spearman_correlation": 0.5798310328892936,
        "mse_loss": 0.02136288210749626,
        "mae": 0.1105075404047966,
        "baseline_pearson": 0.5162912607192993,
        "baseline_spearman": 0.4731187399860438,
        "baseline_mse": 0.04374175891280174,
        "baseline_mae": 0.17367644608020782,
        "improvement_pearson": 0.07177937030792236,
        "improvement_spearman": 0.1067122929032498,
        "improvement_mse": 0.02237887680530548,
        "improvement_mae": 0.06316890567541122
    },
    {
        "model": "text-embedding-3-small",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.7259281873703003,
        "spearman_correlation": 0.6270294838587284,
        "mse_loss": 0.04331798478960991,
        "mae": 0.15996935963630676,
        "baseline_pearson": 0.6720682382583618,
        "baseline_spearman": 0.5876094328454649,
        "baseline_mse": 0.1567925065755844,
        "baseline_mae": 0.36030521988868713,
        "improvement_pearson": 0.05385994911193848,
        "improvement_spearman": 0.03942005101326351,
        "improvement_mse": 0.1134745217859745,
        "improvement_mae": 0.20033586025238037
    },
    {
        "model": "text-embedding-3-small",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.7719403505325317,
        "spearman_correlation": 0.6458984830894092,
        "mse_loss": 0.3592841625213623,
        "mae": 0.45410487055778503,
        "baseline_pearson": 0.4285154938697815,
        "baseline_spearman": 0.442573864766155,
        "baseline_mse": 0.7264881134033203,
        "baseline_mae": 0.5855805277824402,
        "improvement_pearson": 0.34342485666275024,
        "improvement_spearman": 0.2033246183232542,
        "improvement_mse": 0.367203950881958,
        "improvement_mae": 0.13147565722465515
    },
    {
        "model": "text-embedding-3-small",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.6758673191070557,
        "spearman_correlation": 0.5393560135790849,
        "mse_loss": 0.43966421484947205,
        "mae": 0.5307916402816772,
        "baseline_pearson": 0.31865382194519043,
        "baseline_spearman": 0.31022110517987883,
        "baseline_mse": 0.7838441133499146,
        "baseline_mae": 0.6526228189468384,
        "improvement_pearson": 0.35721349716186523,
        "improvement_spearman": 0.22913490839920608,
        "improvement_mse": 0.3441798985004425,
        "improvement_mae": 0.12183117866516113
    },
    {
        "model": "text-embedding-3-small",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.3190738558769226,
        "spearman_correlation": 0.38840609340103777,
        "mse_loss": 0.008641705848276615,
        "mae": 0.07599636167287827,
        "baseline_pearson": 0.5391713380813599,
        "baseline_spearman": 0.5480069778553095,
        "baseline_mse": 0.009122451767325401,
        "baseline_mae": 0.07388684898614883,
        "improvement_pearson": -0.22009748220443726,
        "improvement_spearman": -0.15960088445427173,
        "improvement_mse": 0.00048074591904878616,
        "improvement_mae": -0.002109512686729431
    },
    {
        "model": "text-embedding-3-small",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.7149261236190796,
        "spearman_correlation": 0.7222609949763814,
        "mse_loss": 0.012350030243396759,
        "mae": 0.08965839445590973,
        "baseline_pearson": 0.6887919902801514,
        "baseline_spearman": 0.6846353040499118,
        "baseline_mse": 0.019931739196181297,
        "baseline_mae": 0.11592590063810349,
        "improvement_pearson": 0.026134133338928223,
        "improvement_spearman": 0.03762569092646961,
        "improvement_mse": 0.007581708952784538,
        "improvement_mae": 0.026267506182193756
    },
    {
        "model": "gte-base-en-v1.5",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.764320969581604,
        "spearman_correlation": 0.7785728794994328,
        "mse_loss": 0.18738017976284027,
        "mae": 0.3718876838684082,
        "baseline_pearson": 0.22939276695251465,
        "baseline_spearman": 0.35403896246579186,
        "baseline_mse": 0.5291363000869751,
        "baseline_mae": 0.574612557888031,
        "improvement_pearson": 0.5349282026290894,
        "improvement_spearman": 0.4245339170336409,
        "improvement_mse": 0.3417561203241348,
        "improvement_mae": 0.2027248740196228
    },
    {
        "model": "gte-base-en-v1.5",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.823514461517334,
        "spearman_correlation": 0.8048980634836973,
        "mse_loss": 0.18900097906589508,
        "mae": 0.3768625557422638,
        "baseline_pearson": 0.2351376861333847,
        "baseline_spearman": 0.2856273665911698,
        "baseline_mse": 0.5350087881088257,
        "baseline_mae": 0.5797888040542603,
        "improvement_pearson": 0.5883767753839493,
        "improvement_spearman": 0.5192706968925276,
        "improvement_mse": 0.3460078090429306,
        "improvement_mae": 0.20292624831199646
    },
    {
        "model": "gte-base-en-v1.5",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.5484712719917297,
        "spearman_correlation": 0.49931072276361305,
        "mse_loss": 0.022776229307055473,
        "mae": 0.11638258397579193,
        "baseline_pearson": 0.46735748648643494,
        "baseline_spearman": 0.41971960569222405,
        "baseline_mse": 0.02937251701951027,
        "baseline_mae": 0.1361221969127655,
        "improvement_pearson": 0.0811137855052948,
        "improvement_spearman": 0.079591117071389,
        "improvement_mse": 0.006596287712454796,
        "improvement_mae": 0.019739612936973572
    },
    {
        "model": "gte-base-en-v1.5",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.6904107928276062,
        "spearman_correlation": 0.6140638172687956,
        "mse_loss": 0.051585473120212555,
        "mae": 0.17177043855190277,
        "baseline_pearson": 0.6116666793823242,
        "baseline_spearman": 0.5506784572062604,
        "baseline_mse": 0.22397971153259277,
        "baseline_mae": 0.4395391047000885,
        "improvement_pearson": 0.07874411344528198,
        "improvement_spearman": 0.06338536006253515,
        "improvement_mse": 0.17239423841238022,
        "improvement_mae": 0.26776866614818573
    },
    {
        "model": "gte-base-en-v1.5",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.7557564973831177,
        "spearman_correlation": 0.6463959583032958,
        "mse_loss": 0.3815827965736389,
        "mae": 0.45541733503341675,
        "baseline_pearson": 0.4744443893432617,
        "baseline_spearman": 0.4610792475736326,
        "baseline_mse": 0.7267817258834839,
        "baseline_mae": 0.5657123327255249,
        "improvement_pearson": 0.28131210803985596,
        "improvement_spearman": 0.18531671072966316,
        "improvement_mse": 0.34519892930984497,
        "improvement_mae": 0.11029499769210815
    },
    {
        "model": "gte-base-en-v1.5",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.6800497770309448,
        "spearman_correlation": 0.5777898764114695,
        "mse_loss": 0.4863570034503937,
        "mae": 0.5645930171012878,
        "baseline_pearson": 0.4218469262123108,
        "baseline_spearman": 0.40016438373463264,
        "baseline_mse": 0.8783612251281738,
        "baseline_mae": 0.6989898681640625,
        "improvement_pearson": 0.25820285081863403,
        "improvement_spearman": 0.17762549267683686,
        "improvement_mse": 0.39200422167778015,
        "improvement_mae": 0.13439685106277466
    },
    {
        "model": "gte-base-en-v1.5",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.411537766456604,
        "spearman_correlation": 0.43231280347559414,
        "mse_loss": 0.00750502897426486,
        "mae": 0.07296514511108398,
        "baseline_pearson": 0.3918226957321167,
        "baseline_spearman": 0.3917674640829342,
        "baseline_mse": 0.01130613498389721,
        "baseline_mae": 0.08203740417957306,
        "improvement_pearson": 0.019715070724487305,
        "improvement_spearman": 0.04054533939265992,
        "improvement_mse": 0.003801106009632349,
        "improvement_mae": 0.009072259068489075
    },
    {
        "model": "gte-base-en-v1.5",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.7320911884307861,
        "spearman_correlation": 0.7299742370816393,
        "mse_loss": 0.014263728633522987,
        "mae": 0.09850780665874481,
        "baseline_pearson": 0.6382540464401245,
        "baseline_spearman": 0.6604100013471242,
        "baseline_mse": 0.025656284764409065,
        "baseline_mae": 0.13358990848064423,
        "improvement_pearson": 0.09383714199066162,
        "improvement_spearman": 0.06956423573451509,
        "improvement_mse": 0.011392556130886078,
        "improvement_mae": 0.035082101821899414
    },
    {
        "model": "Qwen3-Embedding-8B",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.8399763107299805,
        "spearman_correlation": 0.8210307969517204,
        "mse_loss": 0.14171536266803741,
        "mae": 0.31245917081832886,
        "baseline_pearson": 0.35473158955574036,
        "baseline_spearman": 0.46378230166891415,
        "baseline_mse": 0.6676440238952637,
        "baseline_mae": 0.6364850401878357,
        "improvement_pearson": 0.4852447211742401,
        "improvement_spearman": 0.3572484952828063,
        "improvement_mse": 0.5259286612272263,
        "improvement_mae": 0.32402586936950684
    },
    {
        "model": "Qwen3-Embedding-8B",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.9068217277526855,
        "spearman_correlation": 0.867183009358275,
        "mse_loss": 0.11533339321613312,
        "mae": 0.28775012493133545,
        "baseline_pearson": 0.4321386218070984,
        "baseline_spearman": 0.5111647572788524,
        "baseline_mse": 0.6598177552223206,
        "baseline_mae": 0.5959032773971558,
        "improvement_pearson": 0.47468310594558716,
        "improvement_spearman": 0.3560182520794226,
        "improvement_mse": 0.5444843620061874,
        "improvement_mae": 0.3081531524658203
    },
    {
        "model": "Qwen3-Embedding-8B",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.5616196990013123,
        "spearman_correlation": 0.5480673972848967,
        "mse_loss": 0.024458400905132294,
        "mae": 0.11709094047546387,
        "baseline_pearson": 0.45749902725219727,
        "baseline_spearman": 0.44685567482315164,
        "baseline_mse": 0.04830919951200485,
        "baseline_mae": 0.17485623061656952,
        "improvement_pearson": 0.10412067174911499,
        "improvement_spearman": 0.10121172246174509,
        "improvement_mse": 0.02385079860687256,
        "improvement_mae": 0.05776529014110565
    },
    {
        "model": "Qwen3-Embedding-8B",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.6567656993865967,
        "spearman_correlation": 0.6140730791174231,
        "mse_loss": 0.06717979162931442,
        "mae": 0.19228427112102509,
        "baseline_pearson": 0.5422202348709106,
        "baseline_spearman": 0.5299408109139192,
        "baseline_mse": 0.4307238757610321,
        "baseline_mae": 0.6335455179214478,
        "improvement_pearson": 0.11454546451568604,
        "improvement_spearman": 0.08413226820350395,
        "improvement_mse": 0.3635440841317177,
        "improvement_mae": 0.44126124680042267
    },
    {
        "model": "Qwen3-Embedding-8B",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.7739048004150391,
        "spearman_correlation": 0.7014263839029636,
        "mse_loss": 0.3563307225704193,
        "mae": 0.43641605973243713,
        "baseline_pearson": 0.5303269624710083,
        "baseline_spearman": 0.5734046278376633,
        "baseline_mse": 0.8097094893455505,
        "baseline_mae": 0.5952159762382507,
        "improvement_pearson": 0.24357783794403076,
        "improvement_spearman": 0.1280217560653003,
        "improvement_mse": 0.4533787667751312,
        "improvement_mae": 0.1587999165058136
    },
    {
        "model": "Qwen3-Embedding-8B",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.780505895614624,
        "spearman_correlation": 0.6796285080962353,
        "mse_loss": 0.396475613117218,
        "mae": 0.49477308988571167,
        "baseline_pearson": 0.4782516360282898,
        "baseline_spearman": 0.4954520379295767,
        "baseline_mse": 0.9582951664924622,
        "baseline_mae": 0.702655017375946,
        "improvement_pearson": 0.30225425958633423,
        "improvement_spearman": 0.1841764701666586,
        "improvement_mse": 0.5618195533752441,
        "improvement_mae": 0.20788192749023438
    },
    {
        "model": "Qwen3-Embedding-8B",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.47615206241607666,
        "spearman_correlation": 0.5143906043400481,
        "mse_loss": 0.007285355124622583,
        "mae": 0.07091518491506577,
        "baseline_pearson": 0.5339566469192505,
        "baseline_spearman": 0.5327174746386071,
        "baseline_mse": 0.0052171689458191395,
        "baseline_mae": 0.058514486998319626,
        "improvement_pearson": -0.05780458450317383,
        "improvement_spearman": -0.01832687029855895,
        "improvement_mse": -0.002068186178803444,
        "improvement_mae": -0.01240069791674614
    },
    {
        "model": "Qwen3-Embedding-8B",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.6740978956222534,
        "spearman_correlation": 0.6808784404952558,
        "mse_loss": 0.020031841471791267,
        "mae": 0.11348078399896622,
        "baseline_pearson": 0.6054565906524658,
        "baseline_spearman": 0.6154023082145812,
        "baseline_mse": 0.04138600826263428,
        "baseline_mae": 0.17928119003772736,
        "improvement_pearson": 0.0686413049697876,
        "improvement_spearman": 0.06547613228067461,
        "improvement_mse": 0.02135416679084301,
        "improvement_mae": 0.06580040603876114
    },
    {
        "model": "cohere.embed-multilingual-v3",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.7633247375488281,
        "spearman_correlation": 0.7574473326433752,
        "mse_loss": 0.18595586717128754,
        "mae": 0.3730149567127228,
        "baseline_pearson": 0.41168516874313354,
        "baseline_spearman": 0.4985081900083937,
        "baseline_mse": 0.6779193878173828,
        "baseline_mae": 0.6596677303314209,
        "improvement_pearson": 0.3516395688056946,
        "improvement_spearman": 0.25893914263498147,
        "improvement_mse": 0.4919635206460953,
        "improvement_mae": 0.2866527736186981
    },
    {
        "model": "cohere.embed-multilingual-v3",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.8595728874206543,
        "spearman_correlation": 0.8306928513012591,
        "mse_loss": 0.16006244719028473,
        "mae": 0.3586815297603607,
        "baseline_pearson": 0.5663049221038818,
        "baseline_spearman": 0.6142242678065588,
        "baseline_mse": 0.7275902032852173,
        "baseline_mae": 0.643936038017273,
        "improvement_pearson": 0.29326796531677246,
        "improvement_spearman": 0.21646858349470033,
        "improvement_mse": 0.5675277560949326,
        "improvement_mae": 0.28525450825691223
    },
    {
        "model": "cohere.embed-multilingual-v3",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.549225926399231,
        "spearman_correlation": 0.5309159299131506,
        "mse_loss": 0.023437535390257835,
        "mae": 0.11615528911352158,
        "baseline_pearson": 0.355010986328125,
        "baseline_spearman": 0.3140805262462881,
        "baseline_mse": 0.06817207485437393,
        "baseline_mae": 0.21681912243366241,
        "improvement_pearson": 0.19421494007110596,
        "improvement_spearman": 0.2168354036668625,
        "improvement_mse": 0.044734539464116096,
        "improvement_mae": 0.10066383332014084
    },
    {
        "model": "cohere.embed-multilingual-v3",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.7076656818389893,
        "spearman_correlation": 0.5954015111805891,
        "mse_loss": 0.044551949948072433,
        "mae": 0.16024616360664368,
        "baseline_pearson": 0.5842751264572144,
        "baseline_spearman": 0.5358324453694526,
        "baseline_mse": 0.48011693358421326,
        "baseline_mae": 0.6743825674057007,
        "improvement_pearson": 0.1233905553817749,
        "improvement_spearman": 0.05956906581113652,
        "improvement_mse": 0.4355649836361408,
        "improvement_mae": 0.514136403799057
    },
    {
        "model": "cohere.embed-multilingual-v3",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.832744836807251,
        "spearman_correlation": 0.6843186535862302,
        "mse_loss": 0.2517277002334595,
        "mae": 0.36894911527633667,
        "baseline_pearson": 0.6128219366073608,
        "baseline_spearman": 0.6085898200467367,
        "baseline_mse": 0.7050703167915344,
        "baseline_mae": 0.5434849858283997,
        "improvement_pearson": 0.21992290019989014,
        "improvement_spearman": 0.07572883353949356,
        "improvement_mse": 0.45334261655807495,
        "improvement_mae": 0.174535870552063
    },
    {
        "model": "cohere.embed-multilingual-v3",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.7879235148429871,
        "spearman_correlation": 0.6772324339993908,
        "mse_loss": 0.3772977888584137,
        "mae": 0.48441725969314575,
        "baseline_pearson": 0.5945952534675598,
        "baseline_spearman": 0.5609696448377599,
        "baseline_mse": 0.9448219537734985,
        "baseline_mae": 0.7066500782966614,
        "improvement_pearson": 0.19332826137542725,
        "improvement_spearman": 0.11626278916163091,
        "improvement_mse": 0.5675241649150848,
        "improvement_mae": 0.22223281860351562
    },
    {
        "model": "cohere.embed-multilingual-v3",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.6123145818710327,
        "spearman_correlation": 0.6239047100523338,
        "mse_loss": 0.005188680253922939,
        "mae": 0.05805465579032898,
        "baseline_pearson": 0.4884979724884033,
        "baseline_spearman": 0.47272303025589174,
        "baseline_mse": 0.005412471946328878,
        "baseline_mae": 0.05859474092721939,
        "improvement_pearson": 0.1238166093826294,
        "improvement_spearman": 0.1511816797964421,
        "improvement_mse": 0.0002237916924059391,
        "improvement_mae": 0.0005400851368904114
    },
    {
        "model": "cohere.embed-multilingual-v3",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.7205113768577576,
        "spearman_correlation": 0.7366263690838181,
        "mse_loss": 0.017091114073991776,
        "mae": 0.10879962891340256,
        "baseline_pearson": 0.651875376701355,
        "baseline_spearman": 0.6755613276069153,
        "baseline_mse": 0.03940935805439949,
        "baseline_mae": 0.17473198473453522,
        "improvement_pearson": 0.06863600015640259,
        "improvement_spearman": 0.061065041476902726,
        "improvement_mse": 0.022318243980407715,
        "improvement_mae": 0.06593235582113266
    },
    {
        "model": "gte-Qwen2-1.5B-instruct",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.8185624480247498,
        "spearman_correlation": 0.783361033512336,
        "mse_loss": 0.1645767092704773,
        "mae": 0.354410320520401,
        "baseline_pearson": 0.3496236801147461,
        "baseline_spearman": 0.45278992504550875,
        "baseline_mse": 0.5647153258323669,
        "baseline_mae": 0.6115906834602356,
        "improvement_pearson": 0.46893876791000366,
        "improvement_spearman": 0.33057110846682725,
        "improvement_mse": 0.40013861656188965,
        "improvement_mae": 0.2571803629398346
    },
    {
        "model": "gte-Qwen2-1.5B-instruct",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.8909963369369507,
        "spearman_correlation": 0.8693827490880395,
        "mse_loss": 0.1322769820690155,
        "mae": 0.3130301535129547,
        "baseline_pearson": 0.5435715913772583,
        "baseline_spearman": 0.5953795914760576,
        "baseline_mse": 0.5219523906707764,
        "baseline_mae": 0.5593916177749634,
        "improvement_pearson": 0.3474247455596924,
        "improvement_spearman": 0.2740031576119819,
        "improvement_mse": 0.38967540860176086,
        "improvement_mae": 0.24636146426200867
    },
    {
        "model": "gte-Qwen2-1.5B-instruct",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.6437637209892273,
        "spearman_correlation": 0.6415578262247498,
        "mse_loss": 0.020447608083486557,
        "mae": 0.10944970697164536,
        "baseline_pearson": 0.4941643476486206,
        "baseline_spearman": 0.4985934766935001,
        "baseline_mse": 0.029427412897348404,
        "baseline_mae": 0.12982504069805145,
        "improvement_pearson": 0.1495993733406067,
        "improvement_spearman": 0.14296434953124965,
        "improvement_mse": 0.008979804813861847,
        "improvement_mae": 0.020375333726406097
    },
    {
        "model": "gte-Qwen2-1.5B-instruct",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.6987875699996948,
        "spearman_correlation": 0.6607166176728727,
        "mse_loss": 0.044043075293302536,
        "mae": 0.1584753543138504,
        "baseline_pearson": 0.5857259631156921,
        "baseline_spearman": 0.5711758756330952,
        "baseline_mse": 0.2481904923915863,
        "baseline_mae": 0.4669418931007385,
        "improvement_pearson": 0.11306160688400269,
        "improvement_spearman": 0.08954074203977747,
        "improvement_mse": 0.20414741709828377,
        "improvement_mae": 0.3084665387868881
    },
    {
        "model": "gte-Qwen2-1.5B-instruct",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.8643084764480591,
        "spearman_correlation": 0.7534676155042078,
        "mse_loss": 0.26869338750839233,
        "mae": 0.38835254311561584,
        "baseline_pearson": 0.6496414542198181,
        "baseline_spearman": 0.6418185578707446,
        "baseline_mse": 0.8215478658676147,
        "baseline_mae": 0.6264525055885315,
        "improvement_pearson": 0.21466702222824097,
        "improvement_spearman": 0.11164905763346322,
        "improvement_mse": 0.5528544783592224,
        "improvement_mae": 0.23809996247291565
    },
    {
        "model": "gte-Qwen2-1.5B-instruct",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.7977874279022217,
        "spearman_correlation": 0.6564252014495965,
        "mse_loss": 0.3738993704319,
        "mae": 0.49092280864715576,
        "baseline_pearson": 0.6105221509933472,
        "baseline_spearman": 0.5732307280460925,
        "baseline_mse": 0.8948317170143127,
        "baseline_mae": 0.7010171413421631,
        "improvement_pearson": 0.1872652769088745,
        "improvement_spearman": 0.08319447340350394,
        "improvement_mse": 0.5209323465824127,
        "improvement_mae": 0.21009433269500732
    },
    {
        "model": "gte-Qwen2-1.5B-instruct",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.4596197307109833,
        "spearman_correlation": 0.48989966555183945,
        "mse_loss": 0.006336946506053209,
        "mae": 0.06563041359186172,
        "baseline_pearson": 0.43746986985206604,
        "baseline_spearman": 0.4532130357003966,
        "baseline_mse": 0.011288574896752834,
        "baseline_mae": 0.08344442397356033,
        "improvement_pearson": 0.022149860858917236,
        "improvement_spearman": 0.03668662985144283,
        "improvement_mse": 0.004951628390699625,
        "improvement_mae": 0.01781401038169861
    },
    {
        "model": "gte-Qwen2-1.5B-instruct",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.7075436115264893,
        "spearman_correlation": 0.7138292413382027,
        "mse_loss": 0.014251407235860825,
        "mae": 0.09769327938556671,
        "baseline_pearson": 0.6260946989059448,
        "baseline_spearman": 0.650140798462665,
        "baseline_mse": 0.027126546949148178,
        "baseline_mae": 0.1389124095439911,
        "improvement_pearson": 0.08144891262054443,
        "improvement_spearman": 0.06368844287553765,
        "improvement_mse": 0.012875139713287354,
        "improvement_mae": 0.04121913015842438
    },
    {
        "model": "Qwen3-Embedding-0.6B",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.7870924472808838,
        "spearman_correlation": 0.7719366750511046,
        "mse_loss": 0.20232483744621277,
        "mae": 0.39385101199150085,
        "baseline_pearson": 0.27073466777801514,
        "baseline_spearman": 0.3649048539564697,
        "baseline_mse": 0.7297953367233276,
        "baseline_mae": 0.6741521954536438,
        "improvement_pearson": 0.5163577795028687,
        "improvement_spearman": 0.4070318210946349,
        "improvement_mse": 0.5274704992771149,
        "improvement_mae": 0.28030118346214294
    },
    {
        "model": "Qwen3-Embedding-0.6B",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.848231852054596,
        "spearman_correlation": 0.8234178341608666,
        "mse_loss": 0.18676069378852844,
        "mae": 0.3701452612876892,
        "baseline_pearson": 0.4036916494369507,
        "baseline_spearman": 0.4737248917060248,
        "baseline_mse": 0.6475955247879028,
        "baseline_mae": 0.5906919240951538,
        "improvement_pearson": 0.44454020261764526,
        "improvement_spearman": 0.3496929424548418,
        "improvement_mse": 0.4608348309993744,
        "improvement_mae": 0.2205466628074646
    },
    {
        "model": "Qwen3-Embedding-0.6B",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.5529282093048096,
        "spearman_correlation": 0.5171157876864351,
        "mse_loss": 0.022434992715716362,
        "mae": 0.11527159065008163,
        "baseline_pearson": 0.4742736518383026,
        "baseline_spearman": 0.4407317876795835,
        "baseline_mse": 0.041973937302827835,
        "baseline_mae": 0.16513168811798096,
        "improvement_pearson": 0.07865455746650696,
        "improvement_spearman": 0.07638400000685158,
        "improvement_mse": 0.019538944587111473,
        "improvement_mae": 0.04986009746789932
    },
    {
        "model": "Qwen3-Embedding-0.6B",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.6944748163223267,
        "spearman_correlation": 0.6218960200571064,
        "mse_loss": 0.05140591412782669,
        "mae": 0.16771960258483887,
        "baseline_pearson": 0.5586616396903992,
        "baseline_spearman": 0.5090563213545708,
        "baseline_mse": 0.3963450789451599,
        "baseline_mae": 0.6066691279411316,
        "improvement_pearson": 0.1358131766319275,
        "improvement_spearman": 0.11283969870253563,
        "improvement_mse": 0.3449391648173332,
        "improvement_mae": 0.4389495253562927
    },
    {
        "model": "Qwen3-Embedding-0.6B",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.7374292612075806,
        "spearman_correlation": 0.6276829195526062,
        "mse_loss": 0.3810668885707855,
        "mae": 0.4436852037906647,
        "baseline_pearson": 0.3995856046676636,
        "baseline_spearman": 0.4520717144836539,
        "baseline_mse": 0.7222553491592407,
        "baseline_mae": 0.5325062870979309,
        "improvement_pearson": 0.337843656539917,
        "improvement_spearman": 0.17561120506895234,
        "improvement_mse": 0.3411884605884552,
        "improvement_mae": 0.08882108330726624
    },
    {
        "model": "Qwen3-Embedding-0.6B",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.7034637928009033,
        "spearman_correlation": 0.564409695160521,
        "mse_loss": 0.4929702877998352,
        "mae": 0.5627599358558655,
        "baseline_pearson": 0.3897473216056824,
        "baseline_spearman": 0.3771542699724961,
        "baseline_mse": 0.9296790361404419,
        "baseline_mae": 0.6851403713226318,
        "improvement_pearson": 0.31371647119522095,
        "improvement_spearman": 0.18725542518802485,
        "improvement_mse": 0.4367087483406067,
        "improvement_mae": 0.12238043546676636
    },
    {
        "model": "Qwen3-Embedding-0.6B",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.5683585405349731,
        "spearman_correlation": 0.5904638940432672,
        "mse_loss": 0.0057830470614135265,
        "mae": 0.05975994095206261,
        "baseline_pearson": 0.5283578634262085,
        "baseline_spearman": 0.5347330525894732,
        "baseline_mse": 0.005124067887663841,
        "baseline_mae": 0.05765429884195328,
        "improvement_pearson": 0.04000067710876465,
        "improvement_spearman": 0.05573084145379392,
        "improvement_mse": -0.0006589791737496853,
        "improvement_mae": -0.0021056421101093292
    },
    {
        "model": "Qwen3-Embedding-0.6B",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.7180399894714355,
        "spearman_correlation": 0.6999141869302827,
        "mse_loss": 0.013035432435572147,
        "mae": 0.09343879669904709,
        "baseline_pearson": 0.6644487380981445,
        "baseline_spearman": 0.6587954451433201,
        "baseline_mse": 0.04130151867866516,
        "baseline_mae": 0.1811142861843109,
        "improvement_pearson": 0.053591251373291016,
        "improvement_spearman": 0.04111874178696262,
        "improvement_mse": 0.028266086243093014,
        "improvement_mae": 0.08767548948526382
    },
    {
        "model": "stella_en_1.5B_v5",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.83551025390625,
        "spearman_correlation": 0.7887994725776694,
        "mse_loss": 0.16757063567638397,
        "mae": 0.35295701026916504,
        "baseline_pearson": 0.29369327425956726,
        "baseline_spearman": 0.3952962093169915,
        "baseline_mse": 0.7122378945350647,
        "baseline_mae": 0.6625744700431824,
        "improvement_pearson": 0.5418169796466827,
        "improvement_spearman": 0.39350326326067786,
        "improvement_mse": 0.5446672588586807,
        "improvement_mae": 0.30961745977401733
    },
    {
        "model": "stella_en_1.5B_v5",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.8790180683135986,
        "spearman_correlation": 0.8545924228066503,
        "mse_loss": 0.153229221701622,
        "mae": 0.33709269762039185,
        "baseline_pearson": 0.40181463956832886,
        "baseline_spearman": 0.4802774292555072,
        "baseline_mse": 0.6241834759712219,
        "baseline_mae": 0.5833064913749695,
        "improvement_pearson": 0.4772034287452698,
        "improvement_spearman": 0.37431499355114306,
        "improvement_mse": 0.4709542542695999,
        "improvement_mae": 0.24621379375457764
    },
    {
        "model": "stella_en_1.5B_v5",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.659348726272583,
        "spearman_correlation": 0.6070668380486276,
        "mse_loss": 0.01900624856352806,
        "mae": 0.10413365066051483,
        "baseline_pearson": 0.5738167762756348,
        "baseline_spearman": 0.5244917849149883,
        "baseline_mse": 0.03525429591536522,
        "baseline_mae": 0.14178159832954407,
        "improvement_pearson": 0.08553194999694824,
        "improvement_spearman": 0.08257505313363933,
        "improvement_mse": 0.016248047351837158,
        "improvement_mae": 0.037647947669029236
    },
    {
        "model": "stella_en_1.5B_v5",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.6801258325576782,
        "spearman_correlation": 0.606635614196959,
        "mse_loss": 0.058223165571689606,
        "mae": 0.1796063333749771,
        "baseline_pearson": 0.5895004868507385,
        "baseline_spearman": 0.5523303318554744,
        "baseline_mse": 0.3836214542388916,
        "baseline_mae": 0.5977635383605957,
        "improvement_pearson": 0.0906253457069397,
        "improvement_spearman": 0.05430528234148457,
        "improvement_mse": 0.325398288667202,
        "improvement_mae": 0.4181572049856186
    },
    {
        "model": "stella_en_1.5B_v5",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.8055852055549622,
        "spearman_correlation": 0.663046670279655,
        "mse_loss": 0.35708990693092346,
        "mae": 0.4456453323364258,
        "baseline_pearson": 0.4101034998893738,
        "baseline_spearman": 0.465794361047646,
        "baseline_mse": 0.8361918330192566,
        "baseline_mae": 0.5812641382217407,
        "improvement_pearson": 0.3954817056655884,
        "improvement_spearman": 0.19725230923200904,
        "improvement_mse": 0.47910192608833313,
        "improvement_mae": 0.13561880588531494
    },
    {
        "model": "stella_en_1.5B_v5",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.7508951425552368,
        "spearman_correlation": 0.6305288413959784,
        "mse_loss": 0.4205990731716156,
        "mae": 0.5158722996711731,
        "baseline_pearson": 0.4547400176525116,
        "baseline_spearman": 0.48030350682657075,
        "baseline_mse": 0.8574506640434265,
        "baseline_mae": 0.653262734413147,
        "improvement_pearson": 0.2961551249027252,
        "improvement_spearman": 0.15022533456940768,
        "improvement_mse": 0.4368515908718109,
        "improvement_mae": 0.13739043474197388
    },
    {
        "model": "stella_en_1.5B_v5",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.6193279027938843,
        "spearman_correlation": 0.664847387193191,
        "mse_loss": 0.007175777107477188,
        "mae": 0.06764256954193115,
        "baseline_pearson": 0.5081996917724609,
        "baseline_spearman": 0.49880198668874093,
        "baseline_mse": 0.005446223542094231,
        "baseline_mae": 0.06146332994103432,
        "improvement_pearson": 0.11112821102142334,
        "improvement_spearman": 0.1660454005044501,
        "improvement_mse": -0.0017295535653829575,
        "improvement_mae": -0.006179239600896835
    },
    {
        "model": "stella_en_1.5B_v5",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.7429144382476807,
        "spearman_correlation": 0.7422303360108726,
        "mse_loss": 0.013816970400512218,
        "mae": 0.09476995468139648,
        "baseline_pearson": 0.5980582237243652,
        "baseline_spearman": 0.6448902810492896,
        "baseline_mse": 0.050530873239040375,
        "baseline_mae": 0.1985730677843094,
        "improvement_pearson": 0.14485621452331543,
        "improvement_spearman": 0.09734005496158304,
        "improvement_mse": 0.036713902838528156,
        "improvement_mae": 0.1038031131029129
    },
    {
        "model": "GIST-large-Embedding-v0",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.7640426158905029,
        "spearman_correlation": 0.7686222684876113,
        "mse_loss": 0.20257717370986938,
        "mae": 0.3796573579311371,
        "baseline_pearson": 0.2475363165140152,
        "baseline_spearman": 0.36935508372996984,
        "baseline_mse": 0.5716549158096313,
        "baseline_mae": 0.6121863722801208,
        "improvement_pearson": 0.5165062993764877,
        "improvement_spearman": 0.39926718475764145,
        "improvement_mse": 0.36907774209976196,
        "improvement_mae": 0.23252901434898376
    },
    {
        "model": "GIST-large-Embedding-v0",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.8551720380783081,
        "spearman_correlation": 0.8235175982339192,
        "mse_loss": 0.1866646707057953,
        "mae": 0.3676333725452423,
        "baseline_pearson": 0.44768214225769043,
        "baseline_spearman": 0.49917363505201895,
        "baseline_mse": 0.5622704029083252,
        "baseline_mae": 0.5818170309066772,
        "improvement_pearson": 0.4074898958206177,
        "improvement_spearman": 0.3243439631819003,
        "improvement_mse": 0.3756057322025299,
        "improvement_mae": 0.21418365836143494
    },
    {
        "model": "GIST-large-Embedding-v0",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.5968456864356995,
        "spearman_correlation": 0.5522826963271766,
        "mse_loss": 0.021097663789987564,
        "mae": 0.10980802029371262,
        "baseline_pearson": 0.5606783032417297,
        "baseline_spearman": 0.4882426669996704,
        "baseline_mse": 0.02402401715517044,
        "baseline_mae": 0.12208110839128494,
        "improvement_pearson": 0.03616738319396973,
        "improvement_spearman": 0.06404002932750624,
        "improvement_mse": 0.0029263533651828766,
        "improvement_mae": 0.012273088097572327
    },
    {
        "model": "GIST-large-Embedding-v0",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.6915639042854309,
        "spearman_correlation": 0.5941123187295486,
        "mse_loss": 0.050163332372903824,
        "mae": 0.17005988955497742,
        "baseline_pearson": 0.64356529712677,
        "baseline_spearman": 0.5606046679817795,
        "baseline_mse": 0.22488847374916077,
        "baseline_mae": 0.4473571479320526,
        "improvement_pearson": 0.04799860715866089,
        "improvement_spearman": 0.03350765074776907,
        "improvement_mse": 0.17472514137625694,
        "improvement_mae": 0.2772972583770752
    },
    {
        "model": "GIST-large-Embedding-v0",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.7594029903411865,
        "spearman_correlation": 0.6454127250674919,
        "mse_loss": 0.3696456253528595,
        "mae": 0.4446539282798767,
        "baseline_pearson": 0.45768120884895325,
        "baseline_spearman": 0.45346519244102323,
        "baseline_mse": 0.7494016289710999,
        "baseline_mae": 0.566105842590332,
        "improvement_pearson": 0.3017217814922333,
        "improvement_spearman": 0.1919475326264687,
        "improvement_mse": 0.37975600361824036,
        "improvement_mae": 0.12145191431045532
    },
    {
        "model": "GIST-large-Embedding-v0",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.6736815571784973,
        "spearman_correlation": 0.5545311869171774,
        "mse_loss": 0.49393147230148315,
        "mae": 0.5620582103729248,
        "baseline_pearson": 0.30461329221725464,
        "baseline_spearman": 0.30861257329180997,
        "baseline_mse": 0.9027142524719238,
        "baseline_mae": 0.6960381269454956,
        "improvement_pearson": 0.3690682649612427,
        "improvement_spearman": 0.24591861362536743,
        "improvement_mse": 0.4087827801704407,
        "improvement_mae": 0.1339799165725708
    },
    {
        "model": "GIST-large-Embedding-v0",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.2533535957336426,
        "spearman_correlation": 0.24983788708763432,
        "mse_loss": 0.009464249014854431,
        "mae": 0.08128272742033005,
        "baseline_pearson": 0.37806814908981323,
        "baseline_spearman": 0.35698441093789934,
        "baseline_mse": 0.0083980243653059,
        "baseline_mae": 0.0741361603140831,
        "improvement_pearson": -0.12471455335617065,
        "improvement_spearman": -0.10714652385026502,
        "improvement_mse": -0.0010662246495485306,
        "improvement_mae": -0.007146567106246948
    },
    {
        "model": "GIST-large-Embedding-v0",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.7188237309455872,
        "spearman_correlation": 0.7222946870116349,
        "mse_loss": 0.015298768877983093,
        "mae": 0.09913896769285202,
        "baseline_pearson": 0.619296133518219,
        "baseline_spearman": 0.6207471049004822,
        "baseline_mse": 0.03259238600730896,
        "baseline_mae": 0.15305817127227783,
        "improvement_pearson": 0.09952759742736816,
        "improvement_spearman": 0.10154758211115267,
        "improvement_mse": 0.017293617129325867,
        "improvement_mae": 0.05391920357942581
    },
    {
        "model": "gte-large-en-v1.5",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.7758349180221558,
        "spearman_correlation": 0.7666275097817202,
        "mse_loss": 0.18245691061019897,
        "mae": 0.36461377143859863,
        "baseline_pearson": 0.20388688147068024,
        "baseline_spearman": 0.3099378677305943,
        "baseline_mse": 0.6610548496246338,
        "baseline_mae": 0.6502407193183899,
        "improvement_pearson": 0.5719480365514755,
        "improvement_spearman": 0.45668964205112594,
        "improvement_mse": 0.4785979390144348,
        "improvement_mae": 0.28562694787979126
    },
    {
        "model": "gte-large-en-v1.5",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.8307011127471924,
        "spearman_correlation": 0.8063026033435706,
        "mse_loss": 0.18917948007583618,
        "mae": 0.37575507164001465,
        "baseline_pearson": 0.326055109500885,
        "baseline_spearman": 0.3992829458808791,
        "baseline_mse": 0.5864969491958618,
        "baseline_mae": 0.5774375200271606,
        "improvement_pearson": 0.5046460032463074,
        "improvement_spearman": 0.40701965746269153,
        "improvement_mse": 0.39731746912002563,
        "improvement_mae": 0.201682448387146
    },
    {
        "model": "gte-large-en-v1.5",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.5058112144470215,
        "spearman_correlation": 0.5112032191473742,
        "mse_loss": 0.02644645981490612,
        "mae": 0.11550367623567581,
        "baseline_pearson": 0.4627668857574463,
        "baseline_spearman": 0.4787941552695972,
        "baseline_mse": 0.03547773137688637,
        "baseline_mae": 0.13995429873466492,
        "improvement_pearson": 0.043044328689575195,
        "improvement_spearman": 0.03240906387777703,
        "improvement_mse": 0.009031271561980247,
        "improvement_mae": 0.024450622498989105
    },
    {
        "model": "gte-large-en-v1.5",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.6628636121749878,
        "spearman_correlation": 0.5968694754617222,
        "mse_loss": 0.05737881734967232,
        "mae": 0.17555367946624756,
        "baseline_pearson": 0.5557459592819214,
        "baseline_spearman": 0.5200949241498073,
        "baseline_mse": 0.3487054407596588,
        "baseline_mae": 0.5620614886283875,
        "improvement_pearson": 0.1071176528930664,
        "improvement_spearman": 0.07677455131191491,
        "improvement_mse": 0.2913266234099865,
        "improvement_mae": 0.3865078091621399
    },
    {
        "model": "gte-large-en-v1.5",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.44972896575927734,
        "spearman_correlation": 0.4044707438732013,
        "mse_loss": 0.567654550075531,
        "mae": 0.5428889393806458,
        "baseline_pearson": 0.2730189263820648,
        "baseline_spearman": 0.27802237746794584,
        "baseline_mse": 0.787829577922821,
        "baseline_mae": 0.5659909844398499,
        "improvement_pearson": 0.17671003937721252,
        "improvement_spearman": 0.12644836640525547,
        "improvement_mse": 0.22017502784729004,
        "improvement_mae": 0.0231020450592041
    },
    {
        "model": "gte-large-en-v1.5",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.4141894280910492,
        "spearman_correlation": 0.3662900066675701,
        "mse_loss": 0.7234252095222473,
        "mae": 0.6575598120689392,
        "baseline_pearson": 0.25462478399276733,
        "baseline_spearman": 0.2757736493441212,
        "baseline_mse": 1.0473408699035645,
        "baseline_mae": 0.7485263347625732,
        "improvement_pearson": 0.15956464409828186,
        "improvement_spearman": 0.09051635732344893,
        "improvement_mse": 0.32391566038131714,
        "improvement_mae": 0.09096652269363403
    },
    {
        "model": "gte-large-en-v1.5",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.44868004322052,
        "spearman_correlation": 0.4570601895576617,
        "mse_loss": 0.007421264424920082,
        "mae": 0.0692419707775116,
        "baseline_pearson": 0.4052659273147583,
        "baseline_spearman": 0.38391271014122375,
        "baseline_mse": 0.007065929006785154,
        "baseline_mae": 0.06833110004663467,
        "improvement_pearson": 0.04341411590576172,
        "improvement_spearman": 0.07314747941643795,
        "improvement_mse": -0.00035533541813492775,
        "improvement_mae": -0.0009108707308769226
    },
    {
        "model": "gte-large-en-v1.5",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.7254754304885864,
        "spearman_correlation": 0.7189982918348303,
        "mse_loss": 0.015206935815513134,
        "mae": 0.1019681766629219,
        "baseline_pearson": 0.6360759139060974,
        "baseline_spearman": 0.6704666999361317,
        "baseline_mse": 0.044402118772268295,
        "baseline_mae": 0.18524953722953796,
        "improvement_pearson": 0.08939951658248901,
        "improvement_spearman": 0.0485315918986986,
        "improvement_mse": 0.02919518295675516,
        "improvement_mae": 0.08328136056661606
    },
    {
        "model": "bilingual-embedding-large",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.7952991127967834,
        "spearman_correlation": 0.7763680334728357,
        "mse_loss": 0.18423159420490265,
        "mae": 0.37225574254989624,
        "baseline_pearson": 0.23037682473659515,
        "baseline_spearman": 0.3295553878783797,
        "baseline_mse": 0.5790933966636658,
        "baseline_mae": 0.6128199100494385,
        "improvement_pearson": 0.5649222880601883,
        "improvement_spearman": 0.446812645594456,
        "improvement_mse": 0.3948618024587631,
        "improvement_mae": 0.24056416749954224
    },
    {
        "model": "bilingual-embedding-large",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.8627417087554932,
        "spearman_correlation": 0.840390495268407,
        "mse_loss": 0.157829150557518,
        "mae": 0.3445172607898712,
        "baseline_pearson": 0.3960179090499878,
        "baseline_spearman": 0.4424117739587331,
        "baseline_mse": 0.5197708606719971,
        "baseline_mae": 0.5623157620429993,
        "improvement_pearson": 0.46672379970550537,
        "improvement_spearman": 0.39797872130967393,
        "improvement_mse": 0.36194171011447906,
        "improvement_mae": 0.21779850125312805
    },
    {
        "model": "bilingual-embedding-large",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.6665211319923401,
        "spearman_correlation": 0.6116051661731988,
        "mse_loss": 0.02257865108549595,
        "mae": 0.11844416707754135,
        "baseline_pearson": 0.5792216658592224,
        "baseline_spearman": 0.514639581248266,
        "baseline_mse": 0.029160045087337494,
        "baseline_mae": 0.13656164705753326,
        "improvement_pearson": 0.08729946613311768,
        "improvement_spearman": 0.09696558492493279,
        "improvement_mse": 0.006581394001841545,
        "improvement_mae": 0.018117479979991913
    },
    {
        "model": "bilingual-embedding-large",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.6815229654312134,
        "spearman_correlation": 0.5953207637079957,
        "mse_loss": 0.049138929694890976,
        "mae": 0.16234466433525085,
        "baseline_pearson": 0.6077470779418945,
        "baseline_spearman": 0.5192859759866595,
        "baseline_mse": 0.21986180543899536,
        "baseline_mae": 0.43976807594299316,
        "improvement_pearson": 0.07377588748931885,
        "improvement_spearman": 0.0760347877213362,
        "improvement_mse": 0.17072287574410439,
        "improvement_mae": 0.2774234116077423
    },
    {
        "model": "bilingual-embedding-large",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 100,
        "pearson_correlation": 0.8476958870887756,
        "spearman_correlation": 0.6944021483086852,
        "mse_loss": 0.29958948493003845,
        "mae": 0.4069003462791443,
        "baseline_pearson": 0.5753698348999023,
        "baseline_spearman": 0.5597476980427327,
        "baseline_mse": 0.755480945110321,
        "baseline_mae": 0.580354630947113,
        "improvement_pearson": 0.2723260521888733,
        "improvement_spearman": 0.13465445026595246,
        "improvement_mse": 0.4558914601802826,
        "improvement_mae": 0.17345428466796875
    },
    {
        "model": "bilingual-embedding-large",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 100,
        "pearson_correlation": 0.7369447946548462,
        "spearman_correlation": 0.5518046762051462,
        "mse_loss": 0.4507991671562195,
        "mae": 0.5572382807731628,
        "baseline_pearson": 0.3675463795661926,
        "baseline_spearman": 0.3643351465142022,
        "baseline_mse": 0.8652837872505188,
        "baseline_mae": 0.7069140672683716,
        "improvement_pearson": 0.36939841508865356,
        "improvement_spearman": 0.187469529690944,
        "improvement_mse": 0.4144846200942993,
        "improvement_mae": 0.14967578649520874
    },
    {
        "model": "bilingual-embedding-large",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.41371339559555054,
        "spearman_correlation": 0.45873576373070807,
        "mse_loss": 0.006909481715410948,
        "mae": 0.06802213191986084,
        "baseline_pearson": 0.4574582874774933,
        "baseline_spearman": 0.46586028733652596,
        "baseline_mse": 0.010940148495137691,
        "baseline_mae": 0.08236394822597504,
        "improvement_pearson": -0.04374489188194275,
        "improvement_spearman": -0.00712452360581789,
        "improvement_mse": 0.004030666779726744,
        "improvement_mae": 0.014341816306114197
    },
    {
        "model": "bilingual-embedding-large",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 100,
        "pearson_correlation": 0.7854598164558411,
        "spearman_correlation": 0.7730888081298246,
        "mse_loss": 0.013389220461249352,
        "mae": 0.09689205139875412,
        "baseline_pearson": 0.7000971436500549,
        "baseline_spearman": 0.7111606434499821,
        "baseline_mse": 0.027204355224967003,
        "baseline_mae": 0.13918375968933105,
        "improvement_pearson": 0.08536267280578613,
        "improvement_spearman": 0.06192816467984252,
        "improvement_mse": 0.013815134763717651,
        "improvement_mae": 0.042291708290576935
    }
]