[
    {
        "model": "bge-m3",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.8167417049407959,
        "spearman_correlation": 0.7763302628744686,
        "mse_loss": 0.1750638782978058,
        "mae": 0.36844053864479065,
        "baseline_pearson": 0.15973970293998718,
        "baseline_spearman": 0.20818277181330005,
        "baseline_mse": 0.6377458572387695,
        "baseline_mae": 0.6411760449409485,
        "improvement_pearson": 0.6570020020008087,
        "improvement_spearman": 0.5681474910611686,
        "improvement_mse": 0.46268197894096375,
        "improvement_mae": 0.27273550629615784
    },
    {
        "model": "bge-m3",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.8682464957237244,
        "spearman_correlation": 0.8304481628299852,
        "mse_loss": 0.16046521067619324,
        "mae": 0.36453500390052795,
        "baseline_pearson": 0.23316854238510132,
        "baseline_spearman": 0.2719172077100528,
        "baseline_mse": 0.587729275226593,
        "baseline_mae": 0.6074572205543518,
        "improvement_pearson": 0.635077953338623,
        "improvement_spearman": 0.5585309551199324,
        "improvement_mse": 0.4272640645503998,
        "improvement_mae": 0.24292221665382385
    },
    {
        "model": "bge-m3",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.6912800073623657,
        "spearman_correlation": 0.6730556976274501,
        "mse_loss": 0.018522722646594048,
        "mae": 0.10258590430021286,
        "baseline_pearson": 0.5962152481079102,
        "baseline_spearman": 0.5696336532264592,
        "baseline_mse": 0.02054264023900032,
        "baseline_mae": 0.10972718894481659,
        "improvement_pearson": 0.09506475925445557,
        "improvement_spearman": 0.1034220444009909,
        "improvement_mse": 0.002019917592406273,
        "improvement_mae": 0.007141284644603729
    },
    {
        "model": "bge-m3",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.7476900815963745,
        "spearman_correlation": 0.610925114178263,
        "mse_loss": 0.03069557622075081,
        "mae": 0.13008831441402435,
        "baseline_pearson": 0.5622110366821289,
        "baseline_spearman": 0.46470123933086505,
        "baseline_mse": 0.2508981227874756,
        "baseline_mae": 0.4730938971042633,
        "improvement_pearson": 0.1854790449142456,
        "improvement_spearman": 0.14622387484739796,
        "improvement_mse": 0.22020254656672478,
        "improvement_mae": 0.34300558269023895
    },
    {
        "model": "bge-m3",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.8359866738319397,
        "spearman_correlation": 0.6401780939521515,
        "mse_loss": 0.27667418122291565,
        "mae": 0.39231571555137634,
        "baseline_pearson": 0.5418388843536377,
        "baseline_spearman": 0.53005402780743,
        "baseline_mse": 0.7344924807548523,
        "baseline_mae": 0.5818088054656982,
        "improvement_pearson": 0.294147789478302,
        "improvement_spearman": 0.11012406614472148,
        "improvement_mse": 0.45781829953193665,
        "improvement_mae": 0.1894930899143219
    },
    {
        "model": "bge-m3",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.7929596900939941,
        "spearman_correlation": 0.5816324304355686,
        "mse_loss": 0.3603166341781616,
        "mae": 0.5127500891685486,
        "baseline_pearson": 0.4490911066532135,
        "baseline_spearman": 0.403468627381486,
        "baseline_mse": 0.9179061055183411,
        "baseline_mae": 0.7369837164878845,
        "improvement_pearson": 0.34386858344078064,
        "improvement_spearman": 0.17816380305408258,
        "improvement_mse": 0.5575894713401794,
        "improvement_mae": 0.22423362731933594
    },
    {
        "model": "bge-m3",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.6377509236335754,
        "spearman_correlation": 0.6388182090912121,
        "mse_loss": 0.010698005557060242,
        "mae": 0.09082353115081787,
        "baseline_pearson": 0.6702603101730347,
        "baseline_spearman": 0.6565664062934031,
        "baseline_mse": 0.005963595118373632,
        "baseline_mae": 0.06105095520615578,
        "improvement_pearson": -0.03250938653945923,
        "improvement_spearman": -0.017748197202191007,
        "improvement_mse": -0.004734410438686609,
        "improvement_mae": -0.029772575944662094
    },
    {
        "model": "bge-m3",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.8179858922958374,
        "spearman_correlation": 0.8065918787143863,
        "mse_loss": 0.00920816883444786,
        "mae": 0.0792563334107399,
        "baseline_pearson": 0.7798171043395996,
        "baseline_spearman": 0.7602876572856767,
        "baseline_mse": 0.020976657047867775,
        "baseline_mae": 0.12570060789585114,
        "improvement_pearson": 0.03816878795623779,
        "improvement_spearman": 0.0463042214287096,
        "improvement_mse": 0.011768488213419914,
        "improvement_mae": 0.04644427448511124
    },
    {
        "model": "snowflake-arctic-embed-l-v2.0",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.7848075032234192,
        "spearman_correlation": 0.780248275626632,
        "mse_loss": 0.18859869241714478,
        "mae": 0.371460497379303,
        "baseline_pearson": 0.1582985669374466,
        "baseline_spearman": 0.2708860450427659,
        "baseline_mse": 0.5816980600357056,
        "baseline_mae": 0.6053963899612427,
        "improvement_pearson": 0.6265089362859726,
        "improvement_spearman": 0.5093622305838661,
        "improvement_mse": 0.3930993676185608,
        "improvement_mae": 0.2339358925819397
    },
    {
        "model": "snowflake-arctic-embed-l-v2.0",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.8422869443893433,
        "spearman_correlation": 0.8114316686837033,
        "mse_loss": 0.18137811124324799,
        "mae": 0.38206639885902405,
        "baseline_pearson": 0.20453613996505737,
        "baseline_spearman": 0.2824481391884123,
        "baseline_mse": 0.5510227084159851,
        "baseline_mae": 0.5925363302230835,
        "improvement_pearson": 0.6377508044242859,
        "improvement_spearman": 0.528983529495291,
        "improvement_mse": 0.3696445971727371,
        "improvement_mae": 0.21046993136405945
    },
    {
        "model": "snowflake-arctic-embed-l-v2.0",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.6552296280860901,
        "spearman_correlation": 0.5924369402492101,
        "mse_loss": 0.01978434808552265,
        "mae": 0.10541923344135284,
        "baseline_pearson": 0.5571725964546204,
        "baseline_spearman": 0.5150472087145538,
        "baseline_mse": 0.025408169254660606,
        "baseline_mae": 0.120329350233078,
        "improvement_pearson": 0.09805703163146973,
        "improvement_spearman": 0.07738973153465634,
        "improvement_mse": 0.005623821169137955,
        "improvement_mae": 0.014910116791725159
    },
    {
        "model": "snowflake-arctic-embed-l-v2.0",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.7253174781799316,
        "spearman_correlation": 0.6390882154253686,
        "mse_loss": 0.03317959979176521,
        "mae": 0.13154324889183044,
        "baseline_pearson": 0.6136019229888916,
        "baseline_spearman": 0.5632056133584451,
        "baseline_mse": 0.20397210121154785,
        "baseline_mae": 0.42629149556159973,
        "improvement_pearson": 0.11171555519104004,
        "improvement_spearman": 0.07588260206692354,
        "improvement_mse": 0.17079250141978264,
        "improvement_mae": 0.2947482466697693
    },
    {
        "model": "snowflake-arctic-embed-l-v2.0",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.7195550799369812,
        "spearman_correlation": 0.5689956831102113,
        "mse_loss": 0.39334696531295776,
        "mae": 0.48527058959007263,
        "baseline_pearson": 0.30938464403152466,
        "baseline_spearman": 0.3362600860784734,
        "baseline_mse": 0.6880159378051758,
        "baseline_mae": 0.5778502225875854,
        "improvement_pearson": 0.41017043590545654,
        "improvement_spearman": 0.2327355970317379,
        "improvement_mse": 0.294668972492218,
        "improvement_mae": 0.09257963299751282
    },
    {
        "model": "snowflake-arctic-embed-l-v2.0",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.6943601369857788,
        "spearman_correlation": 0.5768056781843415,
        "mse_loss": 0.5196889042854309,
        "mae": 0.5868502855300903,
        "baseline_pearson": 0.2852861285209656,
        "baseline_spearman": 0.29213910324230036,
        "baseline_mse": 0.8816540241241455,
        "baseline_mae": 0.700792133808136,
        "improvement_pearson": 0.40907400846481323,
        "improvement_spearman": 0.2846665749420411,
        "improvement_mse": 0.3619651198387146,
        "improvement_mae": 0.11394184827804565
    },
    {
        "model": "snowflake-arctic-embed-l-v2.0",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.44959017634391785,
        "spearman_correlation": 0.4290207668974099,
        "mse_loss": 0.006838461384177208,
        "mae": 0.06810936331748962,
        "baseline_pearson": 0.4838234782218933,
        "baseline_spearman": 0.4563246258291759,
        "baseline_mse": 0.01303885318338871,
        "baseline_mae": 0.08952221274375916,
        "improvement_pearson": -0.034233301877975464,
        "improvement_spearman": -0.027303858931765956,
        "improvement_mse": 0.006200391799211502,
        "improvement_mae": 0.02141284942626953
    },
    {
        "model": "snowflake-arctic-embed-l-v2.0",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.7304627895355225,
        "spearman_correlation": 0.7258448900462254,
        "mse_loss": 0.013544626533985138,
        "mae": 0.09450516104698181,
        "baseline_pearson": 0.6920145750045776,
        "baseline_spearman": 0.684269077729331,
        "baseline_mse": 0.018966494128108025,
        "baseline_mae": 0.11314374208450317,
        "improvement_pearson": 0.038448214530944824,
        "improvement_spearman": 0.041575812316894445,
        "improvement_mse": 0.005421867594122887,
        "improvement_mae": 0.018638581037521362
    },
    {
        "model": "text-embedding-3-large",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.8753418922424316,
        "spearman_correlation": 0.8815287281566015,
        "mse_loss": 0.11518202722072601,
        "mae": 0.2776574492454529,
        "baseline_pearson": 0.38390418887138367,
        "baseline_spearman": 0.5275940523970295,
        "baseline_mse": 0.4332510828971863,
        "baseline_mae": 0.5122458338737488,
        "improvement_pearson": 0.491437703371048,
        "improvement_spearman": 0.35393467575957205,
        "improvement_mse": 0.31806905567646027,
        "improvement_mae": 0.2345883846282959
    },
    {
        "model": "text-embedding-3-large",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.8999866247177124,
        "spearman_correlation": 0.8628434877085779,
        "mse_loss": 0.10908268392086029,
        "mae": 0.2755368649959564,
        "baseline_pearson": 0.5453597903251648,
        "baseline_spearman": 0.6196835435581195,
        "baseline_mse": 0.42889606952667236,
        "baseline_mae": 0.5125240683555603,
        "improvement_pearson": 0.3546268343925476,
        "improvement_spearman": 0.24315994415045838,
        "improvement_mse": 0.3198133856058121,
        "improvement_mae": 0.23698720335960388
    },
    {
        "model": "text-embedding-3-large",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.5810624957084656,
        "spearman_correlation": 0.5898267206789871,
        "mse_loss": 0.0252754595130682,
        "mae": 0.11890190839767456,
        "baseline_pearson": 0.47140419483184814,
        "baseline_spearman": 0.44703592838209166,
        "baseline_mse": 0.0497690886259079,
        "baseline_mae": 0.18258681893348694,
        "improvement_pearson": 0.10965830087661743,
        "improvement_spearman": 0.14279079229689545,
        "improvement_mse": 0.0244936291128397,
        "improvement_mae": 0.06368491053581238
    },
    {
        "model": "text-embedding-3-large",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.7499756813049316,
        "spearman_correlation": 0.6312822604574496,
        "mse_loss": 0.039444949477910995,
        "mae": 0.1499156504869461,
        "baseline_pearson": 0.6468614935874939,
        "baseline_spearman": 0.5869379460606993,
        "baseline_mse": 0.1543693244457245,
        "baseline_mae": 0.3529493510723114,
        "improvement_pearson": 0.10311418771743774,
        "improvement_spearman": 0.04434431439675035,
        "improvement_mse": 0.11492437496781349,
        "improvement_mae": 0.2030337005853653
    },
    {
        "model": "text-embedding-3-large",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.8667752146720886,
        "spearman_correlation": 0.7282432082116986,
        "mse_loss": 0.2553899586200714,
        "mae": 0.36923953890800476,
        "baseline_pearson": 0.5108879804611206,
        "baseline_spearman": 0.5411215712374186,
        "baseline_mse": 0.7593469023704529,
        "baseline_mae": 0.5717947483062744,
        "improvement_pearson": 0.355887234210968,
        "improvement_spearman": 0.18712163697428008,
        "improvement_mse": 0.5039569437503815,
        "improvement_mae": 0.20255520939826965
    },
    {
        "model": "text-embedding-3-large",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.7934343814849854,
        "spearman_correlation": 0.6501744514574188,
        "mse_loss": 0.3563153147697449,
        "mae": 0.4781727194786072,
        "baseline_pearson": 0.49777892231941223,
        "baseline_spearman": 0.52471168457915,
        "baseline_mse": 0.8166581392288208,
        "baseline_mae": 0.6546531915664673,
        "improvement_pearson": 0.2956554591655731,
        "improvement_spearman": 0.12546276687826885,
        "improvement_mse": 0.4603428244590759,
        "improvement_mae": 0.1764804720878601
    },
    {
        "model": "text-embedding-3-large",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.33413293957710266,
        "spearman_correlation": 0.4060614006822298,
        "mse_loss": 0.008295825682580471,
        "mae": 0.07384997606277466,
        "baseline_pearson": 0.5547794103622437,
        "baseline_spearman": 0.5698641096012178,
        "baseline_mse": 0.00751098059117794,
        "baseline_mae": 0.06567588448524475,
        "improvement_pearson": -0.220646470785141,
        "improvement_spearman": -0.16380270891898802,
        "improvement_mse": -0.0007848450914025307,
        "improvement_mae": -0.008174091577529907
    },
    {
        "model": "text-embedding-3-large",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.7195248603820801,
        "spearman_correlation": 0.7260009932592084,
        "mse_loss": 0.015519443899393082,
        "mae": 0.10411100834608078,
        "baseline_pearson": 0.6293452978134155,
        "baseline_spearman": 0.6544097900823072,
        "baseline_mse": 0.022554825991392136,
        "baseline_mae": 0.12441129237413406,
        "improvement_pearson": 0.09017956256866455,
        "improvement_spearman": 0.07159120317690126,
        "improvement_mse": 0.007035382091999054,
        "improvement_mae": 0.020300284028053284
    },
    {
        "model": "e5-mistral-7b-instruct",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.8534048795700073,
        "spearman_correlation": 0.8315759057595691,
        "mse_loss": 0.134769007563591,
        "mae": 0.30951929092407227,
        "baseline_pearson": 0.4662332832813263,
        "baseline_spearman": 0.5765938426251161,
        "baseline_mse": 0.7548919916152954,
        "baseline_mae": 0.6750190258026123,
        "improvement_pearson": 0.38717159628868103,
        "improvement_spearman": 0.25498206313445293,
        "improvement_mse": 0.6201229840517044,
        "improvement_mae": 0.36549973487854004
    },
    {
        "model": "e5-mistral-7b-instruct",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.9047982692718506,
        "spearman_correlation": 0.8763320838791541,
        "mse_loss": 0.11726950854063034,
        "mae": 0.28762099146842957,
        "baseline_pearson": 0.5824797749519348,
        "baseline_spearman": 0.6408426078089147,
        "baseline_mse": 0.7011623382568359,
        "baseline_mae": 0.6025184392929077,
        "improvement_pearson": 0.32231849431991577,
        "improvement_spearman": 0.2354894760702394,
        "improvement_mse": 0.5838928297162056,
        "improvement_mae": 0.31489744782447815
    },
    {
        "model": "e5-mistral-7b-instruct",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.4421526789665222,
        "spearman_correlation": 0.48563853231870086,
        "mse_loss": 0.04117441922426224,
        "mae": 0.14438503980636597,
        "baseline_pearson": 0.34502503275871277,
        "baseline_spearman": 0.34907267092080413,
        "baseline_mse": 0.0898447260260582,
        "baseline_mae": 0.25366321206092834,
        "improvement_pearson": 0.09712764620780945,
        "improvement_spearman": 0.13656586139789673,
        "improvement_mse": 0.04867030680179596,
        "improvement_mae": 0.10927817225456238
    },
    {
        "model": "e5-mistral-7b-instruct",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.6697282791137695,
        "spearman_correlation": 0.5992140742433877,
        "mse_loss": 0.06880294531583786,
        "mae": 0.19609372317790985,
        "baseline_pearson": 0.5334892868995667,
        "baseline_spearman": 0.49747543264458793,
        "baseline_mse": 0.5376843214035034,
        "baseline_mae": 0.7160141468048096,
        "improvement_pearson": 0.13623899221420288,
        "improvement_spearman": 0.10173864159879975,
        "improvement_mse": 0.46888137608766556,
        "improvement_mae": 0.5199204236268997
    },
    {
        "model": "e5-mistral-7b-instruct",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.8627122640609741,
        "spearman_correlation": 0.7486625017769569,
        "mse_loss": 0.23364634811878204,
        "mae": 0.33777186274528503,
        "baseline_pearson": 0.7769416570663452,
        "baseline_spearman": 0.7345946711881939,
        "baseline_mse": 0.8397605419158936,
        "baseline_mae": 0.5865262746810913,
        "improvement_pearson": 0.0857706069946289,
        "improvement_spearman": 0.014067830588763042,
        "improvement_mse": 0.6061141937971115,
        "improvement_mae": 0.24875441193580627
    },
    {
        "model": "e5-mistral-7b-instruct",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.8087843060493469,
        "spearman_correlation": 0.7029902326323879,
        "mse_loss": 0.33919191360473633,
        "mae": 0.4621124267578125,
        "baseline_pearson": 0.7113547921180725,
        "baseline_spearman": 0.6589031477969893,
        "baseline_mse": 1.0075945854187012,
        "baseline_mae": 0.7313043475151062,
        "improvement_pearson": 0.09742951393127441,
        "improvement_spearman": 0.04408708483539858,
        "improvement_mse": 0.6684026718139648,
        "improvement_mae": 0.2691919207572937
    },
    {
        "model": "e5-mistral-7b-instruct",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.3416900038719177,
        "spearman_correlation": 0.4010817897976644,
        "mse_loss": 0.010222749784588814,
        "mae": 0.08698803931474686,
        "baseline_pearson": 0.32635748386383057,
        "baseline_spearman": 0.3377210857898421,
        "baseline_mse": 0.0069861444644629955,
        "baseline_mae": 0.07279045879840851,
        "improvement_pearson": 0.015332520008087158,
        "improvement_spearman": 0.06336070400782229,
        "improvement_mse": -0.0032366053201258183,
        "improvement_mae": -0.014197580516338348
    },
    {
        "model": "e5-mistral-7b-instruct",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.3817923665046692,
        "spearman_correlation": 0.5668326224523714,
        "mse_loss": 0.055294252932071686,
        "mae": 0.20984004437923431,
        "baseline_pearson": 0.5149005651473999,
        "baseline_spearman": 0.5761223958022088,
        "baseline_mse": 0.05343888700008392,
        "baseline_mae": 0.20678319036960602,
        "improvement_pearson": -0.1331081986427307,
        "improvement_spearman": -0.009289773349837382,
        "improvement_mse": -0.0018553659319877625,
        "improvement_mae": -0.003056854009628296
    },
    {
        "model": "gte-Qwen2-7B-instruct",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.8820031881332397,
        "spearman_correlation": 0.8667436891302532,
        "mse_loss": 0.12292147427797318,
        "mae": 0.2944506108760834,
        "baseline_pearson": 0.2786006033420563,
        "baseline_spearman": 0.38650374172388186,
        "baseline_mse": 0.562837541103363,
        "baseline_mae": 0.5921853184700012,
        "improvement_pearson": 0.6034025847911835,
        "improvement_spearman": 0.4802399474063714,
        "improvement_mse": 0.43991606682538986,
        "improvement_mae": 0.29773470759391785
    },
    {
        "model": "gte-Qwen2-7B-instruct",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.899215042591095,
        "spearman_correlation": 0.8652850034245568,
        "mse_loss": 0.11465584486722946,
        "mae": 0.28341206908226013,
        "baseline_pearson": 0.42841988801956177,
        "baseline_spearman": 0.4927323840904588,
        "baseline_mse": 0.4773149788379669,
        "baseline_mae": 0.5383591651916504,
        "improvement_pearson": 0.4707951545715332,
        "improvement_spearman": 0.37255261933409806,
        "improvement_mse": 0.36265913397073746,
        "improvement_mae": 0.25494709610939026
    },
    {
        "model": "gte-Qwen2-7B-instruct",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.6520655751228333,
        "spearman_correlation": 0.6274246148870047,
        "mse_loss": 0.020253906026482582,
        "mae": 0.10918727517127991,
        "baseline_pearson": 0.5469287633895874,
        "baseline_spearman": 0.521750510786725,
        "baseline_mse": 0.031150352209806442,
        "baseline_mae": 0.14182965457439423,
        "improvement_pearson": 0.10513681173324585,
        "improvement_spearman": 0.10567410410027978,
        "improvement_mse": 0.01089644618332386,
        "improvement_mae": 0.03264237940311432
    },
    {
        "model": "gte-Qwen2-7B-instruct",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.7472953796386719,
        "spearman_correlation": 0.6322811789859912,
        "mse_loss": 0.038722772151231766,
        "mae": 0.15014010667800903,
        "baseline_pearson": 0.663348913192749,
        "baseline_spearman": 0.6097386979328613,
        "baseline_mse": 0.19402913749217987,
        "baseline_mae": 0.4122171401977539,
        "improvement_pearson": 0.08394646644592285,
        "improvement_spearman": 0.022542481053129948,
        "improvement_mse": 0.1553063653409481,
        "improvement_mae": 0.2620770335197449
    },
    {
        "model": "gte-Qwen2-7B-instruct",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.7918187975883484,
        "spearman_correlation": 0.6252098408970774,
        "mse_loss": 0.3087313771247864,
        "mae": 0.4320572018623352,
        "baseline_pearson": 0.3662661612033844,
        "baseline_spearman": 0.4005442643058114,
        "baseline_mse": 0.6998403668403625,
        "baseline_mae": 0.5549520254135132,
        "improvement_pearson": 0.425552636384964,
        "improvement_spearman": 0.22466557659126601,
        "improvement_mse": 0.39110898971557617,
        "improvement_mae": 0.12289482355117798
    },
    {
        "model": "gte-Qwen2-7B-instruct",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.7458872199058533,
        "spearman_correlation": 0.641772532438856,
        "mse_loss": 0.448049932718277,
        "mae": 0.5415164232254028,
        "baseline_pearson": 0.3751322031021118,
        "baseline_spearman": 0.4133967463304241,
        "baseline_mse": 0.9342625141143799,
        "baseline_mae": 0.702225387096405,
        "improvement_pearson": 0.37075501680374146,
        "improvement_spearman": 0.2283757861084319,
        "improvement_mse": 0.4862125813961029,
        "improvement_mae": 0.1607089638710022
    },
    {
        "model": "gte-Qwen2-7B-instruct",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.33311694860458374,
        "spearman_correlation": 0.4231389237658195,
        "mse_loss": 0.00852444488555193,
        "mae": 0.07691088318824768,
        "baseline_pearson": 0.464449942111969,
        "baseline_spearman": 0.4576033067034078,
        "baseline_mse": 0.007510032504796982,
        "baseline_mae": 0.06729768216609955,
        "improvement_pearson": -0.13133299350738525,
        "improvement_spearman": -0.0344643829375883,
        "improvement_mse": -0.0010144123807549477,
        "improvement_mae": -0.009613201022148132
    },
    {
        "model": "gte-Qwen2-7B-instruct",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.6201751828193665,
        "spearman_correlation": 0.644904308637369,
        "mse_loss": 0.022396311163902283,
        "mae": 0.12069994956254959,
        "baseline_pearson": 0.5908670425415039,
        "baseline_spearman": 0.6334577811730294,
        "baseline_mse": 0.02814641408622265,
        "baseline_mae": 0.1419629603624344,
        "improvement_pearson": 0.02930814027786255,
        "improvement_spearman": 0.011446527464339606,
        "improvement_mse": 0.005750102922320366,
        "improvement_mae": 0.021263010799884796
    },
    {
        "model": "text-embedding-3-small",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.8525168895721436,
        "spearman_correlation": 0.8258678364197235,
        "mse_loss": 0.13716842234134674,
        "mae": 0.31554970145225525,
        "baseline_pearson": 0.3677995800971985,
        "baseline_spearman": 0.4832523715839505,
        "baseline_mse": 0.4762258231639862,
        "baseline_mae": 0.5417832136154175,
        "improvement_pearson": 0.48471730947494507,
        "improvement_spearman": 0.342615464835773,
        "improvement_mse": 0.33905740082263947,
        "improvement_mae": 0.22623351216316223
    },
    {
        "model": "text-embedding-3-small",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.868083119392395,
        "spearman_correlation": 0.8622923329337661,
        "mse_loss": 0.14879058301448822,
        "mae": 0.32896146178245544,
        "baseline_pearson": 0.43792271614074707,
        "baseline_spearman": 0.4921078216967896,
        "baseline_mse": 0.5051460862159729,
        "baseline_mae": 0.5562031865119934,
        "improvement_pearson": 0.43016040325164795,
        "improvement_spearman": 0.37018451123697643,
        "improvement_mse": 0.3563555032014847,
        "improvement_mae": 0.22724172472953796
    },
    {
        "model": "text-embedding-3-small",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.6282318234443665,
        "spearman_correlation": 0.6242510158970751,
        "mse_loss": 0.020928803831338882,
        "mae": 0.1130356714129448,
        "baseline_pearson": 0.5547934174537659,
        "baseline_spearman": 0.4897978031273359,
        "baseline_mse": 0.045024484395980835,
        "baseline_mae": 0.17574019730091095,
        "improvement_pearson": 0.07343840599060059,
        "improvement_spearman": 0.1344532127697392,
        "improvement_mse": 0.024095680564641953,
        "improvement_mae": 0.06270452588796616
    },
    {
        "model": "text-embedding-3-small",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.7663266062736511,
        "spearman_correlation": 0.6198013202257419,
        "mse_loss": 0.03598407655954361,
        "mae": 0.14025713503360748,
        "baseline_pearson": 0.6688700914382935,
        "baseline_spearman": 0.5625510926879027,
        "baseline_mse": 0.15041442215442657,
        "baseline_mae": 0.3533961772918701,
        "improvement_pearson": 0.09745651483535767,
        "improvement_spearman": 0.05725022753783915,
        "improvement_mse": 0.11443034559488297,
        "improvement_mae": 0.21313904225826263
    },
    {
        "model": "text-embedding-3-small",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.8008311986923218,
        "spearman_correlation": 0.6313089785171881,
        "mse_loss": 0.3325327932834625,
        "mae": 0.452256977558136,
        "baseline_pearson": 0.36624813079833984,
        "baseline_spearman": 0.35890042903093794,
        "baseline_mse": 0.7783519625663757,
        "baseline_mae": 0.615327000617981,
        "improvement_pearson": 0.43458306789398193,
        "improvement_spearman": 0.2724085494862502,
        "improvement_mse": 0.4458191692829132,
        "improvement_mae": 0.16307002305984497
    },
    {
        "model": "text-embedding-3-small",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.7805043458938599,
        "spearman_correlation": 0.6553178071978472,
        "mse_loss": 0.4252205491065979,
        "mae": 0.5425642728805542,
        "baseline_pearson": 0.35147348046302795,
        "baseline_spearman": 0.35738332354840413,
        "baseline_mse": 0.9223597049713135,
        "baseline_mae": 0.7183400392532349,
        "improvement_pearson": 0.4290308654308319,
        "improvement_spearman": 0.297934483649443,
        "improvement_mse": 0.4971391558647156,
        "improvement_mae": 0.17577576637268066
    },
    {
        "model": "text-embedding-3-small",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.34755030274391174,
        "spearman_correlation": 0.41028011422349137,
        "mse_loss": 0.00945133063942194,
        "mae": 0.08185230195522308,
        "baseline_pearson": 0.5512392520904541,
        "baseline_spearman": 0.5275209724552495,
        "baseline_mse": 0.008859864436089993,
        "baseline_mae": 0.07064881920814514,
        "improvement_pearson": -0.20368894934654236,
        "improvement_spearman": -0.11724085823175817,
        "improvement_mse": -0.0005914662033319473,
        "improvement_mae": -0.011203482747077942
    },
    {
        "model": "text-embedding-3-small",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.7655097246170044,
        "spearman_correlation": 0.7764094220503747,
        "mse_loss": 0.013561045750975609,
        "mae": 0.09473631531000137,
        "baseline_pearson": 0.7102078795433044,
        "baseline_spearman": 0.7305962862909218,
        "baseline_mse": 0.022753849625587463,
        "baseline_mae": 0.12740375101566315,
        "improvement_pearson": 0.05530184507369995,
        "improvement_spearman": 0.045813135759452894,
        "improvement_mse": 0.009192803874611855,
        "improvement_mae": 0.032667435705661774
    },
    {
        "model": "gte-base-en-v1.5",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.7818725109100342,
        "spearman_correlation": 0.7370570335774352,
        "mse_loss": 0.18005341291427612,
        "mae": 0.3625454008579254,
        "baseline_pearson": 0.20786842703819275,
        "baseline_spearman": 0.3144097314095419,
        "baseline_mse": 0.5374537706375122,
        "baseline_mae": 0.5800958275794983,
        "improvement_pearson": 0.5740040838718414,
        "improvement_spearman": 0.4226473021678933,
        "improvement_mse": 0.3574003577232361,
        "improvement_mae": 0.21755042672157288
    },
    {
        "model": "gte-base-en-v1.5",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.8423984050750732,
        "spearman_correlation": 0.8274116076138462,
        "mse_loss": 0.1760556697845459,
        "mae": 0.37580832839012146,
        "baseline_pearson": 0.26807844638824463,
        "baseline_spearman": 0.3257477660097899,
        "baseline_mse": 0.5427600145339966,
        "baseline_mae": 0.5826422572135925,
        "improvement_pearson": 0.5743199586868286,
        "improvement_spearman": 0.5016638416040564,
        "improvement_mse": 0.3667043447494507,
        "improvement_mae": 0.20683392882347107
    },
    {
        "model": "gte-base-en-v1.5",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.550184965133667,
        "spearman_correlation": 0.5280556311535368,
        "mse_loss": 0.024172797799110413,
        "mae": 0.11722128093242645,
        "baseline_pearson": 0.4942755699157715,
        "baseline_spearman": 0.471997673523133,
        "baseline_mse": 0.030079999938607216,
        "baseline_mae": 0.1358872950077057,
        "improvement_pearson": 0.05590939521789551,
        "improvement_spearman": 0.05605795763040383,
        "improvement_mse": 0.005907202139496803,
        "improvement_mae": 0.018666014075279236
    },
    {
        "model": "gte-base-en-v1.5",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.6724802255630493,
        "spearman_correlation": 0.5785561599252691,
        "mse_loss": 0.0435120090842247,
        "mae": 0.15261371433734894,
        "baseline_pearson": 0.5562558174133301,
        "baseline_spearman": 0.4896573161663739,
        "baseline_mse": 0.2316681444644928,
        "baseline_mae": 0.4517885744571686,
        "improvement_pearson": 0.11622440814971924,
        "improvement_spearman": 0.08889884375889517,
        "improvement_mse": 0.1881561353802681,
        "improvement_mae": 0.29917486011981964
    },
    {
        "model": "gte-base-en-v1.5",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.7596170902252197,
        "spearman_correlation": 0.6417518285080595,
        "mse_loss": 0.36213088035583496,
        "mae": 0.45741212368011475,
        "baseline_pearson": 0.41862601041793823,
        "baseline_spearman": 0.4169713279301061,
        "baseline_mse": 0.7605031132698059,
        "baseline_mae": 0.5909589529037476,
        "improvement_pearson": 0.3409910798072815,
        "improvement_spearman": 0.22478050057795335,
        "improvement_mse": 0.39837223291397095,
        "improvement_mae": 0.1335468292236328
    },
    {
        "model": "gte-base-en-v1.5",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.7375820875167847,
        "spearman_correlation": 0.6021465176552467,
        "mse_loss": 0.4133007228374481,
        "mae": 0.517910361289978,
        "baseline_pearson": 0.4205778241157532,
        "baseline_spearman": 0.38640056491663977,
        "baseline_mse": 0.8272859454154968,
        "baseline_mae": 0.6598346829414368,
        "improvement_pearson": 0.3170042634010315,
        "improvement_spearman": 0.21574595273860697,
        "improvement_mse": 0.4139852225780487,
        "improvement_mae": 0.14192432165145874
    },
    {
        "model": "gte-base-en-v1.5",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.45981770753860474,
        "spearman_correlation": 0.46763008477871976,
        "mse_loss": 0.008682195097208023,
        "mae": 0.07935507595539093,
        "baseline_pearson": 0.4617167115211487,
        "baseline_spearman": 0.47818842431582576,
        "baseline_mse": 0.010969712398946285,
        "baseline_mae": 0.08007732033729553,
        "improvement_pearson": -0.0018990039825439453,
        "improvement_spearman": -0.010558339537105998,
        "improvement_mse": 0.002287517301738262,
        "improvement_mae": 0.000722244381904602
    },
    {
        "model": "gte-base-en-v1.5",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.7176822423934937,
        "spearman_correlation": 0.723963053407984,
        "mse_loss": 0.017262237146496773,
        "mae": 0.10658469796180725,
        "baseline_pearson": 0.6256612539291382,
        "baseline_spearman": 0.6436564950695024,
        "baseline_mse": 0.02835063263773918,
        "baseline_mae": 0.13926760852336884,
        "improvement_pearson": 0.09202098846435547,
        "improvement_spearman": 0.08030655833848155,
        "improvement_mse": 0.011088395491242409,
        "improvement_mae": 0.032682910561561584
    },
    {
        "model": "Qwen3-Embedding-8B",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.839657187461853,
        "spearman_correlation": 0.8238874063285878,
        "mse_loss": 0.14983013272285461,
        "mae": 0.32157206535339355,
        "baseline_pearson": 0.3534708321094513,
        "baseline_spearman": 0.4696468729696509,
        "baseline_mse": 0.7213625311851501,
        "baseline_mae": 0.6681334376335144,
        "improvement_pearson": 0.48618635535240173,
        "improvement_spearman": 0.3542405333589369,
        "improvement_mse": 0.5715323984622955,
        "improvement_mae": 0.34656137228012085
    },
    {
        "model": "Qwen3-Embedding-8B",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.8948401212692261,
        "spearman_correlation": 0.8637997056504633,
        "mse_loss": 0.11955347657203674,
        "mae": 0.2935904860496521,
        "baseline_pearson": 0.4792229235172272,
        "baseline_spearman": 0.5539495016410443,
        "baseline_mse": 0.6283475756645203,
        "baseline_mae": 0.5782155394554138,
        "improvement_pearson": 0.4156171977519989,
        "improvement_spearman": 0.309850204009419,
        "improvement_mse": 0.5087940990924835,
        "improvement_mae": 0.2846250534057617
    },
    {
        "model": "Qwen3-Embedding-8B",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.5103687047958374,
        "spearman_correlation": 0.49514350251549055,
        "mse_loss": 0.030290883034467697,
        "mae": 0.12912693619728088,
        "baseline_pearson": 0.4148767590522766,
        "baseline_spearman": 0.37319599016771793,
        "baseline_mse": 0.05350630357861519,
        "baseline_mae": 0.18499113619327545,
        "improvement_pearson": 0.09549194574356079,
        "improvement_spearman": 0.12194751234777262,
        "improvement_mse": 0.02321542054414749,
        "improvement_mae": 0.05586419999599457
    },
    {
        "model": "Qwen3-Embedding-8B",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.6590917110443115,
        "spearman_correlation": 0.5612937658018851,
        "mse_loss": 0.059889163821935654,
        "mae": 0.17574013769626617,
        "baseline_pearson": 0.48280519247055054,
        "baseline_spearman": 0.44986620754631423,
        "baseline_mse": 0.4334930181503296,
        "baseline_mae": 0.6371827721595764,
        "improvement_pearson": 0.176286518573761,
        "improvement_spearman": 0.11142755825557082,
        "improvement_mse": 0.37360385432839394,
        "improvement_mae": 0.46144263446331024
    },
    {
        "model": "Qwen3-Embedding-8B",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.8460127711296082,
        "spearman_correlation": 0.7324968475392177,
        "mse_loss": 0.24735870957374573,
        "mae": 0.34645697474479675,
        "baseline_pearson": 0.4991837739944458,
        "baseline_spearman": 0.5286284872640389,
        "baseline_mse": 0.7646529078483582,
        "baseline_mae": 0.5493870973587036,
        "improvement_pearson": 0.34682899713516235,
        "improvement_spearman": 0.20386836027517885,
        "improvement_mse": 0.5172941982746124,
        "improvement_mae": 0.20293012261390686
    },
    {
        "model": "Qwen3-Embedding-8B",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.7624551653862,
        "spearman_correlation": 0.6438285409793338,
        "mse_loss": 0.39777931571006775,
        "mae": 0.4979407787322998,
        "baseline_pearson": 0.48535341024398804,
        "baseline_spearman": 0.48462857365566475,
        "baseline_mse": 0.9428007006645203,
        "baseline_mae": 0.695711076259613,
        "improvement_pearson": 0.2771017551422119,
        "improvement_spearman": 0.1591999673236691,
        "improvement_mse": 0.5450213849544525,
        "improvement_mae": 0.19777029752731323
    },
    {
        "model": "Qwen3-Embedding-8B",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.5159540772438049,
        "spearman_correlation": 0.5439518216869076,
        "mse_loss": 0.010565640404820442,
        "mae": 0.0887417420744896,
        "baseline_pearson": 0.43677306175231934,
        "baseline_spearman": 0.46782164246269403,
        "baseline_mse": 0.006911384407430887,
        "baseline_mae": 0.06725653260946274,
        "improvement_pearson": 0.0791810154914856,
        "improvement_spearman": 0.07613017922421356,
        "improvement_mse": -0.003654255997389555,
        "improvement_mae": -0.021485209465026855
    },
    {
        "model": "Qwen3-Embedding-8B",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.5477805733680725,
        "spearman_correlation": 0.5992204254414427,
        "mse_loss": 0.030215812847018242,
        "mae": 0.14546166360378265,
        "baseline_pearson": 0.5780947208404541,
        "baseline_spearman": 0.6126700875454898,
        "baseline_mse": 0.03949093446135521,
        "baseline_mae": 0.17501625418663025,
        "improvement_pearson": -0.030314147472381592,
        "improvement_spearman": -0.013449662104047078,
        "improvement_mse": 0.009275121614336967,
        "improvement_mae": 0.029554590582847595
    },
    {
        "model": "cohere.embed-multilingual-v3",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.8032699227333069,
        "spearman_correlation": 0.7664544757981056,
        "mse_loss": 0.168256938457489,
        "mae": 0.35380029678344727,
        "baseline_pearson": 0.4003354012966156,
        "baseline_spearman": 0.4796722454834489,
        "baseline_mse": 0.7521534562110901,
        "baseline_mae": 0.6998725533485413,
        "improvement_pearson": 0.4029345214366913,
        "improvement_spearman": 0.28678223031465666,
        "improvement_mse": 0.5838965177536011,
        "improvement_mae": 0.346072256565094
    },
    {
        "model": "cohere.embed-multilingual-v3",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.8632687330245972,
        "spearman_correlation": 0.8194951538516029,
        "mse_loss": 0.15170693397521973,
        "mae": 0.348346471786499,
        "baseline_pearson": 0.5324727296829224,
        "baseline_spearman": 0.5730794313930754,
        "baseline_mse": 0.6333878040313721,
        "baseline_mae": 0.5874015688896179,
        "improvement_pearson": 0.3307960033416748,
        "improvement_spearman": 0.2464157224585275,
        "improvement_mse": 0.48168087005615234,
        "improvement_mae": 0.2390550971031189
    },
    {
        "model": "cohere.embed-multilingual-v3",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.5827558040618896,
        "spearman_correlation": 0.5736724356185668,
        "mse_loss": 0.024922480806708336,
        "mae": 0.11783570796251297,
        "baseline_pearson": 0.43795740604400635,
        "baseline_spearman": 0.39591017483271007,
        "baseline_mse": 0.0632966160774231,
        "baseline_mae": 0.21131642162799835,
        "improvement_pearson": 0.1447983980178833,
        "improvement_spearman": 0.17776226078585677,
        "improvement_mse": 0.03837413527071476,
        "improvement_mae": 0.09348071366548538
    },
    {
        "model": "cohere.embed-multilingual-v3",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.6898716688156128,
        "spearman_correlation": 0.5973546273562598,
        "mse_loss": 0.04297897219657898,
        "mae": 0.15143951773643494,
        "baseline_pearson": 0.5434583425521851,
        "baseline_spearman": 0.5205803077005048,
        "baseline_mse": 0.47034338116645813,
        "baseline_mae": 0.6639533638954163,
        "improvement_pearson": 0.14641332626342773,
        "improvement_spearman": 0.07677431965575499,
        "improvement_mse": 0.42736440896987915,
        "improvement_mae": 0.5125138461589813
    },
    {
        "model": "cohere.embed-multilingual-v3",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.8367241621017456,
        "spearman_correlation": 0.6572116714493329,
        "mse_loss": 0.23884503543376923,
        "mae": 0.34344902634620667,
        "baseline_pearson": 0.5744507312774658,
        "baseline_spearman": 0.5521139856613241,
        "baseline_mse": 0.7113387584686279,
        "baseline_mae": 0.5291474461555481,
        "improvement_pearson": 0.2622734308242798,
        "improvement_spearman": 0.10509768578800882,
        "improvement_mse": 0.4724937230348587,
        "improvement_mae": 0.18569841980934143
    },
    {
        "model": "cohere.embed-multilingual-v3",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.7624789476394653,
        "spearman_correlation": 0.6028340101569986,
        "mse_loss": 0.3722054660320282,
        "mae": 0.4886960983276367,
        "baseline_pearson": 0.5044101476669312,
        "baseline_spearman": 0.4815320446985781,
        "baseline_mse": 0.900180459022522,
        "baseline_mae": 0.6945531368255615,
        "improvement_pearson": 0.2580687999725342,
        "improvement_spearman": 0.12130196545842048,
        "improvement_mse": 0.5279749929904938,
        "improvement_mae": 0.2058570384979248
    },
    {
        "model": "cohere.embed-multilingual-v3",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.5888857245445251,
        "spearman_correlation": 0.5516047956088401,
        "mse_loss": 0.008905424736440182,
        "mae": 0.08115794509649277,
        "baseline_pearson": 0.4893227815628052,
        "baseline_spearman": 0.47258525094723275,
        "baseline_mse": 0.00529819168150425,
        "baseline_mae": 0.057073257863521576,
        "improvement_pearson": 0.09956294298171997,
        "improvement_spearman": 0.07901954466160738,
        "improvement_mse": -0.003607233054935932,
        "improvement_mae": -0.02408468723297119
    },
    {
        "model": "cohere.embed-multilingual-v3",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.780485987663269,
        "spearman_correlation": 0.7936339185167727,
        "mse_loss": 0.012180141173303127,
        "mae": 0.0902903601527214,
        "baseline_pearson": 0.6827864050865173,
        "baseline_spearman": 0.7053377763536852,
        "baseline_mse": 0.037172093987464905,
        "baseline_mae": 0.17012079060077667,
        "improvement_pearson": 0.09769958257675171,
        "improvement_spearman": 0.08829614216308745,
        "improvement_mse": 0.024991952814161777,
        "improvement_mae": 0.07983043044805527
    },
    {
        "model": "gte-Qwen2-1.5B-instruct",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.8380128145217896,
        "spearman_correlation": 0.8275252036167683,
        "mse_loss": 0.1472754180431366,
        "mae": 0.32952526211738586,
        "baseline_pearson": 0.38780391216278076,
        "baseline_spearman": 0.49287573052352773,
        "baseline_mse": 0.571999728679657,
        "baseline_mae": 0.6095676422119141,
        "improvement_pearson": 0.4502089023590088,
        "improvement_spearman": 0.33464947309324056,
        "improvement_mse": 0.4247243106365204,
        "improvement_mae": 0.2800423800945282
    },
    {
        "model": "gte-Qwen2-1.5B-instruct",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.8923452496528625,
        "spearman_correlation": 0.871664976349212,
        "mse_loss": 0.12061590701341629,
        "mae": 0.30482783913612366,
        "baseline_pearson": 0.5505849123001099,
        "baseline_spearman": 0.601918413659523,
        "baseline_mse": 0.4849012494087219,
        "baseline_mae": 0.5402029752731323,
        "improvement_pearson": 0.3417603373527527,
        "improvement_spearman": 0.269746562689689,
        "improvement_mse": 0.36428534239530563,
        "improvement_mae": 0.23537513613700867
    },
    {
        "model": "gte-Qwen2-1.5B-instruct",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.6721614003181458,
        "spearman_correlation": 0.6722588577191534,
        "mse_loss": 0.020822841674089432,
        "mae": 0.1047714352607727,
        "baseline_pearson": 0.5746607780456543,
        "baseline_spearman": 0.5474489417198866,
        "baseline_mse": 0.02634563110768795,
        "baseline_mae": 0.12331826984882355,
        "improvement_pearson": 0.09750062227249146,
        "improvement_spearman": 0.12480991599926683,
        "improvement_mse": 0.005522789433598518,
        "improvement_mae": 0.018546834588050842
    },
    {
        "model": "gte-Qwen2-1.5B-instruct",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.7095282077789307,
        "spearman_correlation": 0.6184310605990007,
        "mse_loss": 0.04804757237434387,
        "mae": 0.16191764175891876,
        "baseline_pearson": 0.614404559135437,
        "baseline_spearman": 0.582000372145075,
        "baseline_mse": 0.2583571672439575,
        "baseline_mae": 0.48136767745018005,
        "improvement_pearson": 0.09512364864349365,
        "improvement_spearman": 0.03643068845392561,
        "improvement_mse": 0.21030959486961365,
        "improvement_mae": 0.3194500356912613
    },
    {
        "model": "gte-Qwen2-1.5B-instruct",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.8258868455886841,
        "spearman_correlation": 0.6599383432412989,
        "mse_loss": 0.2445213794708252,
        "mae": 0.3625692129135132,
        "baseline_pearson": 0.6631579995155334,
        "baseline_spearman": 0.6497143392654467,
        "baseline_mse": 0.6296736001968384,
        "baseline_mae": 0.5278793573379517,
        "improvement_pearson": 0.16272884607315063,
        "improvement_spearman": 0.010224003975852103,
        "improvement_mse": 0.3851522207260132,
        "improvement_mae": 0.16531014442443848
    },
    {
        "model": "gte-Qwen2-1.5B-instruct",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.8048607110977173,
        "spearman_correlation": 0.6942642770343952,
        "mse_loss": 0.3676130175590515,
        "mae": 0.49615052342414856,
        "baseline_pearson": 0.5810784697532654,
        "baseline_spearman": 0.5663255372956555,
        "baseline_mse": 0.8934751152992249,
        "baseline_mae": 0.7138756513595581,
        "improvement_pearson": 0.2237822413444519,
        "improvement_spearman": 0.1279387397387397,
        "improvement_mse": 0.5258620977401733,
        "improvement_mae": 0.21772512793540955
    },
    {
        "model": "gte-Qwen2-1.5B-instruct",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.21817371249198914,
        "spearman_correlation": 0.2891307681196458,
        "mse_loss": 0.00881461426615715,
        "mae": 0.0792350023984909,
        "baseline_pearson": 0.34486496448516846,
        "baseline_spearman": 0.36324403604484495,
        "baseline_mse": 0.012212620116770267,
        "baseline_mae": 0.08557296544313431,
        "improvement_pearson": -0.12669125199317932,
        "improvement_spearman": -0.07411326792519918,
        "improvement_mse": 0.0033980058506131172,
        "improvement_mae": 0.006337963044643402
    },
    {
        "model": "gte-Qwen2-1.5B-instruct",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.704207181930542,
        "spearman_correlation": 0.715439186860532,
        "mse_loss": 0.015709636732935905,
        "mae": 0.10184299200773239,
        "baseline_pearson": 0.6342175006866455,
        "baseline_spearman": 0.6574277752444448,
        "baseline_mse": 0.022673575207591057,
        "baseline_mae": 0.12468543648719788,
        "improvement_pearson": 0.06998968124389648,
        "improvement_spearman": 0.05801141161608714,
        "improvement_mse": 0.006963938474655151,
        "improvement_mae": 0.022842444479465485
    },
    {
        "model": "Qwen3-Embedding-0.6B",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.8256738781929016,
        "spearman_correlation": 0.8199184003452163,
        "mse_loss": 0.175861194729805,
        "mae": 0.3608543574810028,
        "baseline_pearson": 0.29615914821624756,
        "baseline_spearman": 0.411861885785818,
        "baseline_mse": 0.7153921127319336,
        "baseline_mae": 0.6643909811973572,
        "improvement_pearson": 0.529514729976654,
        "improvement_spearman": 0.40805651455939834,
        "improvement_mse": 0.5395309180021286,
        "improvement_mae": 0.30353662371635437
    },
    {
        "model": "Qwen3-Embedding-0.6B",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.8550394773483276,
        "spearman_correlation": 0.8353904131312951,
        "mse_loss": 0.16762380301952362,
        "mae": 0.35421693325042725,
        "baseline_pearson": 0.429982453584671,
        "baseline_spearman": 0.502101230854602,
        "baseline_mse": 0.593342125415802,
        "baseline_mae": 0.5671414136886597,
        "improvement_pearson": 0.4250570237636566,
        "improvement_spearman": 0.33328918227669313,
        "improvement_mse": 0.4257183223962784,
        "improvement_mae": 0.21292448043823242
    },
    {
        "model": "Qwen3-Embedding-0.6B",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.5671717524528503,
        "spearman_correlation": 0.5532616105016629,
        "mse_loss": 0.02926495485007763,
        "mae": 0.1315324902534485,
        "baseline_pearson": 0.4377949833869934,
        "baseline_spearman": 0.4456969149318969,
        "baseline_mse": 0.049258168786764145,
        "baseline_mae": 0.1706210821866989,
        "improvement_pearson": 0.12937676906585693,
        "improvement_spearman": 0.107564695569766,
        "improvement_mse": 0.019993213936686516,
        "improvement_mae": 0.03908859193325043
    },
    {
        "model": "Qwen3-Embedding-0.6B",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.6663260459899902,
        "spearman_correlation": 0.594681068140161,
        "mse_loss": 0.04978480190038681,
        "mae": 0.16021515429019928,
        "baseline_pearson": 0.5182719230651855,
        "baseline_spearman": 0.4987066612613395,
        "baseline_mse": 0.39669927954673767,
        "baseline_mae": 0.6053574085235596,
        "improvement_pearson": 0.1480541229248047,
        "improvement_spearman": 0.09597440687882147,
        "improvement_mse": 0.34691447764635086,
        "improvement_mae": 0.4451422542333603
    },
    {
        "model": "Qwen3-Embedding-0.6B",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.75847989320755,
        "spearman_correlation": 0.6622345870704465,
        "mse_loss": 0.4514036178588867,
        "mae": 0.4928989112377167,
        "baseline_pearson": 0.43988198041915894,
        "baseline_spearman": 0.4499612127120925,
        "baseline_mse": 0.9075639843940735,
        "baseline_mae": 0.6260170936584473,
        "improvement_pearson": 0.3185979127883911,
        "improvement_spearman": 0.21227337435835397,
        "improvement_mse": 0.45616036653518677,
        "improvement_mae": 0.1331181824207306
    },
    {
        "model": "Qwen3-Embedding-0.6B",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.7439848780632019,
        "spearman_correlation": 0.6410453523945464,
        "mse_loss": 0.48110759258270264,
        "mae": 0.5645923018455505,
        "baseline_pearson": 0.4183480441570282,
        "baseline_spearman": 0.41699925291930573,
        "baseline_mse": 1.013694405555725,
        "baseline_mae": 0.7429088950157166,
        "improvement_pearson": 0.3256368339061737,
        "improvement_spearman": 0.22404609947524068,
        "improvement_mse": 0.5325868129730225,
        "improvement_mae": 0.17831659317016602
    },
    {
        "model": "Qwen3-Embedding-0.6B",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.5158151388168335,
        "spearman_correlation": 0.5409237880420893,
        "mse_loss": 0.008327781222760677,
        "mae": 0.07509104162454605,
        "baseline_pearson": 0.4936339855194092,
        "baseline_spearman": 0.4489103212257914,
        "baseline_mse": 0.005413820967078209,
        "baseline_mae": 0.060492657124996185,
        "improvement_pearson": 0.022181153297424316,
        "improvement_spearman": 0.0920134668162979,
        "improvement_mse": -0.0029139602556824684,
        "improvement_mae": -0.014598384499549866
    },
    {
        "model": "Qwen3-Embedding-0.6B",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.7619969248771667,
        "spearman_correlation": 0.7735169772136021,
        "mse_loss": 0.014962983317673206,
        "mae": 0.0993230938911438,
        "baseline_pearson": 0.6780532598495483,
        "baseline_spearman": 0.718308956265048,
        "baseline_mse": 0.04281383380293846,
        "baseline_mae": 0.18271975219249725,
        "improvement_pearson": 0.08394366502761841,
        "improvement_spearman": 0.05520802094855415,
        "improvement_mse": 0.027850850485265255,
        "improvement_mae": 0.08339665830135345
    },
    {
        "model": "stella_en_1.5B_v5",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.8155917525291443,
        "spearman_correlation": 0.811174168490973,
        "mse_loss": 0.1561143845319748,
        "mae": 0.3394497334957123,
        "baseline_pearson": 0.2752102017402649,
        "baseline_spearman": 0.4028305516467127,
        "baseline_mse": 0.644049882888794,
        "baseline_mae": 0.6398035287857056,
        "improvement_pearson": 0.5403815507888794,
        "improvement_spearman": 0.4083436168442603,
        "improvement_mse": 0.48793549835681915,
        "improvement_mae": 0.3003537952899933
    },
    {
        "model": "stella_en_1.5B_v5",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.8578766584396362,
        "spearman_correlation": 0.8506345342443328,
        "mse_loss": 0.1382652372121811,
        "mae": 0.3256399631500244,
        "baseline_pearson": 0.42164677381515503,
        "baseline_spearman": 0.48252243487989616,
        "baseline_mse": 0.549272358417511,
        "baseline_mae": 0.561725914478302,
        "improvement_pearson": 0.4362298846244812,
        "improvement_spearman": 0.3681120993644366,
        "improvement_mse": 0.4110071212053299,
        "improvement_mae": 0.2360859513282776
    },
    {
        "model": "stella_en_1.5B_v5",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.6003305912017822,
        "spearman_correlation": 0.6082052952879458,
        "mse_loss": 0.02407805249094963,
        "mae": 0.11925096064805984,
        "baseline_pearson": 0.48816728591918945,
        "baseline_spearman": 0.5021952210740983,
        "baseline_mse": 0.04011157527565956,
        "baseline_mae": 0.15271739661693573,
        "improvement_pearson": 0.11216330528259277,
        "improvement_spearman": 0.10601007421384745,
        "improvement_mse": 0.01603352278470993,
        "improvement_mae": 0.033466435968875885
    },
    {
        "model": "stella_en_1.5B_v5",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.7037855982780457,
        "spearman_correlation": 0.6043878894954282,
        "mse_loss": 0.04914103075861931,
        "mae": 0.16158193349838257,
        "baseline_pearson": 0.5877649784088135,
        "baseline_spearman": 0.5427959160989858,
        "baseline_mse": 0.38104531168937683,
        "baseline_mae": 0.5980381965637207,
        "improvement_pearson": 0.11602061986923218,
        "improvement_spearman": 0.0615919733964424,
        "improvement_mse": 0.3319042809307575,
        "improvement_mae": 0.43645626306533813
    },
    {
        "model": "stella_en_1.5B_v5",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.8340252637863159,
        "spearman_correlation": 0.7050492113231887,
        "mse_loss": 0.32767894864082336,
        "mae": 0.43534591794013977,
        "baseline_pearson": 0.45429468154907227,
        "baseline_spearman": 0.5113577341789659,
        "baseline_mse": 0.8172290325164795,
        "baseline_mae": 0.5859703421592712,
        "improvement_pearson": 0.37973058223724365,
        "improvement_spearman": 0.19369147714422275,
        "improvement_mse": 0.48955008387565613,
        "improvement_mae": 0.15062442421913147
    },
    {
        "model": "stella_en_1.5B_v5",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.7405056357383728,
        "spearman_correlation": 0.5741040217904054,
        "mse_loss": 0.4246581792831421,
        "mae": 0.5238714814186096,
        "baseline_pearson": 0.34541136026382446,
        "baseline_spearman": 0.3792664757623296,
        "baseline_mse": 0.9140188694000244,
        "baseline_mae": 0.6790529489517212,
        "improvement_pearson": 0.39509427547454834,
        "improvement_spearman": 0.19483754602807585,
        "improvement_mse": 0.4893606901168823,
        "improvement_mae": 0.15518146753311157
    },
    {
        "model": "stella_en_1.5B_v5",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.3757070302963257,
        "spearman_correlation": 0.459021100234447,
        "mse_loss": 0.009460270404815674,
        "mae": 0.08207538723945618,
        "baseline_pearson": 0.39237838983535767,
        "baseline_spearman": 0.4231411460127334,
        "baseline_mse": 0.006451830733567476,
        "baseline_mae": 0.06650987267494202,
        "improvement_pearson": -0.016671359539031982,
        "improvement_spearman": 0.035879954221713584,
        "improvement_mse": -0.0030084396712481976,
        "improvement_mae": -0.01556551456451416
    },
    {
        "model": "stella_en_1.5B_v5",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.677402138710022,
        "spearman_correlation": 0.6624704076286587,
        "mse_loss": 0.015535455197095871,
        "mae": 0.10269884765148163,
        "baseline_pearson": 0.536152720451355,
        "baseline_spearman": 0.56755478651552,
        "baseline_mse": 0.0480019673705101,
        "baseline_mae": 0.19588465988636017,
        "improvement_pearson": 0.141249418258667,
        "improvement_spearman": 0.09491562111313867,
        "improvement_mse": 0.03246651217341423,
        "improvement_mae": 0.09318581223487854
    },
    {
        "model": "GIST-large-Embedding-v0",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.7839037179946899,
        "spearman_correlation": 0.7585048927281576,
        "mse_loss": 0.17780029773712158,
        "mae": 0.35903942584991455,
        "baseline_pearson": 0.2965526580810547,
        "baseline_spearman": 0.42672738555760037,
        "baseline_mse": 0.5316956639289856,
        "baseline_mae": 0.5898733139038086,
        "improvement_pearson": 0.48735105991363525,
        "improvement_spearman": 0.3317775071705572,
        "improvement_mse": 0.353895366191864,
        "improvement_mae": 0.23083388805389404
    },
    {
        "model": "GIST-large-Embedding-v0",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.8594940900802612,
        "spearman_correlation": 0.8367178237445873,
        "mse_loss": 0.16020168364048004,
        "mae": 0.3479267358779907,
        "baseline_pearson": 0.4450659155845642,
        "baseline_spearman": 0.4879726908415175,
        "baseline_mse": 0.534817636013031,
        "baseline_mae": 0.5699748396873474,
        "improvement_pearson": 0.414428174495697,
        "improvement_spearman": 0.34874513290306974,
        "improvement_mse": 0.37461595237255096,
        "improvement_mae": 0.2220481038093567
    },
    {
        "model": "GIST-large-Embedding-v0",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.6101294755935669,
        "spearman_correlation": 0.5699592281471739,
        "mse_loss": 0.021706921979784966,
        "mae": 0.1104670912027359,
        "baseline_pearson": 0.5242546200752258,
        "baseline_spearman": 0.43334932630855266,
        "baseline_mse": 0.02793169766664505,
        "baseline_mae": 0.1301504671573639,
        "improvement_pearson": 0.08587485551834106,
        "improvement_spearman": 0.13660990183862126,
        "improvement_mse": 0.0062247756868600845,
        "improvement_mae": 0.01968337595462799
    },
    {
        "model": "GIST-large-Embedding-v0",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.6658128499984741,
        "spearman_correlation": 0.6099511726338236,
        "mse_loss": 0.05567396804690361,
        "mae": 0.1660863310098648,
        "baseline_pearson": 0.6062623262405396,
        "baseline_spearman": 0.5454374072630754,
        "baseline_mse": 0.23698070645332336,
        "baseline_mae": 0.4607645869255066,
        "improvement_pearson": 0.05955052375793457,
        "improvement_spearman": 0.06451376537074816,
        "improvement_mse": 0.18130673840641975,
        "improvement_mae": 0.2946782559156418
    },
    {
        "model": "GIST-large-Embedding-v0",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.7542676329612732,
        "spearman_correlation": 0.6352576770622244,
        "mse_loss": 0.3582712411880493,
        "mae": 0.43144944310188293,
        "baseline_pearson": 0.42798367142677307,
        "baseline_spearman": 0.4330263745573187,
        "baseline_mse": 0.7471503615379333,
        "baseline_mae": 0.5624980926513672,
        "improvement_pearson": 0.3262839615345001,
        "improvement_spearman": 0.20223130250490567,
        "improvement_mse": 0.38887912034988403,
        "improvement_mae": 0.13104864954948425
    },
    {
        "model": "GIST-large-Embedding-v0",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.6489912271499634,
        "spearman_correlation": 0.5320947393163393,
        "mse_loss": 0.4834084212779999,
        "mae": 0.5487231612205505,
        "baseline_pearson": 0.28790152072906494,
        "baseline_spearman": 0.29140817083840387,
        "baseline_mse": 0.861672580242157,
        "baseline_mae": 0.6666445732116699,
        "improvement_pearson": 0.36108970642089844,
        "improvement_spearman": 0.24068656847793546,
        "improvement_mse": 0.3782641589641571,
        "improvement_mae": 0.11792141199111938
    },
    {
        "model": "GIST-large-Embedding-v0",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.2985227108001709,
        "spearman_correlation": 0.3311090123223591,
        "mse_loss": 0.008271348662674427,
        "mae": 0.0759890004992485,
        "baseline_pearson": 0.35450154542922974,
        "baseline_spearman": 0.35515727952532805,
        "baseline_mse": 0.009333617053925991,
        "baseline_mae": 0.0770777091383934,
        "improvement_pearson": -0.05597883462905884,
        "improvement_spearman": -0.02404826720296893,
        "improvement_mse": 0.001062268391251564,
        "improvement_mae": 0.0010887086391448975
    },
    {
        "model": "GIST-large-Embedding-v0",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.6962051391601562,
        "spearman_correlation": 0.7091437932957728,
        "mse_loss": 0.01757458969950676,
        "mae": 0.11020633578300476,
        "baseline_pearson": 0.610398530960083,
        "baseline_spearman": 0.6368471130490547,
        "baseline_mse": 0.032172754406929016,
        "baseline_mae": 0.15314865112304688,
        "improvement_pearson": 0.08580660820007324,
        "improvement_spearman": 0.07229668024671809,
        "improvement_mse": 0.014598164707422256,
        "improvement_mae": 0.042942315340042114
    },
    {
        "model": "gte-large-en-v1.5",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.802136242389679,
        "spearman_correlation": 0.7922334719748564,
        "mse_loss": 0.1766146570444107,
        "mae": 0.3638845384120941,
        "baseline_pearson": 0.2056678831577301,
        "baseline_spearman": 0.3082549666117147,
        "baseline_mse": 0.6865060925483704,
        "baseline_mae": 0.6585366129875183,
        "improvement_pearson": 0.5964683592319489,
        "improvement_spearman": 0.4839785053631417,
        "improvement_mse": 0.5098914355039597,
        "improvement_mae": 0.2946520745754242
    },
    {
        "model": "gte-large-en-v1.5",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.844697117805481,
        "spearman_correlation": 0.8164509108295415,
        "mse_loss": 0.16157498955726624,
        "mae": 0.3486672043800354,
        "baseline_pearson": 0.2950087785720825,
        "baseline_spearman": 0.3714980194357472,
        "baseline_mse": 0.5670413970947266,
        "baseline_mae": 0.5696555972099304,
        "improvement_pearson": 0.5496883392333984,
        "improvement_spearman": 0.4449528913937943,
        "improvement_mse": 0.4054664075374603,
        "improvement_mae": 0.22098839282989502
    },
    {
        "model": "gte-large-en-v1.5",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.6486298441886902,
        "spearman_correlation": 0.6305317802375905,
        "mse_loss": 0.02212519943714142,
        "mae": 0.11316093802452087,
        "baseline_pearson": 0.5601729154586792,
        "baseline_spearman": 0.5406768335468519,
        "baseline_mse": 0.03232823312282562,
        "baseline_mae": 0.13474518060684204,
        "improvement_pearson": 0.08845692873001099,
        "improvement_spearman": 0.08985494669073857,
        "improvement_mse": 0.010203033685684204,
        "improvement_mae": 0.021584242582321167
    },
    {
        "model": "gte-large-en-v1.5",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.6579754948616028,
        "spearman_correlation": 0.5791423322069298,
        "mse_loss": 0.04830580949783325,
        "mae": 0.15686678886413574,
        "baseline_pearson": 0.5181487798690796,
        "baseline_spearman": 0.4516451502860954,
        "baseline_mse": 0.3569047152996063,
        "baseline_mae": 0.5727789402008057,
        "improvement_pearson": 0.1398267149925232,
        "improvement_spearman": 0.12749718192083437,
        "improvement_mse": 0.30859890580177307,
        "improvement_mae": 0.4159121513366699
    },
    {
        "model": "gte-large-en-v1.5",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.5203901529312134,
        "spearman_correlation": 0.48281227769452784,
        "mse_loss": 0.5536500811576843,
        "mae": 0.5210735201835632,
        "baseline_pearson": 0.32046616077423096,
        "baseline_spearman": 0.36180695389007395,
        "baseline_mse": 0.8027543425559998,
        "baseline_mae": 0.5632946491241455,
        "improvement_pearson": 0.19992399215698242,
        "improvement_spearman": 0.12100532380445389,
        "improvement_mse": 0.24910426139831543,
        "improvement_mae": 0.042221128940582275
    },
    {
        "model": "gte-large-en-v1.5",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.5282294154167175,
        "spearman_correlation": 0.45083681505630735,
        "mse_loss": 0.6177153587341309,
        "mae": 0.6105638742446899,
        "baseline_pearson": 0.3269558548927307,
        "baseline_spearman": 0.3292665913566019,
        "baseline_mse": 0.954206645488739,
        "baseline_mae": 0.6927431225776672,
        "improvement_pearson": 0.20127356052398682,
        "improvement_spearman": 0.12157022369970544,
        "improvement_mse": 0.33649128675460815,
        "improvement_mae": 0.0821792483329773
    },
    {
        "model": "gte-large-en-v1.5",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.41711586713790894,
        "spearman_correlation": 0.4290374814206275,
        "mse_loss": 0.008310465142130852,
        "mae": 0.07435747981071472,
        "baseline_pearson": 0.35529816150665283,
        "baseline_spearman": 0.3815517950199447,
        "baseline_mse": 0.007678679656237364,
        "baseline_mae": 0.07077429443597794,
        "improvement_pearson": 0.061817705631256104,
        "improvement_spearman": 0.04748568640068279,
        "improvement_mse": -0.0006317854858934879,
        "improvement_mae": -0.003583185374736786
    },
    {
        "model": "gte-large-en-v1.5",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.614906907081604,
        "spearman_correlation": 0.6443820279396578,
        "mse_loss": 0.02190900221467018,
        "mae": 0.1231054961681366,
        "baseline_pearson": 0.5473071336746216,
        "baseline_spearman": 0.5966991054663099,
        "baseline_mse": 0.047106169164180756,
        "baseline_mae": 0.19015401601791382,
        "improvement_pearson": 0.06759977340698242,
        "improvement_spearman": 0.04768292247334793,
        "improvement_mse": 0.025197166949510574,
        "improvement_mae": 0.06704851984977722
    },
    {
        "model": "bilingual-embedding-large",
        "dataset": "concepts",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.811042070388794,
        "spearman_correlation": 0.8002859591580646,
        "mse_loss": 0.17100253701210022,
        "mae": 0.35449862480163574,
        "baseline_pearson": 0.2229887694120407,
        "baseline_spearman": 0.3244985189617318,
        "baseline_mse": 0.5775725245475769,
        "baseline_mae": 0.6086645126342773,
        "improvement_pearson": 0.5880533009767532,
        "improvement_spearman": 0.47578744019633273,
        "improvement_mse": 0.4065699875354767,
        "improvement_mae": 0.2541658878326416
    },
    {
        "model": "bilingual-embedding-large",
        "dataset": "concepts",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.8686119318008423,
        "spearman_correlation": 0.8477278410569021,
        "mse_loss": 0.14809198677539825,
        "mae": 0.32456111907958984,
        "baseline_pearson": 0.43430379033088684,
        "baseline_spearman": 0.4776240062123669,
        "baseline_mse": 0.5325793623924255,
        "baseline_mae": 0.5645499229431152,
        "improvement_pearson": 0.43430814146995544,
        "improvement_spearman": 0.37010383484453524,
        "improvement_mse": 0.3844873756170273,
        "improvement_mae": 0.2399888038635254
    },
    {
        "model": "bilingual-embedding-large",
        "dataset": "concepts",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.6103116273880005,
        "spearman_correlation": 0.6060016611575957,
        "mse_loss": 0.022929923608899117,
        "mae": 0.11342088133096695,
        "baseline_pearson": 0.5195952653884888,
        "baseline_spearman": 0.45756916710241413,
        "baseline_mse": 0.030188830569386482,
        "baseline_mae": 0.1346035748720169,
        "improvement_pearson": 0.09071636199951172,
        "improvement_spearman": 0.14843249405518155,
        "improvement_mse": 0.007258906960487366,
        "improvement_mae": 0.021182693541049957
    },
    {
        "model": "bilingual-embedding-large",
        "dataset": "concepts",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.7065712213516235,
        "spearman_correlation": 0.6452966892217452,
        "mse_loss": 0.05107596516609192,
        "mae": 0.1651572287082672,
        "baseline_pearson": 0.6390225291252136,
        "baseline_spearman": 0.590199213722711,
        "baseline_mse": 0.22294461727142334,
        "baseline_mae": 0.44139596819877625,
        "improvement_pearson": 0.06754869222640991,
        "improvement_spearman": 0.05509747549903421,
        "improvement_mse": 0.17186865210533142,
        "improvement_mae": 0.27623873949050903
    },
    {
        "model": "bilingual-embedding-large",
        "dataset": "propositions",
        "endpoint": "a -> b",
        "out_dim": 400,
        "pearson_correlation": 0.8469676971435547,
        "spearman_correlation": 0.7117563654889532,
        "mse_loss": 0.27587494254112244,
        "mae": 0.3888516426086426,
        "baseline_pearson": 0.5125066637992859,
        "baseline_spearman": 0.5231024533425563,
        "baseline_mse": 0.7371945381164551,
        "baseline_mae": 0.5684844851493835,
        "improvement_pearson": 0.3344610333442688,
        "improvement_spearman": 0.18865391214639682,
        "improvement_mse": 0.46131959557533264,
        "improvement_mae": 0.17963284254074097
    },
    {
        "model": "bilingual-embedding-large",
        "dataset": "propositions",
        "endpoint": "b -> a",
        "out_dim": 400,
        "pearson_correlation": 0.7626235485076904,
        "spearman_correlation": 0.5574793737896678,
        "mse_loss": 0.3577965795993805,
        "mae": 0.48553213477134705,
        "baseline_pearson": 0.4464317858219147,
        "baseline_spearman": 0.42987901689334246,
        "baseline_mse": 0.7892018556594849,
        "baseline_mae": 0.6525278687477112,
        "improvement_pearson": 0.31619176268577576,
        "improvement_spearman": 0.12760035689632537,
        "improvement_mse": 0.43140527606010437,
        "improvement_mae": 0.16699573397636414
    },
    {
        "model": "bilingual-embedding-large",
        "dataset": "propositions",
        "endpoint": "char(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.4931808412075043,
        "spearman_correlation": 0.47607017855753947,
        "mse_loss": 0.006652514915913343,
        "mae": 0.06558898091316223,
        "baseline_pearson": 0.5096423029899597,
        "baseline_spearman": 0.4857973977488638,
        "baseline_mse": 0.010924217291176319,
        "baseline_mae": 0.08113962411880493,
        "improvement_pearson": -0.016461461782455444,
        "improvement_spearman": -0.009727219191324354,
        "improvement_mse": 0.004271702375262976,
        "improvement_mae": 0.0155506432056427
    },
    {
        "model": "bilingual-embedding-large",
        "dataset": "propositions",
        "endpoint": "token(a ~ b)",
        "out_dim": 400,
        "pearson_correlation": 0.7388255596160889,
        "spearman_correlation": 0.7358723317248641,
        "mse_loss": 0.01584063284099102,
        "mae": 0.10320574045181274,
        "baseline_pearson": 0.6681331396102905,
        "baseline_spearman": 0.6921161329895124,
        "baseline_mse": 0.026614531874656677,
        "baseline_mae": 0.13661707937717438,
        "improvement_pearson": 0.07069242000579834,
        "improvement_spearman": 0.04375619873535175,
        "improvement_mse": 0.010773899033665657,
        "improvement_mae": 0.03341133892536163
    }
]