,uuid,name,model,creation_date,aggregated_centered_results,aggregated_results,rw_small,95%_CI_above,99%_CI_above,model_uuid,low_variance_datasets,_filename,missing tasks,rw_small_centered,95%_CI_above_centered,99%_CI_above_centered,low_variance_datasets_centered,eval_metrics.perplexity,eval_metrics.downstream_perpexity.mmlu,eval_metrics.downstream_perpexity.hellaswag,eval_metrics.downstream_perpexity.jeopardy_all,eval_metrics.downstream_perpexity.triviaqa_sm_sub,eval_metrics.downstream_perpexity.gsm8k,eval_metrics.downstream_perpexity.agi_eval_sat_math,eval_metrics.downstream_perpexity.aqua,eval_metrics.downstream_perpexity.svamp,eval_metrics.downstream_perpexity.bigbench_qa_wikidata,eval_metrics.downstream_perpexity.arc_easy,eval_metrics.downstream_perpexity.arc_challenge,eval_metrics.downstream_perpexity.bigbench_misconceptions,eval_metrics.downstream_perpexity.copa,eval_metrics.downstream_perpexity.siqa,eval_metrics.downstream_perpexity.commonsense_qa,eval_metrics.downstream_perpexity.piqa,eval_metrics.downstream_perpexity.openbook_qa,eval_metrics.downstream_perpexity.bigbench_novel_concepts,eval_metrics.downstream_perpexity.bigbench_strange_stories,eval_metrics.downstream_perpexity.bigbench_strategy_qa,eval_metrics.downstream_perpexity.lambada_openai,eval_metrics.downstream_perpexity.winograd_wsc,eval_metrics.downstream_perpexity.winogrande,eval_metrics.downstream_perpexity.bigbench_conlang_translation,eval_metrics.downstream_perpexity.bigbench_language_identification,eval_metrics.downstream_perpexity.bigbench_conceptual_combinations,eval_metrics.downstream_perpexity.bigbench_elementary_math_qa,eval_metrics.downstream_perpexity.bigbench_dyck_languages,eval_metrics.downstream_perpexity.agi_eval_lsat_ar,eval_metrics.downstream_perpexity.bigbench_cs_algorithms,eval_metrics.downstream_perpexity.bigbench_logical_deduction,eval_metrics.downstream_perpexity.bigbench_operators,eval_metrics.downstream_perpexity.bigbench_repeat_copy_logic,eval_metrics.downstream_perpexity.simple_arithmetic_nospaces,eval_metrics.downstream_perpexity.simple_arithmetic_withspaces,eval_metrics.downstream_perpexity.math_qa,eval_metrics.downstream_perpexity.logi_qa,eval_metrics.downstream_perpexity.pubmed_qa_labeled,eval_metrics.downstream_perpexity.squad,eval_metrics.downstream_perpexity.agi_eval_lsat_rc,eval_metrics.downstream_perpexity.agi_eval_lsat_lr,eval_metrics.downstream_perpexity.coqa,eval_metrics.downstream_perpexity.bigbench_understanding_fables,eval_metrics.downstream_perpexity.boolq,eval_metrics.downstream_perpexity.agi_eval_sat_en,eval_metrics.downstream_perpexity.winogender_mc_female,eval_metrics.downstream_perpexity.winogender_mc_male,eval_metrics.downstream_perpexity.enterprise_pii_classification,eval_metrics.downstream_perpexity.bbq,eval_metrics.downstream_perpexity.human_eval_return_complex,eval_metrics.downstream_perpexity.human_eval_return_simple,eval_metrics.downstream_perpexity.human_eval-0.5,eval_metrics.downstream_perpexity.human_eval-0.25,eval_metrics.downstream_perpexity.human_eval-0.75,eval_metrics.downstream_perpexity.human_eval,eval_metrics.downstream_perpexity.processed_human_eval_cpp,eval_metrics.downstream_perpexity.processed_human_eval_js,eval_metrics.icl.mmlu_zeroshot,eval_metrics.icl.hellaswag_zeroshot,eval_metrics.icl.jeopardy,eval_metrics.icl.triviaqa_sm_sub,eval_metrics.icl.gsm8k,eval_metrics.icl.agi_eval_sat_math,eval_metrics.icl.aqua,eval_metrics.icl.bigbench_qa_wikidata,eval_metrics.icl.arc_easy,eval_metrics.icl.arc_challenge,eval_metrics.icl.bigbench_misconceptions,eval_metrics.icl.copa,eval_metrics.icl.siqa,eval_metrics.icl.commonsense_qa,eval_metrics.icl.piqa,eval_metrics.icl.openbook_qa,eval_metrics.icl.bigbench_novel_concepts,eval_metrics.icl.bigbench_strange_stories,eval_metrics.icl.bigbench_strategy_qa,eval_metrics.icl.lambada_openai,eval_metrics.icl.hellaswag,eval_metrics.icl.winograd,eval_metrics.icl.winogrande,eval_metrics.icl.bigbench_conlang_translation,eval_metrics.icl.bigbench_language_identification,eval_metrics.icl.bigbench_conceptual_combinations,eval_metrics.icl.bigbench_elementary_math_qa,eval_metrics.icl.bigbench_dyck_languages,eval_metrics.icl.agi_eval_lsat_ar,eval_metrics.icl.bigbench_cs_algorithms,eval_metrics.icl.bigbench_logical_deduction,eval_metrics.icl.bigbench_operators,eval_metrics.icl.bigbench_repeat_copy_logic,eval_metrics.icl.simple_arithmetic_nospaces,eval_metrics.icl.simple_arithmetic_withspaces,eval_metrics.icl.math_qa,eval_metrics.icl.logi_qa,eval_metrics.icl.pubmed_qa_labeled,eval_metrics.icl.squad,eval_metrics.icl.agi_eval_lsat_rc,eval_metrics.icl.agi_eval_lsat_lr,eval_metrics.icl.coqa,eval_metrics.icl.bigbench_understanding_fables,eval_metrics.icl.boolq,eval_metrics.icl.agi_eval_sat_en,eval_metrics.icl.winogender_mc_female,eval_metrics.icl.winogender_mc_male,eval_metrics.icl.enterprise_pii_classification,eval_metrics.icl.bbq,eval_metrics.icl.mmlu_fewshot,eval_metrics.icl.gsm8k_cot,eval_metrics.icl.agi_eval_sat_math_cot,eval_metrics.icl.aqua_cot,eval_metrics.icl.svamp_cot,eval_metrics.icl.gpqa_main,eval_metrics.icl.gpqa_diamond,aggregated_task_categories_centered.commonsense reasoning,aggregated_task_categories_centered.language understanding,aggregated_task_categories_centered.reading comprehension,aggregated_task_categories_centered.safety,aggregated_task_categories_centered.symbolic problem solving,aggregated_task_categories_centered.world knowledge,_source_json,eval_metrics.icl.svamp,model_name,eval_metrics.icl.mmlu,partition_key_1,hyperparameters.tokens,hyperparameters.params,dataset_name,dataset_uuid,tokenizer
0,b9b97500-dbe0-43d4-88ef-4096a79076bb,/opt/ml/code/eval/heavy,open_lm_1b_geglu,2024_08_12-20_54_45,0.12689306129396452,0.3205961449352926,0.5342740714550018,0.40862312550768376,0.4129241879361317,364f4d87-3e34-4575-abe7-7eac90b13c02,0.39445733138233086,,[],0.1937164821122822,0.2139571499297031,0.24906497599054794,0.24136647139764825,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.24001257853549823,0.57588130235672,0.0018487859051674604,0.1106666699051857,,,,0.5809261202812195,0.5681818127632141,0.28412967920303345,0.5114155411720276,0.6800000071525574,0.48515865206718445,0.229320228099823,0.745375394821167,0.37599998712539673,0.4375,0.49425286054611206,0.5185670852661133,0.491558313369751,0.5797649621963501,0.7399267554283142,0.5674822330474854,0.018292682245373726,0.25440001487731934,0.24271844327449799,0.23721173405647278,0.14000000059604645,0.22173912823200226,0.4265151619911194,0.2606666684150696,0.19523809850215912,0.0625,0.0020000000949949026,0.0010000000474974513,0.2507542669773102,0.29032257199287415,0.5490000247955322,0.21021759510040283,0.2276119440793991,0.25882354378700256,0.2170863151550293,0.27513226866722107,0.5299693942070007,0.22815534472465515,0.44999998807907104,0.44999998807907104,0.5245950222015381,0.4550830911506306,0.25579144871025755,0.0022744503803551197,0.004545454401522875,0.004081632476300001,0.0533333346247673,0.2321428507566452,0.24242424964904785,0.20075498495915572,0.27111415522930193,0.11402684710756467,-0.060160955244844605,0.0754861346621398,0.1146516151259223,exp_data/evals/evaluation_c4_original-open_lm_1b_geglu-warm=5000-lr=0p003-wd=0p033-cd=3e-05-bs=256-mult=1-seed=124-tokens=28795904000-norm=rms_norm_heavy.json,,,,,28795904000.0,1439795200,c4_original,7e0f5507-aa36-4d8c-9026-d049f885adf1,EleutherAI/gpt-neox-20b
1,ccff9006-bb07-4bf6-be5e-d5dd36a19ee2,/opt/ml/code/eval/heavy,open_lm_1b_geglu,2024_08_13-00_42_22,0.13754336931810704,0.3268954636955808,0.5357639143864313,0.41371760952782316,0.4215695242518964,2cd33b23-fde5-4dce-a78e-118cadb3f9d1,0.4143791760910641,,[],0.21684665533534267,0.22112863045912787,0.25993768366168785,0.2627991200798645,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.24189689441731102,0.48904600739479065,0.17444142699241638,0.17233332991600037,,,,0.6215245127677917,0.566919207572937,0.282423198223114,0.534246563911438,0.6899999976158142,0.4790174067020416,0.1973792016506195,0.7034820318222046,0.35199999809265137,0.40625,0.4885057508945465,0.5133246183395386,0.5488065481185913,0.49163514375686646,0.721611738204956,0.5595895648002625,0.018292682245373726,0.257099986076355,0.24271844327449799,0.23052935302257538,0.210999995470047,0.25652173161506653,0.4575757682323456,0.23133333027362823,0.20476190745830536,0.0625,0.003000000026077032,0.004000000189989805,0.2527656853199005,0.22734254598617554,0.2939999997615814,0.37284767627716064,0.2761194109916687,0.2764706015586853,0.2685707211494446,0.19576719403266907,0.6266055107116699,0.24757280945777893,0.5,0.5833333134651184,0.5428571701049805,0.49835840138522064,0.24641405333552444,0.008339650928974152,0.013636363670229912,0.008163264952600002,0.05000000074505806,0.2053571492433548,0.21717171370983124,0.17500974357394367,0.24292869413987714,0.14187644678576475,0.06227444247765976,0.07856531389670013,0.1383702019501848,exp_data/evals/evaluation_rpj_original-open_lm_1b_geglu-warm=5000-lr=0p003-wd=0p033-cd=3e-05-bs=256-mult=1-seed=124-tokens=28795904000-norm=rms_norm_heavy.json,,,,,28795904000.0,1439795200,rpj_original,67db6b77-c7c4-48ae-b431-57254587ed43,EleutherAI/gpt-neox-20b
2,335c200a-c7bc-4b6d-8187-942d7369cd5b,/opt/ml/code/eval/heavy,open_lm_1b_geglu,2024_08_13-02_30_50,0.13847180257148328,0.3301250135324626,0.5495777676502863,0.4226177982405409,0.43101297552170964,53285675-362b-4159-abf5-8f34a8bf01d3,0.4166276174512777,,[],0.2340971900705706,0.23106796337327287,0.27088274826003705,0.26864405582071904,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.24903027059739097,0.5590519905090332,0.16123516261577606,0.15133333206176758,,,,0.589144229888916,0.5782828330993652,0.29010239243507385,0.4794520437717438,0.6899999976158142,0.48669394850730896,0.28091728687286377,0.7415668964385986,0.35600000619888306,0.40625,0.5287356376647949,0.5176933407783508,0.53017657995224,0.563035249710083,0.7106227278709412,0.5580110549926758,0.012195121496915817,0.2522999942302704,0.25242719054222107,0.23951782286167145,0.19499999284744263,0.20000000298023224,0.45606061816215515,0.2486666738986969,0.1666666716337204,0.0625,0.0020000000949949026,0.004000000189989805,0.2537713646888733,0.2764976918697357,0.5019999742507935,0.3364238440990448,0.25,0.2549019753932953,0.2666917145252228,0.2539682686328888,0.6220183372497559,0.3203883469104767,0.44999998807907104,0.44999998807907104,0.4977908730506897,0.46713169054551557,0.25681010882059735,0.015163002535700798,0.004545454401522875,0.01224489789456129,0.0533333346247673,0.2120535671710968,0.2222222238779068,0.21083873813633974,0.2612216141606641,0.17535823511711338,-0.06753873012282632,0.07719065004589724,0.1271952006778522,exp_data/evals/evaluation_rw_original-open_lm_1b_geglu-warm=5000-lr=0p003-wd=0p033-cd=3e-05-bs=256-mult=1-seed=124-tokens=28795904000-norm=rms_norm_heavy.json,,,,,28795904000.0,1439795200,rw_original,7e0f5507-aa36-4d8c-9026-d049f885adf7,EleutherAI/gpt-neox-20b
3,0bad0292-96cf-4e58-8e12-014663f0590e,/opt/ml/code/eval/heavy,open_lm_1b_geglu,2024_08_12-20_00_13,0.1515624918868134,0.3391815624022517,0.5856820543607076,0.4348402524149263,0.4449775440537412,3fed5764-e979-4776-a327-69c2a29df900,0.4423281653360887,,[],0.2883940436686689,0.2510520233735962,0.2935939589141663,0.3027168997755465,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.2516034177520819,0.5774745941162109,0.27126975655555724,0.19699999690055847,,,,0.595738410949707,0.6632996797561646,0.361774742603302,0.4840182662010193,0.6899999976158142,0.5092118978500366,0.23914824426174164,0.7459194660186768,0.38600000739097595,0.46875,0.540229856967926,0.5404106378555298,0.6031438112258911,0.5870344638824463,0.7545787692070007,0.5848460793495178,0.018292682245373726,0.25920000672340393,0.2330097109079361,0.24444444477558136,0.19499999284744263,0.27391305565834045,0.385606050491333,0.25733333826065063,0.190476194024086,0.03125,0.0020000000949949026,0.0020000000949949026,0.2537713646888733,0.2304147481918335,0.24699999392032623,0.38580888509750366,0.26119402050971985,0.2764706015586853,0.31304019689559937,0.2539682686328888,0.6366972327232361,0.3009708821773529,0.38333332538604736,0.46666666865348816,0.5154638886451721,0.46845845742659137,0.24901916975514932,0.01440485194325447,0.0181818176060915,0.008163264952600002,0.07000000029802322,0.2321428507566452,0.24747474491596222,0.23293897741614306,0.29358538254666194,0.16216143145503706,-0.0830388299443505,0.07664557028281158,0.17057975041936016,exp_data/evals/evaluation_rw_v2_cc_v3_f0.15_resiliparse_fasttext_openhermes_reddit_eli5_vs_rw_v2_bigram_200k_train_0.1-open_lm_1b_geglu-warm=5000-lr=0p003-wd=0p033-cd=3e-05-bs=256-mult=1-seed=124-tokens=28795904000-norm=rms_norm_heavy.json,,,,,28795904000.0,1439795200,rw_v2_cc_v3_f0.15_resiliparse_fasttext_openhermes_reddit_eli5_vs_rw_v2_bigram_200k_train_0.1,430347e8-4739-4031-b69a-99e0fcf6a6ea,EleutherAI/gpt-neox-20b
4,a9419fbd-7541-47ce-8d50-7352b02bec29,/mnt/task_runtime/dcnlp/eval/heavy,open_lm_1b_geglu,2024_08_15-16_54_02,0.15603987249405468,0.344521978378679,0.5824327518542608,0.4525916912435711,0.4637442960687306,8cfba404-e589-40f8-8e8e-0a54cea3255e,0.4507863227616657,,[],0.28325542685581234,0.26865721892789096,0.31112226732103637,0.3112068308145879,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.25012068999441045,0.5813583135604858,0.2648723065853119,0.19833333790302277,,,,0.6015943884849548,0.6561447978019714,0.345563143491745,0.42465752363204956,0.699999988079071,0.4994882345199585,0.3046683073043823,0.7459194660186768,0.3580000102519989,0.46875,0.5574712753295898,0.530362606048584,0.6153696775436401,0.5891256928443909,0.761904776096344,0.5824782848358154,0.018292682245373726,0.25060001015663147,0.25242719054222107,0.2519915997982025,0.21299999952316284,0.2652173936367035,0.4310606122016907,0.257999986410141,0.190476194024086,0.125,0.004000000189989805,0.006000000052154064,0.2608112692832947,0.27496159076690674,0.5139999985694885,0.3810785114765167,0.23134328424930573,0.24117647111415863,0.3248152434825897,0.19576719403266907,0.6290519833564758,0.23786407709121704,0.4333333373069763,0.4833333194255829,0.48541972041130066,0.4799471578814767,0.25071707211042704,0.016679301857948303,0.022727273404598236,0.01224489789456129,0.03999999910593033,0.2098214328289032,0.23232322931289673,0.24098588959469847,0.2994026224806646,0.16411152732019363,-0.05898323248733173,0.09086735262301618,0.1507035567624527,exp_data/evals/evaluation_cc_v4_resiliparse_rw_v2_bff1shards_shard_3_OH_eli5_vs_rw_v2_bigram_200k_train_0.1-open_lm_1b_geglu-warm=5000-lr=0p003-wd=0p033-cd=3e-05-bs=256-mult=1-seed=124-tokens=28795904000-norm=rms_norm_heavy.json,,,,,28795904000.0,1439795200,cc_v4_resiliparse_rw_v2_bff1shards_shard_3_OH_eli5_vs_rw_v2_bigram_200k_train_0.1,334daad0-735f-4f7d-ac82-215e9374546e,EleutherAI/gpt-neox-20b
5,d35332c7-65c4-42f0-8439-b15d68e0d6bb,/mnt/task_runtime/dcnlp/eval/heavy,open_lm_1b_geglu,2024_08_15-21_25_44,0.154857783933249,0.3431467662247598,0.571837509671847,0.442919793507302,0.4523341604548952,9a5bf51b-aa3e-43a4-94e8-8b9d83ee2c5e,0.4424300966615027,,[],0.25916438179406504,0.2558002801152476,0.29641874173981464,0.2989218818174308,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.26483296772889925,0.5760804414749146,0.25683853179216387,0.20033332705497742,,,,0.5689680576324463,0.6527777910232544,0.3464163839817047,0.4840182662010193,0.6800000071525574,0.4984646737575531,0.3316953182220459,0.7366703152656555,0.3659999966621399,0.4375,0.5747126340866089,0.5351681709289551,0.5994566082954407,0.5822545289993286,0.761904776096344,0.5824782848358154,0.024390242993831635,0.24979999661445618,0.3009708821773529,0.23639936745166779,0.2070000022649765,0.25217390060424805,0.3962121307849884,0.25,0.20000000298023224,0.09375,0.0,0.006000000052154064,0.24136775732040405,0.2688172161579132,0.42399999499320984,0.39744558930397034,0.2723880708217621,0.24313725531101227,0.30226731300354004,0.2857142984867096,0.5932721495628357,0.276699036359787,0.44999998807907104,0.44999998807907104,0.496023565530777,0.45561225847764447,0.2634548665138713,0.004548900760710239,0.004545454401522875,0.01224489789456129,0.06333333253860474,0.2165178507566452,0.21212121844291687,0.23966700487631906,0.30413144700561123,0.16756558683782555,-0.07418209991671823,0.08072938343731167,0.16023378868113486,exp_data/evals/evaluation_cc_v4_resiliparse_rw_v2_bff_minngram20_10shards_shard3_OH_eli5_vs_rw_v2_bigram_200k_train_0.1-open_lm_1b_geglu-warm=5000-lr=0p003-wd=0p033-cd=3e-05-bs=256-mult=1-seed=124-tokens=28795904000-norm=rms_norm_heavy.json,,,,,28795904000.0,1439795200,cc_v4_resiliparse_rw_v2_bff_minngram20_10shards_shard3_OH_eli5_vs_rw_v2_bigram_200k_train_0.1,167cff17-2d14-46ab-ae83-44d428f8c50d,tokenizers/gpt_neox_tokenizer.json
6,7e3d4d58-572e-4fbe-90a0-0ac20db9e728,/mnt/task_runtime/dcnlp/eval/heavy,open_lm_1b_geglu,2024_08_16-01_58_00,0.16699909587447365,0.3501837466536657,0.5829706788063049,0.44971606950094173,0.45819611160651497,4b4cb97c-99d1-42cf-a6ed-3d288aa051f3,0.44658147638494317,,[],0.2864196952323467,0.26781822454179743,0.3074060604919649,0.3084355041306183,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.25575654757650274,0.5763791799545288,0.26414390504360197,0.19300000369548798,,,,0.5973131060600281,0.6523569226264954,0.3395904302597046,0.4885844886302948,0.7200000286102295,0.48362332582473755,0.3316953182220459,0.7415668964385986,0.3919999897480011,0.5625,0.6091954112052917,0.5220620632171631,0.5965456962585449,0.5821549296379089,0.7692307829856873,0.576164186000824,0.030487805604934692,0.25360000133514404,0.2330097109079361,0.2431865781545639,0.21799999475479126,0.25217390060424805,0.41893938183784485,0.25200000405311584,0.17619048058986664,0.03125,0.003000000026077032,0.004000000189989805,0.24773718416690826,0.23502303659915924,0.47099998593330383,0.4076631963253021,0.2985074520111084,0.2823529541492462,0.29450082778930664,0.29100528359413147,0.6333333253860474,0.30582523345947266,0.46666666865348816,0.5166666507720947,0.49631810188293457,0.5009445683522658,0.2412177823614656,0.009855951182544231,0.027272727340459824,0.004081632476300001,0.06666667014360428,0.1964285671710968,0.19696970283985138,0.27731854301029774,0.2940116362201564,0.2028146831547482,-0.009702005169608396,0.07701435158471472,0.15413859291731963,exp_data/evals/evaluation_cc_v4_resiliparse_rw_v2_bff_minngram20_32shards_shard3_OH_eli5_vs_rw_v2_bigram_200k_train_0.1-open_lm_1b_geglu-warm=5000-lr=0p003-wd=0p033-cd=3e-05-bs=256-mult=1-seed=124-tokens=28795904000-norm=rms_norm_heavy.json,,,,,28795904000.0,1439795200,cc_v4_resiliparse_rw_v2_bff_minngram20_32shards_shard3_OH_eli5_vs_rw_v2_bigram_200k_train_0.1,903b957f-6097-406d-8b74-c4f14975f2b5,tokenizers/gpt_neox_tokenizer.json
7,eb5d84b7-1dfb-4e29-8cec-379aa27c5176,/mnt/task_runtime/dcnlp/eval/heavy,open_lm_1b_geglu,2024_08_15-17_29_47,0.13165642813391717,0.3251720689782884,0.5276335030794144,0.4137554775276403,0.41475239712744955,9748278c-5659-4dd3-b6fa-06f9615f4f0a,0.40147763279859316,,[],0.18669259304191635,0.2192995455985336,0.24831985130800968,0.24474139376972187,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.23923929427799426,0.5404301881790161,0.05240039359778166,0.1340000033378601,,,,0.5860440135002136,0.5841751098632812,0.2875426709651947,0.5205479264259338,0.6499999761581421,0.5117707252502441,0.23587223887443542,0.7312296032905579,0.3580000102519989,0.5,0.5057471394538879,0.5220620632171631,0.49679797887802124,0.5499900579452515,0.7106227278709412,0.5311760306358337,0.018292682245373726,0.25929999351501465,0.26213592290878296,0.23949161171913147,0.2540000081062317,0.13913042843341827,0.4727272689342499,0.25333333015441895,0.2142857164144516,0.0625,0.0010000000474974513,0.0020000000949949026,0.26148173213005066,0.2534562349319458,0.41999998688697815,0.28751182556152344,0.2537313401699066,0.26862746477127075,0.2562946379184723,0.24867725372314453,0.5724770426750183,0.291262149810791,0.44999998807907104,0.4000000059604645,0.5460972189903259,0.5081940157846971,0.24105101666952433,0.008339650928974152,0.00909090880304575,0.004081632476300001,0.0533333346247673,0.2321428507566452,0.24242424964904785,0.20624249416735324,0.24840561390395416,0.1384446636789985,-0.047854385592720705,0.07836614710684933,0.12489738528633065,exp_data/evals/evaluation_dolma_v1_no_resample-open_lm_1b_geglu-warm=5000-lr=0p003-wd=0p033-cd=3e-05-bs=256-mult=1-seed=124-tokens=28795904000-norm=rms_norm_heavy.json,,,,,28795904000.0,1439795200,dolma_v1_no_resample,bdff90b2-5557-4699-a4c5-8d7b287ddc1b,EleutherAI/gpt-neox-20b
8,e17c3f81-22b0-49cf-a342-f52e1845240f,/mnt/task_runtime/dcnlp/eval/heavy,open_lm_1b_geglu,2024_08_15-22_04_07,0.15544744528004273,0.34028149505803695,0.582904244462649,0.4367945290521368,0.4441915951345278,14f4236a-9ae1-43f9-9e4b-89c8b029aff2,0.43791410801085556,,[],0.28108075313400804,0.2525726555366656,0.29047102052050633,0.2966490316572866,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.24825809529998846,0.5756821632385254,0.2674189805984497,0.19499999284744263,,,,0.5904237031936646,0.6502525210380554,0.34897610545158386,0.4794520437717438,0.75,0.48004093766212463,0.21457821130752563,0.7459194660186768,0.3779999911785126,0.4375,0.5804597735404968,0.5439056158065796,0.5992625951766968,0.5870344638824463,0.7765567898750305,0.5816890001296997,0.018292682245373726,0.2531999945640564,0.28155338764190674,0.2493186593055725,0.2150000035762787,0.186956524848938,0.4477272629737854,0.23733332753181458,0.190476194024086,0.0,0.003000000026077032,0.007000000216066837,0.24472008645534515,0.26574501395225525,0.33799999952316284,0.38136234879493713,0.24253731966018677,0.2568627595901489,0.30276837944984436,0.23280423879623413,0.5908256769180298,0.276699036359787,0.5166666507720947,0.5166666507720947,0.4974963068962097,0.48513610796494916,0.25136891739410266,0.006823351141065359,0.00909090880304575,0.020408162847161293,0.04333333298563957,0.2232142835855484,0.21212121844291687,0.24334816383416655,0.30477225603161806,0.14327628825578773,0.007982858202674165,0.0723294144173123,0.15906682857993054,exp_data/evals/evaluation_fasttext_openhermes_reddit_eli5_vs_rw_v2_bigram_200k_train_minhash.b15.r93_substr-open_lm_1b_geglu-warm=5000-lr=0p003-wd=0p033-cd=3e-05-bs=256-mult=1-seed=124-tokens=28795904000-norm=rms_norm_heavy.json,,,,,28795904000.0,1439795200,fasttext_openhermes_reddit_eli5_vs_rw_v2_bigram_200k_train_minhash.b15.r93_substr,e8fbc9af-0704-4e54-b961-b71dc1d9ead6,EleutherAI/gpt-neox-20b
9,cc45be5a-169e-442b-87cb-4b61e0c9a4ff,/mnt/task_runtime/dcnlp/eval/heavy,open_lm_1b_geglu,2024_08_16-04_36_28,0.15099520126006608,0.33923847575259913,0.5864851226409277,0.43980065596761636,0.45472059159175204,d6470484-48cf-451e-81cc-62d4d954c043,0.4421331027692014,,[],0.2938381182520013,0.25454774884195924,0.3043825338250076,0.30451114026636855,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.252138761313338,0.5759809017181396,0.19789857864379884,0.1860000044107437,,,,0.5832390189170837,0.6351010203361511,0.34215018153190613,0.465753436088562,0.7400000095367432,0.4979529082775116,0.2612612545490265,0.7415668964385986,0.3919999897480011,0.46875,0.545976996421814,0.5037134289741516,0.5903357267379761,0.5819557905197144,0.7655677795410156,0.6045777201652527,0.012195121496915817,0.2502000033855438,0.1650485396385193,0.24748428165912628,0.2240000069141388,0.291304349899292,0.44621211290359497,0.24533332884311676,0.20952381193637848,0.0,0.004000000189989805,0.004000000189989805,0.25544753670692444,0.2703533172607422,0.4869999885559082,0.3725638687610626,0.24253731966018677,0.239215686917305,0.3003883361816406,0.26455026865005493,0.621100902557373,0.2572815418243408,0.44999998807907104,0.46666666865348816,0.49484536051750183,0.4479794746095484,0.2590513527393341,0.007581501267850399,0.00909090880304575,0.016326529905200005,0.0533333346247673,0.2209821492433548,0.21212121844291687,0.23895847001929824,0.28524245928647146,0.16942964024482327,-0.07025425407019528,0.08493427162454144,0.14607040522914183,exp_data/evals/evaluation_rw_v2_cc_v3_f0.15_resiliparse_fasttext_openhermes_reddit_eli5_vs_rw_v2_bigram_200k_train_0.2-open_lm_1b_geglu-warm=5000-lr=0p003-wd=0p033-cd=3e-05-bs=256-mult=1-seed=124-tokens=28795904000-norm=rms_norm_heavy.json,,,,,28795904000.0,1439795200,rw_v2_cc_v3_f0.15_resiliparse_fasttext_openhermes_reddit_eli5_vs_rw_v2_bigram_200k_train_0.2,cbf619ee-6f45-42a2-8cec-18d9e55ffb83,EleutherAI/gpt-neox-20b
