model,4,,,,8,,,,16,,,,32,,,,64,,,,96,,,,128,,,
,token accuracy,std,EM,std,token accuracy,std,EM,std,token accuracy,std,EM,std,token accuracy,std,EM,std,token accuracy,std,EM,std,token accuracy,std,EM,std,token accuracy,std,EM,std
llama-L4H4D128,"100,0","0,0","100,0","0,0","100,0","0,0","100,0","0,0","99,9","0,0","99,8","0,0","99,9","0,1","99,8","0,3","98,2","1,5","96,5","2,9","99,4","0,0","98,8","0,0",,,,
mamba-L4H128,"100,0","0,0","99,9","0,1","99,5","0,2","98,9","0,4","99,4","0,1","98,7","0,2","95,1","5,2","90,2","10,2","97,5","0,04","95,2","0,1","87,3",,"76,3",,,,,
,,,,,,,,,,,,,,,,,,,,,,,,,,,,
"RMT-llama-L4H4D128
(mem=8, K=1)","99,0","0,3","98,2","0,7","98,1","2,0","96,2","3,8","11,8","0,2","1,4","0,1",,,,,,,,,,,,,,,,
"RMT-llama-L4H4D128
(mem=8, K=2)",,,,,"99,0","0,9","98,0","1,7","26,1","32,6","15,3","31,5",,,,,,,,,,,,,,,,
"RMT-llama-L4H4D128
(mem=8, K=1, reconstruct)","100,0","0,0","100,0","0,0","100,0","0,0","100,0","0,0","74,7","31,4","45,5","0,2","46,7","0,1","44,3","0,0",,,,,,,,,,,,
"RMT-llama-L4H4D128
(mem=8, K=2, reconstruct)",,,,,,,,,"74,5","24,1","69,6","28,1","21,5","3,3","18,7","3,4",,,,,,,,,,,,
"RMT-llama-L4H4D128
(mem=8, K=3, reconstruct)",,,,,,,,,"66,3","37,9","60,0","42,0","40,7","0,1","38,1","0,0",,,,,,,,,,,,
"RMT-llama-L4H4D128
(mem=8, K=4, reconstruct)",,,,,,,,,,,,,"33,9","0,1","31,5","0,0",,,,,,,,,,,,
"RMT-llama-L4H4D128
(mem=8, K=5, reconstruct)",,,,,,,,,,,,,"39,1","1,7","37,0","1,7",,,,,,,,,,,,
,,,,,,,,,,,,,,,,,,,,,,,,,,,,
"RMT-llama-L4H4D128
(mem=8, K=1, curriculum)
4 pairs per segment","99,5","0,1","99,1","0,1","99,1","0,2","98,5","0,4","96,1","1,0","93,0","1,7","83,4","2,9","72,0","4,8","53,6","5,7","33,8","5,9",,,,,"29,0","0,1","12,04","0,2"
"ARMT-llama-L4H4D128
(mem=8, K=1)","99,5","0,1","99,0","0,3","99,1","0,3","98,5","0,5","98,4","0,1","97,4","0,3","63,3","1,9","54,9","2,1","28,5","3,8","22,6","3,9","19,6","0,2","15,2","0,2",,,,
,,,,,,,,,,,,,,,,,,,,,,,,,,,,
,,,,,,,,,,,,,,,,,,,,,,,,,,,,
"gradmem-llama-L4H4D128
(mem=8; K=1)","100,0","0,0","100,0","0,0","99,7","0,1","99,3","0,2","98,1","0,4","96,3","0,9","93,0","0,3","86,9","0,5","74,7","0,5","58,6","0,7",,,,,,,,
"gradmem-llama-L4H4D128
(mem=8; K=2)","100,0","0,0","100,0","0,0","100,0","0,0","100,0","0,0","99,8","0,0","99,6","0,1","99,1","0,0","98,3","0,1","85,2","0,1","72,8","0,5",,,,,,,,
"gradmem-llama-L4H4D128
(mem=8; K=5)",,,,,,,,,,,,,"100,0","0,0","99,9","0,1","99,5","0,2","99,1","0,3","94,0","1,3","88,4","2,3",,,,
,,,,,,,,,,,,,,,,,,,,,,,,,,,,
"gradmem-llama-L4H4D128
(mem=8; K=1, no meta)",,,,,"39,5","16,1","12,9","8,1","7,2","2,4","0,5","0,3",,,,,,,,,,,,,,,,
"gradmem-llama-L4H4D128
(mem=8; K=2, no meta)",,,,,"62,9","4,1","35,0","5,5","32,1","6,0","3,7","1,0",,,,,,,,,,,,,,,,