pythia-progressive

================================================================================
Progressive Embeddings Statistics
================================================================================
Experiment                                                             # Compr. Tok    Traj. Len         Steps Taken       PCA 99%         PCA ALL 99%    Rand. Proj. 99%    Info Gain  Info Gain (Dataset)      Emb. Stats (Comp/Vocab)
sl_4096_pythia-1.4b_loss_cosine_hybrid_1.0_align_16                    155.50±35.46    69.29±16.43       4943.00±1924.33   13.50±1.50               92                nan          nan  427.0738±66.0513                             nan
sl_4096_pythia-1.4b_loss_cosine_hybrid_1.0_align_20                    116.60±26.13    58.45±9.97        4590.50±1129.87   11.90±0.83               87                nan          nan  306.9694±35.4717                             nan
sl_4096_pythia-1.4b_loss_cosine_hybrid_1.0_align_4                     182.70±31.05    82.87±9.24        6143.10±1368.16   14.60±1.96               98                nan          nan  553.0752±63.3932                             nan
sl_4096_pythia-1.4b_loss_cosine_hybrid_1.0_align_8                     178.70±33.07    80.22±13.09       6360.10±1979.46   14.30±1.79               94                nan          nan  524.2754±92.2529                             nan
sl_4096_pythia-1.4b_lowdim_128_lowproj_loss_cosine_hybrid_1.0_align_8  468.30±68.63    4698.94±2413.72   9187.70±2180.80   20.00±4.96              111                nan          nan  1447.9609±106.4891                           nan
sl_4096_pythia-1.4b_lowdim_256_lowproj_loss_cosine_hybrid_1.0_align_8  498.20±92.75    5395.50±3309.25   9865.90±2045.42   19.60±5.89              101                nan          nan  1555.3695±145.8146                           nan
sl_4096_pythia-1.4b_lowdim_32_lowproj_loss_cosine_hybrid_1.0_align_8   423.10±104.44   2497.97±1438.45   9974.60±2932.32   15.50±4.57               88                nan          nan  1317.2888±220.9443                           nan
sl_4096_pythia-1.4b_lowdim_64_lowproj_loss_cosine_hybrid_1.0_align_8   447.80±81.93    3309.23±2568.56   8570.50±2375.71   16.90±4.01               84                nan          nan  1397.7190±185.6337                           nan
sl_4096_pythia-1.4b                                                    188.20±27.79    83.05±13.96       0.00±0.00         15.70±1.85              102                nan          nan  580.8471±100.6887                            nan
sl_4096_pythia-1.4b_lr_0.1                                             274.30±56.21    955.73±122.75     0.00±0.00         23.20±1.99              147                nan          nan  846.0144±106.0048                            nan
sl_4096_pythia-1.4b_lr_0.5                                             543.80±56.76    6729.57±390.17    0.00±0.00         49.00±3.32              313                nan          nan  1694.0125±125.2676                           nan
sl_4096_pythia-1.4b_lr_1.0                                             558.20±74.15    11380.97±992.91   0.00±0.00         63.30±6.21              406                nan          nan  1736.9688±158.3229                           nan
sl_4096_pythia-1.4b_lr_5.0                                             517.20±87.30    33749.49±3698.68  0.00±0.00         128.00±13.18             -1                nan          nan  1533.8012±139.6697                           nan
sl_4096_pythia-1.4b_lowdim_32_lowproj                                  358.20±80.64    1550.61±953.66    8742.30±2395.37   15.10±3.01               82                nan          nan  1136.5011±241.3849                           nan
sl_4096_pythia-1.4b_lowdim_64_lowproj                                  392.80±96.62    1919.65±1190.73   8196.50±1920.41   16.70±3.69               87                nan          nan  1240.0505±286.2224                           nan
sl_4096_pythia-1.4b_lowdim_128_lowproj                                 373.00±81.81    1914.51±1133.27   9013.20±1934.87   15.80±3.22               89                nan          nan  1168.0420±240.0144                           nan
sl_4096_pythia-1.4b_lowdim_256_lowproj                                 375.50±100.66   2134.77±1312.39   7590.50±2342.10   16.50±2.16               87                nan          nan  1188.9791±313.6299                           nan
sl_4096_pythia-1.4b_lowdim_512_lowproj                                 415.50±76.30    2863.47±1432.90   7473.30±1632.56   18.00±2.49               98                nan          nan  1332.7256±199.7924                           nan


sl_4096_pythia-160m_loss_cosine_hybrid_1.0_align_16                    13.60±5.62      27.78±10.42       2931.20±1433.96   5.30±2.37                46                nan          nan  54.7593±24.2250                              nan
sl_4096_pythia-160m_loss_cosine_hybrid_1.0_align_20                    13.60±5.62      27.78±10.42       2931.20±1433.96   5.30±2.37                46                nan          nan  54.7593±24.2250                              nan
sl_4096_pythia-160m_loss_cosine_hybrid_1.0_align_4                     10.40±1.91      21.13±6.35        2037.30±691.64    3.60±1.50                39                nan          nan  39.6921±15.4719                              nan
sl_4096_pythia-160m_loss_cosine_hybrid_1.0_align_8                     11.30±2.19      23.11±6.50        2141.90±578.33    4.50±1.20                44                nan          nan  41.9960±12.9570                              nan
sl_4096_pythia-160m_lowdim_128_lowproj_loss_cosine_hybrid_1.0_align_8  13.10±3.62      926.84±437.27     2717.80±1194.37   4.30±1.90                39                nan          nan  44.1375±39.0951                              nan
sl_4096_pythia-160m_lowdim_256_lowproj_loss_cosine_hybrid_1.0_align_8  14.00±7.44      1590.59±1370.67   2865.00±1608.03   3.90±3.05                32                nan          nan  38.5154±23.0642                              nan
sl_4096_pythia-160m_lowdim_32_lowproj_loss_cosine_hybrid_1.0_align_8   9.80±1.83       310.64±139.71     2062.60±437.54    2.80±1.25                30                nan          nan  29.4400±26.5642                              nan
sl_4096_pythia-160m_lowdim_64_lowproj_loss_cosine_hybrid_1.0_align_8   13.90±6.22      663.31±517.54     2911.10±1517.09   4.90±2.70                38                nan          nan  48.4926±31.3420                              nan
sl_4096_pythia-160m_lr_0.1                                             11.70±1.68      239.33±55.11      0.00±0.00         5.60±1.20                57                nan          nan  25.1209±16.4659                              nan
sl_4096_pythia-160m_lr_0.5                                             10.70±1.95      651.57±196.02     0.00±0.00         5.10±1.64                56                nan          nan  18.8272±25.5783                              nan
sl_4096_pythia-160m_lr_1.0                                             10.20±1.33      952.06±190.27     0.00±0.00         5.10±1.04                59                nan          nan  23.6151±11.8344                              nan
sl_4096_pythia-160m_lr_5.0                                             8.40±1.85       1497.49±611.48    0.00±0.00         4.40±1.56                53                nan          nan  -7.7184±29.8996                              nan
sl_4096_pythia-160m                                                    10.80±3.16      24.32±9.30        0.00±0.00         4.30±1.73                43                nan          nan  38.6282±19.5051                              nan
sl_4096_pythia-160m_lowdim_32_lowproj                                  9.50±3.23       264.30±214.07     1876.60±707.52    2.50±1.86                25                nan          nan  20.6846±23.0741                              nan
sl_4096_pythia-160m_lowdim_64_lowproj                                  12.70±6.26      595.78±447.19     2865.50±1497.25   3.60±3.38                35                nan          nan  50.1697±26.8477                              nan
sl_4096_pythia-160m_lowdim_128_lowproj                                 10.40±4.34      742.06±638.37     2547.10±1830.70   2.90±2.39                25                nan          nan  36.6760±25.5980                              nan
sl_4096_pythia-160m_lowdim_256_lowproj                                 10.70±2.76      1155.91±587.25    2486.50±978.28    2.30±1.49                26                nan          nan  36.9150±20.4974                              nan
sl_4096_pythia-160m_lowdim_512_lowproj                                 15.50±6.59      3490.27±2241.99   3259.30±1451.67   5.00±3.29                40                nan          nan  64.5877±41.3813                              nan


sl_4096_pythia-410m_loss_cosine_hybrid_1.0_align_16                    31.90±7.05      37.78±10.23       3207.90±987.47    8.10±1.81                60                nan          nan  104.7126±16.8411                             nan
sl_4096_pythia-410m_loss_cosine_hybrid_1.0_align_20                    29.80±6.95      35.28±7.97        2929.00±710.38    8.20±2.09                62                nan          nan  98.7885±14.6260                              nan
sl_4096_pythia-410m_loss_cosine_hybrid_1.0_align_4                     45.40±11.93     55.07±17.24       4260.40±1697.25   10.50±3.56               74                nan          nan  159.8979±34.9961                             nan
sl_4096_pythia-410m_loss_cosine_hybrid_1.0_align_8                     39.60±9.87      47.22±16.97       3723.00±1934.49   9.80±2.48                71                nan          nan  138.3409±32.1351                             nan
sl_4096_pythia-410m_lowdim_128_lowproj_loss_cosine_hybrid_1.0_align_8  138.60±40.17    5320.13±2022.79   10712.00±4845.11  18.40±4.05               98                nan          nan  471.4457±109.6528                            nan
sl_4096_pythia-410m_lowdim_256_lowproj_loss_cosine_hybrid_1.0_align_8  148.40±31.88    7775.44±2012.94   11268.70±3571.56  20.30±3.41              106                nan          nan  508.4418±65.2160                             nan
sl_4096_pythia-410m_lowdim_32_lowproj_loss_cosine_hybrid_1.0_align_8   110.30±54.16    2244.96±1444.60   9660.80±5347.35   13.10±5.32               70                nan          nan  379.4649±156.3271                            nan
sl_4096_pythia-410m_lowdim_64_lowproj_loss_cosine_hybrid_1.0_align_8   133.00±43.43    4755.84±1555.95   11069.10±4773.85  16.70±4.67               95                nan          nan  452.0144±93.0450                             nan
sl_4096_pythia-410m_lr_0.1                                             102.40±35.95    855.94±235.83     0.00±0.00         26.80±7.93              178                nan          nan  350.9311±102.6158                            nan
sl_4096_pythia-410m_lr_0.5                                             102.10±40.76    3613.26±840.91    0.00±0.00         37.50±11.16             286                nan          nan  322.6948±105.3743                            nan
sl_4096_pythia-410m_lr_1.0                                             61.80±13.59     3951.88±982.82    0.00±0.00         24.90±6.39              215                nan          nan  163.6197±79.5642                             nan
sl_4096_pythia-410m_lr_5.0                                             25.80±6.13      4674.35±1063.41   0.00±0.00         13.00±2.53              124                nan          nan  31.3606±43.2810                              nan
sl_4096_pythia-410m                                                    57.30±12.16     69.03±10.89       0.00±0.00         12.60±2.50               85                nan          nan  203.6905±31.0672                             nan
sl_4096_pythia-410m_lowdim_32_lowproj                                  102.60±34.78    1226.35±573.66    10145.40±3758.45  13.40±3.41               73                nan          nan  351.2602±112.3417                            nan
sl_4096_pythia-410m_lowdim_64_lowproj                                  102.80±30.96    2059.96±1136.54   8350.00±4104.56   15.50±3.85               84                nan          nan  352.2430±117.3033                            nan
sl_4096_pythia-410m_lowdim_128_lowproj                                 133.80±33.00    3382.83±954.02    11265.30±2285.20  18.90±2.34               97                nan          nan  460.4902±72.9850                             nan
sl_4096_pythia-410m_lowdim_256_lowproj                                 136.50±40.79    6811.96±1644.71   10353.20±3461.78  18.60±4.13              100                nan          nan  480.6429±122.4841                            nan
sl_4096_pythia-410m_lowdim_512_lowproj                                 155.90±40.95    9513.60±4638.55   11936.50±3802.79  21.10±2.62               95                nan          nan  528.5584±110.4659                            nan
================================================================================