Spaces:
Running
Running
\begin{tabular}{llcccccrr}
\toprule
\textbf{Model} & \textbf{Elo ($\uparrow$)} & \textbf{Norm.} & \textbf{Avg.} & \textbf{Harm.} & \textbf{\#wins ($\uparrow$)} & \textbf{Improva-} & \textbf{Train time} & \textbf{Predict time} \\
& & \textbf{score ($\uparrow$)} & \textbf{rank ($\downarrow$)} & \textbf{mean} & & \textbf{bility ($\downarrow$)} & \textbf{per 1K [s]} & \textbf{per 1K [s]} \\
& & & & \textbf{rank ($\downarrow$)} & & & & \\
\midrule
TabM (T+E) & \textcolor{gold}{\textbf{1574${}_{-28,+28}$}} & \textcolor{bronze}{\textbf{0.505}} & \textcolor{gold}{\textbf{9.6}} & 4.5 & 3 & \textcolor{bronze}{\textbf{8.2\%}} & 2466.21 & 1.50 \\
AutoGluon 1.3 (4h) & \textcolor{silver}{\textbf{1573${}_{-34,+30}$}} & \textcolor{gold}{\textbf{0.577}} & \textcolor{silver}{\textbf{9.7}} & \textcolor{silver}{\textbf{3.3}} & \textcolor{silver}{\textbf{6}} & \textcolor{gold}{\textbf{6.9\%}} & 1322.72 & 2.36 \\
RealMLP (T+E) & \textcolor{bronze}{\textbf{1552${}_{-30,+32}$}} & 0.470 & \textcolor{bronze}{\textbf{10.5}} & 7.4 & 0 & \textcolor{bronze}{\textbf{8.2\%}} & 6519.69 & 10.84 \\
LightGBM (T+E) & 1537${}_{-30,+26}$ & 0.421 & 11.1 & 6.4 & 1 & 9.8\% & 382.05 & 1.49 \\
TabICL (D) & 1530${}_{-31,+23}$ & \textcolor{silver}{\textbf{0.512}} & 11.4 & \textcolor{bronze}{\textbf{3.5}} & \textcolor{silver}{\textbf{6}} & \textcolor{silver}{\textbf{7.9\%}} & 8.68 & 1.74 \\
TabM (T) & 1487${}_{-30,+29}$ & 0.420 & 13.2 & 6.4 & 1 & 9.3\% & 2466.21 & 0.18 \\
CatBoost (T+E) & 1479${}_{-26,+24}$ & 0.395 & 13.6 & 8.7 & 0 & 9.1\% & 1372.94 & 0.56 \\
CatBoost (T) & 1469${}_{-27,+25}$ & 0.379 & 13.9 & 7.0 & 1 & 9.3\% & 1372.94 & 0.07 \\
LightGBM (T) & 1463${}_{-29,+30}$ & 0.336 & 14.3 & 12.1 & 0 & 10.6\% & 382.05 & 0.25 \\
CatBoost (D) & 1454${}_{-28,+23}$ & 0.362 & 14.7 & 7.1 & 1 & 10.3\% & 5.72 & 0.08 \\
TabPFNv2 (T+E) & 1454${}_{-31,+25}$ & 0.497 & 14.7 & \textcolor{gold}{\textbf{3.1}} & \textcolor{gold}{\textbf{8}} & 9.7\% & 3008.22 & 20.85 \\
XGBoost (T+E) & 1452${}_{-28,+31}$ & 0.332 & 14.8 & 9.3 & 0 & 10.7\% & 685.87 & 1.45 \\
ModernNCA (T) & 1416${}_{-34,+24}$ & 0.289 & 16.5 & 9.7 & 1 & 10.5\% & 4879.89 & 0.52 \\
XGBoost (T) & 1412${}_{-26,+28}$ & 0.279 & 16.6 & 13.3 & 0 & 11.1\% & 685.87 & 0.21 \\
ModernNCA (T+E) & 1410${}_{-28,+27}$ & 0.382 & 16.7 & 7.5 & 0 & 10.4\% & 4879.89 & 8.74 \\
TabPFNv2 (T) & 1388${}_{-30,+33}$ & 0.385 & 17.8 & 5.2 & 1 & 12.1\% & 3008.22 & 0.51 \\
TabM (D) & 1375${}_{-26,+30}$ & 0.280 & 18.3 & 11.8 & 0 & 12.6\% & 10.21 & 0.14 \\
TabPFNv2 (D) & 1366${}_{-31,+25}$ & 0.354 & 18.8 & 4.8 & 4 & 13.0\% & 3.37 & 0.32 \\
TorchMLP (T+E) & 1364${}_{-28,+29}$ & 0.233 & 19.1 & 14.8 & 0 & 11.6\% & 2389.22 & 2.16 \\
RealMLP (T) & 1357${}_{-27,+29}$ & 0.188 & 19.4 & 16.7 & 0 & 12.0\% & 6519.69 & 0.53 \\
EBM (T+E) & 1356${}_{-28,+26}$ & 0.188 & 19.3 & 13.5 & 0 & 14.9\% & 914.23 & 0.22 \\
FastaiMLP (T+E) & 1323${}_{-29,+23}$ & 0.203 & 21.0 & 12.4 & 0 & 14.6\% & 618.90 & 4.77 \\
ModernNCA (D) & 1306${}_{-28,+26}$ & 0.140 & 21.8 & 12.3 & 1 & 14.7\% & 14.78 & 0.35 \\
EBM (T) & 1295${}_{-30,+26}$ & 0.130 & 22.4 & 17.9 & 0 & 15.6\% & 914.23 & 0.03 \\
EBM (D) & 1265${}_{-36,+29}$ & 0.143 & 23.9 & 11.4 & 1 & 16.6\% & 4.31 & 0.05 \\
RealMLP (D) & 1253${}_{-27,+23}$ & 0.088 & 24.5 & 21.0 & 0 & 14.6\% & 21.83 & 0.90 \\
XGBoost (D) & 1253${}_{-31,+29}$ & 0.116 & 24.5 & 19.3 & 0 & 14.1\% & 1.77 & 0.12 \\
ExtraTrees (T+E) & 1252${}_{-29,+24}$ & 0.110 & 24.6 & 16.8 & 0 & 15.8\% & 189.76 & 0.74 \\
TabDPT (D) & 1239${}_{-35,+28}$ & 0.180 & 25.1 & 8.1 & 2 & 15.5\% & 22.61 & 8.55 \\
TorchMLP (T) & 1237${}_{-26,+26}$ & 0.106 & 25.1 & 21.7 & 0 & 14.1\% & 2389.22 & 0.15 \\
FastaiMLP (T) & 1220${}_{-29,+28}$ & 0.093 & 26.1 & 20.7 & 0 & 16.6\% & 618.90 & 0.30 \\
RandomForest (T+E) & 1214${}_{-24,+25}$ & 0.105 & 26.3 & 14.4 & 0 & 16.6\% & 323.74 & 0.74 \\
LightGBM (D) & 1198${}_{-28,+29}$ & 0.087 & 27.0 & 23.6 & 0 & 15.4\% & 1.79 & 0.12 \\
ExtraTrees (T) & 1196${}_{-33,+24}$ & 0.080 & 27.1 & 17.2 & 0 & 17.2\% & 189.76 & 0.08 \\
RandomForest (T) & 1159${}_{-33,+33}$ & 0.078 & 28.8 & 16.5 & 0 & 17.8\% & 323.74 & 0.08 \\
TorchMLP (D) & 1082${}_{-30,+22}$ & 0.023 & 32.0 & 29.3 & 0 & 19.3\% & 6.83 & 0.15 \\
FastaiMLP (D) & 1053${}_{-31,+29}$ & 0.031 & 33.1 & 29.9 & 0 & 22.1\% & 2.91 & 0.37 \\
RandomForest (D) & 1000${}_{-0,+0}$ & 0.013 & 34.8 & 32.9 & 0 & 24.1\% & 0.38 & 0.04 \\
Linear (T+E) & 998${}_{-37,+26}$ & 0.042 & 34.9 & 25.5 & 0 & 29.2\% & 51.79 & 0.22 \\
Linear (T) & 962${}_{-28,+24}$ & 0.027 & 36.1 & 30.6 & 0 & 30.1\% & 51.79 & 0.08 \\
Linear (D) & 951${}_{-30,+28}$ & 0.019 & 36.3 & 27.8 & 0 & 31.1\% & 1.61 & 0.10 \\
ExtraTrees (D) & 915${}_{-31,+32}$ & 0.010 & 37.3 & 34.3 & 0 & 26.7\% & 0.25 & 0.04 \\
KNN (T+E) & 688${}_{-46,+39}$ & 0.000 & 41.7 & 41.4 & 0 & 48.5\% & 2.97 & 0.19 \\
KNN (T) & 605${}_{-45,+48}$ & 0.000 & 42.7 & 42.5 & 0 & 50.3\% & 2.97 & 0.04 \\
KNN (D) & 462${}_{-71,+70}$ & 0.000 & 43.9 & 43.7 & 0 & 58.7\% & 0.07 & 0.02 \\
\bottomrule
\end{tabular}