Upload ugi-leaderboard-data.csv
Browse files- ugi-leaderboard-data.csv +17 -10
ugi-leaderboard-data.csv
CHANGED
|
@@ -993,13 +993,20 @@ DavidAU/gemma-3-12b-it-vl-Polaris-GLM-4.7-Flash-VAR-Thinking-Instruct-Heretic-Un
|
|
| 993 |
stepfun-ai/Step-3.5-Flash,https://huggingface.co/stepfun-ai/Step-3.5-Flash,2/1/2026,2/11/2026,,11.0,196.0,196.0,FALSE,FALSE,TRUE,45.87,43.09,5.9,2.6,6.8,2.5,3.0,2.0,37.57,62.64,24.14,25.94,48.75,0.262,0.1421,0.4317,0.1623,0.2989,-26.3%,69.1%,45.8%,49.0%,64.4%,46.0%,63.1%,46.5%,28.1%,35.4%,29.2%,52.9%,58.5%,35.6%,67.5%,62.9%,62.9%,Liberalism,True,0,0,,25.0,0.59,14.1,4.7,0.373,42.0,100.0,0.865,0.408,0.351,1.437,0.111,0.253,50.4,8290.0,93.2,24.6,1.8,4.9
|
| 994 |
zai-org/GLM-5 (reasoning=disabled),https://huggingface.co/zai-org/GLM-5,2/11/2026,2/11/2026,,40.0,744.0,744.0,FALSE,FALSE,TRUE,49.22,36.74,2.9,4.8,5.2,1.2,1.0,1.5,49.38,58.32,51.72,38.1,44.32,0.3785,0.1321,0.5087,0.4566,0.4291,-21.0%,65.7%,47.2%,49.0%,62.6%,42.5%,60.4%,44.4%,33.5%,35.4%,34.0%,53.5%,50.6%,42.9%,59.0%,63.3%,65.6%,Liberalism,False,0,0,,37.1,0.74,11.7,5.5,0.401,36.0,98.0,0.854,0.432,0.348,1.197,0.454,0.383,38.4,8768.0,84.0,20.9,2.0,4.0
|
| 995 |
zai-org/GLM-5 (reasoning=enabled),https://huggingface.co/zai-org/GLM-5,2/11/2026,2/11/2026,,0.0,744.0,744.0,FALSE,FALSE,TRUE,55.03,61.28,8.8,7.4,7.4,0.8,0.0,1.5,55.34,62.6,58.62,44.8,78.09,0.5425,0.3827,0.6166,0.3635,0.3346,-20.7%,65.6%,44.5%,49.1%,61.0%,48.8%,61.7%,44.0%,33.8%,37.7%,31.9%,54.2%,51.7%,41.5%,58.8%,60.0%,64.2%,Liberalism,True,0,0,,42.0,0.82,11.9,5.1,0.38,34.0,90.0,0.835,0.431,0.35,1.437,0.063,0.313,27.5,3438.0,72.6,21.82,1.8,4.4
|
| 996 |
-
temaq-org/Tema_Q-R7.0,https://huggingface.co/temaq-org/Tema_Q-R7.0,12/26/2025,2/12/2026,gemma-3,12.0,12.0,12.0,
|
| 997 |
-
deepseek-ai/DeepSeek-R1-Distill-Qwen-14B,https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-14B,1/20/2025,2/12/2026,deepseek-r1 w/ <think> prefill,14.0,14.0,14.0,
|
| 998 |
-
temaq-org/Tema_Q-X-Thinking,https://huggingface.co/temaq-org/Tema_Q-X-Thinking,1/16/2026,2/12/2026,deepseek-r1 w/ <think> prefill,14.0,14.0,14.0,
|
| 999 |
-
sleepdeprived3/Christian-Bible-Expert-v2.0-24B,https://huggingface.co/sleepdeprived3/Christian-Bible-Expert-v2.0-24B,4/12/2025,2/12/2026,mistral V7-Tekken,24.0,24.0,24.0,
|
| 1000 |
-
sleepdeprived3/Christian-Bible-Expert-v2.0-12B,https://huggingface.co/sleepdeprived3/Christian-Bible-Expert-v2.0-12B,4/12/2025,2/12/2026,mistral V3-Tekken,12.0,12.0,12.0,
|
| 1001 |
-
MiniMaxAI/MiniMax-M2.5,https://huggingface.co/openrouter/minimax/minimax-m2.5,2/12/2026,2/12/2026,,,,,
|
| 1002 |
-
KaraKaraWitch/GoldDiamondGold-Abliterated-L33-70b,https://huggingface.co/KaraKaraWitch/GoldDiamondGold-Abliterated-L33-70b,2/10/2026,2/14/2026,llama-3,70.0,70.0,70.0,
|
| 1003 |
-
Silicone-Moss/TheDrummer-Skyfall-31B-v4.1-Heretic-Absolute,https://huggingface.co/Silicone-Moss/TheDrummer-Skyfall-31B-v4.1-Heretic-Absolute,2/10/2026,2/14/2026,mistral V7-Tekken,31.0,31.0,31.0,
|
| 1004 |
-
meta-llama/Llama-2-70b-chat-hf,https://huggingface.co/meta-llama/Llama-2-70b-chat-hf,7/18/2023,2/14/2026,llama-2-or-Codestral-22B-v0.1,70.0,70.0,70.0,
|
| 1005 |
-
Darkknight535/Void-Citrus-L3.3-70B,https://huggingface.co/Darkknight535/Void-Citrus-L3.3-70B,1/31/2026,2/15/2026,llama-3,70.0,70.0,70.0,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 993 |
stepfun-ai/Step-3.5-Flash,https://huggingface.co/stepfun-ai/Step-3.5-Flash,2/1/2026,2/11/2026,,11.0,196.0,196.0,FALSE,FALSE,TRUE,45.87,43.09,5.9,2.6,6.8,2.5,3.0,2.0,37.57,62.64,24.14,25.94,48.75,0.262,0.1421,0.4317,0.1623,0.2989,-26.3%,69.1%,45.8%,49.0%,64.4%,46.0%,63.1%,46.5%,28.1%,35.4%,29.2%,52.9%,58.5%,35.6%,67.5%,62.9%,62.9%,Liberalism,True,0,0,,25.0,0.59,14.1,4.7,0.373,42.0,100.0,0.865,0.408,0.351,1.437,0.111,0.253,50.4,8290.0,93.2,24.6,1.8,4.9
|
| 994 |
zai-org/GLM-5 (reasoning=disabled),https://huggingface.co/zai-org/GLM-5,2/11/2026,2/11/2026,,40.0,744.0,744.0,FALSE,FALSE,TRUE,49.22,36.74,2.9,4.8,5.2,1.2,1.0,1.5,49.38,58.32,51.72,38.1,44.32,0.3785,0.1321,0.5087,0.4566,0.4291,-21.0%,65.7%,47.2%,49.0%,62.6%,42.5%,60.4%,44.4%,33.5%,35.4%,34.0%,53.5%,50.6%,42.9%,59.0%,63.3%,65.6%,Liberalism,False,0,0,,37.1,0.74,11.7,5.5,0.401,36.0,98.0,0.854,0.432,0.348,1.197,0.454,0.383,38.4,8768.0,84.0,20.9,2.0,4.0
|
| 995 |
zai-org/GLM-5 (reasoning=enabled),https://huggingface.co/zai-org/GLM-5,2/11/2026,2/11/2026,,0.0,744.0,744.0,FALSE,FALSE,TRUE,55.03,61.28,8.8,7.4,7.4,0.8,0.0,1.5,55.34,62.6,58.62,44.8,78.09,0.5425,0.3827,0.6166,0.3635,0.3346,-20.7%,65.6%,44.5%,49.1%,61.0%,48.8%,61.7%,44.0%,33.8%,37.7%,31.9%,54.2%,51.7%,41.5%,58.8%,60.0%,64.2%,Liberalism,True,0,0,,42.0,0.82,11.9,5.1,0.38,34.0,90.0,0.835,0.431,0.35,1.437,0.063,0.313,27.5,3438.0,72.6,21.82,1.8,4.4
|
| 996 |
+
temaq-org/Tema_Q-R7.0,https://huggingface.co/temaq-org/Tema_Q-R7.0,12/26/2025,2/12/2026,gemma-3,12.0,12.0,12.0,TRUE,FALSE,FALSE,29.73,34.23,2.4,1.3,1.2,9.5,10.0,9.0,18.29,16.28,18.28,20.32,15.24,0.2541,0.1561,0.1439,0.2208,0.241,-10.6%,59.6%,48.3%,43.3%,61.9%,39.8%,63.5%,48.1%,42.1%,39.6%,39.6%,44.2%,45.6%,40.2%,56.5%,60.6%,68.5%,Liberalism,False,0,0,Gemma3ForConditionalGeneration,31.7,0.8,15.4,7.0,0.297,11.0,86.0,0.892,0.429,0.289,1.553,0.326,0.258,51.4,7701.0,154.0,23.58,3.9,3.5
|
| 997 |
+
deepseek-ai/DeepSeek-R1-Distill-Qwen-14B,https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-14B,1/20/2025,2/12/2026,deepseek-r1 w/ <think> prefill,14.0,14.0,14.0,TRUE,FALSE,FALSE,26.29,19.64,2.4,1.5,1.0,3.2,6.0,0.5,16.39,23.47,12.41,13.28,15.62,0.0822,0.098,0.052,0.2496,0.1821,-27.4%,66.6%,48.1%,53.5%,59.6%,47.9%,59.2%,51.2%,31.2%,35.8%,33.1%,61.2%,61.2%,38.1%,52.9%,62.9%,63.1%,Liberalism,True,2612,0,Qwen2ForCausalLM,29.4,0.81,13.0,7.0,0.323,60.0,76.0,0.89,0.458,0.308,1.53,0.429,0.139,100.2,10978.0,223.8,23.17,0.5,5.2
|
| 998 |
+
temaq-org/Tema_Q-X-Thinking,https://huggingface.co/temaq-org/Tema_Q-X-Thinking,1/16/2026,2/12/2026,deepseek-r1 w/ <think> prefill,14.0,14.0,14.0,TRUE,FALSE,FALSE,24.94,28.63,2.9,1.3,1.3,6.5,8.0,5.0,13.81,19.36,7.93,14.13,17.26,0.1109,0.1381,0.1187,0.099,0.2399,-21.0%,62.3%,47.7%,52.1%,56.8%,48.5%,60.4%,52.1%,30.8%,50.0%,32.3%,50.2%,55.8%,50.2%,44.2%,60.8%,65.8%,Liberalism,True,2312,0,Qwen2ForCausalLM,30.7,0.73,12.7,6.6,0.302,65.0,66.0,0.866,0.429,0.284,1.467,0.591,0.243,84.9,8477.0,165.8,26.2,1.0,1.8
|
| 999 |
+
sleepdeprived3/Christian-Bible-Expert-v2.0-24B,https://huggingface.co/sleepdeprived3/Christian-Bible-Expert-v2.0-24B,4/12/2025,2/12/2026,mistral V7-Tekken,24.0,24.0,24.0,TRUE,FALSE,FALSE,36.83,31.17,2.4,2.4,1.4,6.5,6.0,7.0,28.13,36.08,23.1,25.21,20.6,0.3057,0.167,0.191,0.2828,0.3138,-19.9%,64.5%,45.8%,42.8%,60.6%,41.7%,67.5%,46.5%,36.5%,39.6%,30.4%,51.0%,46.0%,31.5%,59.6%,61.7%,60.6%,Liberalism,False,0,0,MistralForCausalLM,43.4,0.88,12.4,5.8,0.339,11.0,35.0,0.898,0.49,0.286,1.337,0.4,0.272,45.2,7299.0,137.5,22.73,1.8,3.1
|
| 1000 |
+
sleepdeprived3/Christian-Bible-Expert-v2.0-12B,https://huggingface.co/sleepdeprived3/Christian-Bible-Expert-v2.0-12B,4/12/2025,2/12/2026,mistral V3-Tekken,12.0,12.0,12.0,TRUE,FALSE,FALSE,34.63,28.86,2.9,1.6,1.7,5.8,7.0,4.5,21.14,22.11,17.93,23.38,19.91,0.122,0.1497,0.1597,0.4425,0.295,-16.0%,61.7%,44.9%,44.5%,63.1%,47.5%,60.2%,42.3%,44.2%,37.1%,33.5%,43.1%,49.4%,41.0%,61.5%,61.2%,66.7%,Liberalism,False,0,0,MistralForCausalLM,44.6,0.79,12.6,6.1,0.351,17.0,46.0,0.892,0.47,0.314,1.383,0.376,0.268,80.5,7958.0,147.9,21.03,2.6,3.9
|
| 1001 |
+
MiniMaxAI/MiniMax-M2.5,https://huggingface.co/openrouter/minimax/minimax-m2.5,2/12/2026,2/12/2026,,,,,FALSE,FALSE,TRUE,NA,19.29,3.5,2.1,1.3,1.0,1.0,1.0,38.64,50.45,30.69,34.78,22.19,0.338,0.0872,0.5145,0.471,0.3284,-17.4%,65.4%,49.9%,42.7%,56.9%,35.4%,60.4%,45.6%,38.8%,35.8%,29.2%,44.2%,49.8%,34.2%,52.7%,58.3%,59.6%,Liberalism,False,0,0,,NA,NA,NA,NA,NA,NA,NA,NA,NA,NA,1.337,0.302,0.284,42.0,11961.0,83.4,20.77,NA,NA
|
| 1002 |
+
KaraKaraWitch/GoldDiamondGold-Abliterated-L33-70b,https://huggingface.co/KaraKaraWitch/GoldDiamondGold-Abliterated-L33-70b,2/10/2026,2/14/2026,llama-3,70.0,70.0,70.0,TRUE,TRUE,FALSE,42.25,47.64,4.1,3.5,3.8,8.0,8.0,8.0,30.61,36.47,30.69,24.65,37.53,0.2432,0.2138,0.1725,0.3356,0.2676,-11.7%,57.1%,49.8%,44.9%,62.0%,42.1%,57.1%,48.5%,44.6%,45.0%,39.2%,46.2%,43.8%,44.6%,58.8%,61.7%,65.6%,Liberalism,False,0,0,LlamaForCausalLM,41.4,0.98,13.5,5.7,0.344,27.0,76.0,0.908,0.491,0.272,1.49,0.415,0.293,52.9,5957.0,143.4,22.12,7.8,6.3
|
| 1003 |
+
Silicone-Moss/TheDrummer-Skyfall-31B-v4.1-Heretic-Absolute,https://huggingface.co/Silicone-Moss/TheDrummer-Skyfall-31B-v4.1-Heretic-Absolute,2/10/2026,2/14/2026,mistral V7-Tekken,31.0,31.0,31.0,TRUE,FALSE,FALSE,42.37,34.64,2.4,1.6,3.1,7.2,8.0,6.5,23.49,29.14,16.21,25.14,22.81,0.1955,0.1657,0.2805,0.3148,0.3004,-8.5%,58.5%,43.1%,46.1%,56.2%,47.5%,66.0%,42.7%,41.7%,40.4%,42.3%,54.6%,43.8%,40.0%,51.5%,55.8%,61.2%,Liberalism,False,0,0,MistralForCausalLM,55.6,0.97,13.8,5.4,0.306,22.0,46.0,0.846,0.441,0.287,1.487,0.18,0.31,60.9,7344.0,116.3,22.35,3.7,3.4
|
| 1004 |
+
meta-llama/Llama-2-70b-chat-hf,https://huggingface.co/meta-llama/Llama-2-70b-chat-hf,7/18/2023,2/14/2026,llama-2-or-Codestral-22B-v0.1,70.0,70.0,70.0,FALSE,FALSE,TRUE,NA,4.26,0.6,0.0,1.2,0.0,0.0,0.0,18.23,17.7,24.48,12.51,5.59,0.0447,0.1447,0.1302,0.1385,0.1674,-23.2%,60.7%,43.9%,49.4%,62.3%,45.0%,60.0%,36.7%,41.9%,42.5%,33.5%,52.1%,60.4%,35.8%,57.9%,62.1%,66.9%,Liberalism,False,0,0,LlamaForCausalLM,NA,NA,NA,NA,NA,NA,NA,NA,NA,NA,1.843,0.533,0.238,138.7,8173.0,160.1,25.12,NA,NA
|
| 1005 |
+
Darkknight535/Void-Citrus-L3.3-70B,https://huggingface.co/Darkknight535/Void-Citrus-L3.3-70B,1/31/2026,2/15/2026,llama-3,70.0,70.0,70.0,TRUE,TRUE,FALSE,21.09,23.49,1.2,2.3,1.1,4.8,5.0,4.5,26.55,30.53,32.41,16.71,15.98,0.1002,0.1738,0.0845,0.2545,0.2227,-1.4%,54.4%,50.3%,44.0%,56.5%,43.8%,56.2%,51.0%,45.0%,46.7%,45.2%,48.1%,36.9%,47.1%,55.2%,54.8%,59.4%,Centrism,False,0,0,LlamaForCausalLM,36.8,0.87,18.0,10.2,0.266,31.0,62.0,0.9,0.446,0.21,1.618,0.312,0.247,89.9,7067.0,188.1,23.1,7.4,7.1
|
| 1006 |
+
MuXodious/GLM-4.7-Flash-absolute-heresy (glm-4.7 w/ <think> prefill),https://huggingface.co/MuXodious/GLM-4.7-Flash-absolute-heresy,2/14/2026,2/16/2026,glm-4.7 w/ <think> prefill,3.0,30.0,30.0,TRUE,FALSE,FALSE,15.3,35.6,1.8,1.9,1.2,9.8,10.0,9.5,20.6,38.9,10.0,12.91,16.26,0.1293,0.0999,0.0902,0.0654,0.2606,-2.3%,53.2%,46.9%,40.4%,57.4%,51.2%,55.2%,47.3%,46.9%,56.2%,37.3%,44.2%,27.7%,49.4%,50.6%,54.8%,66.9%,Centrism,True,9388,3,Glm4MoeLiteForCausalLM,25.4,0.66,11.8,5.2,0.374,163.0,100.0,0.843,0.41,0.391,1.53,0.144,0.242,77.9,10828.0,183.6,27.55,3.2,3.8
|
| 1007 |
+
MuXodious/GLM-4.7-Flash-absolute-heresy (glm-4.7 (no-think)),https://huggingface.co/MuXodious/GLM-4.7-Flash-absolute-heresy,2/14/2026,2/16/2026,glm-4.7 (no-think),3.0,30.0,30.0,TRUE,FALSE,FALSE,19.8,32.37,1.2,1.5,1.8,8.8,8.0,9.5,16.5,17.68,16.9,14.93,15.14,0.0616,0.1512,0.1083,0.1988,0.2265,-11.7%,55.7%,51.7%,50.6%,55.0%,41.7%,53.1%,49.8%,46.9%,46.2%,39.8%,53.3%,48.3%,50.0%,49.8%,56.5%,58.8%,Centrism,False,0,5,Glm4MoeLiteForCausalLM,32.4,0.74,11.5,5.0,0.362,40.0,92.0,0.852,0.459,0.383,1.676,0.023,0.197,117.1,7896.0,171.6,23.93,4.9,5.1
|
| 1008 |
+
darkc0de/XortronCriminalComputingConfig-heretic-1.2.0,https://huggingface.co/darkc0de/XortronCriminalComputingConfig-heretic-1.2.0,2/16/2026,2/16/2026,mistral V7-Tekken,24.0,24.0,24.0,TRUE,TRUE,FALSE,36.58,41.74,1.8,2.9,3.1,9.0,9.0,9.0,26.42,28.23,20.69,30.34,26.66,0.3047,0.2553,0.307,0.3619,0.2881,-14.7%,59.7%,45.6%,44.9%,57.7%,48.8%,63.8%,49.4%,37.9%,47.1%,35.8%,52.9%,44.8%,36.9%,46.2%,59.0%,67.9%,Liberalism,False,0,0,MistralForCausalLM,45.9,0.9,12.7,5.5,0.356,11.0,18.0,0.907,0.504,0.306,1.33,0.537,0.231,45.3,5103.0,111.5,21.83,1.8,0.6
|
| 1009 |
+
darkc0de/XortronCriminalComputingConfig-heretic,https://huggingface.co/darkc0de/XortronCriminalComputingConfig-heretic,2/1/2026,2/16/2026,mistral V7-Tekken,24.0,24.0,24.0,TRUE,TRUE,FALSE,34.13,41.74,1.8,2.9,3.1,9.0,9.0,9.0,24.45,28.79,17.93,26.62,26.66,0.3047,0.1982,0.3115,0.2633,0.2534,-14.1%,58.9%,46.0%,45.1%,60.8%,47.7%,63.8%,49.4%,39.4%,47.5%,36.5%,52.7%,45.4%,37.3%,57.1%,58.5%,66.7%,Liberalism,False,0,1,MistralForCausalLM,44.4,0.92,12.6,5.6,0.356,11.0,16.0,0.904,0.507,0.301,1.377,0.548,0.199,45.3,6346.0,110.7,22.98,2.1,0.7
|
| 1010 |
+
Qwen/Qwen3.5-397B-A17B (reasoning=enabled),https://huggingface.co/Qwen/Qwen3.5-397B-A17B,2/16/2026,2/16/2026,,17.0,397.0,397.0,FALSE,FALSE,TRUE,49.39,38.95,4.7,3.8,5.6,1.5,2.0,1.0,46.27,66.11,30.34,42.35,46.44,0.3891,0.2922,0.692,0.4096,0.3345,-17.0%,66.1%,46.2%,44.2%,55.6%,44.8%,66.0%,49.6%,33.3%,35.2%,33.1%,47.1%,51.5%,34.0%,49.4%,59.4%,57.9%,Liberalism,True,0,0,,33.9,0.74,11.4,5.2,0.35,9.0,68.0,0.857,0.42,0.333,1.38,0.28,0.329,37.6,4510.0,64.9,21.35,1.1,2.9
|
| 1011 |
+
Qwen/Qwen3.5-397B-A17B (reasoning=disabled),https://huggingface.co/Qwen/Qwen3.5-397B-A17B,2/16/2026,2/16/2026,,17.0,397.0,397.0,FALSE,FALSE,TRUE,52.7,22.25,1.8,2.8,2.0,2.0,3.0,1.0,44.13,61.04,33.1,38.25,22.95,0.3758,0.3419,0.5759,0.3251,0.2937,-18.9%,64.6%,48.4%,45.0%,57.5%,43.8%,61.9%,50.8%,36.7%,37.1%,32.5%,47.3%,49.8%,37.9%,47.7%,62.3%,62.5%,Liberalism,False,0,0,,37.4,0.7,13.2,6.5,0.329,21.0,98.0,0.845,0.441,0.326,1.547,0.082,0.302,38.7,3869.0,76.8,22.23,2.2,5.0
|
| 1012 |
+
ServiceNow-AI/Apriel-1.6-15b-Thinker,https://huggingface.co/ServiceNow-AI/Apriel-1.6-15b-Thinker,12/8/2025,2/16/2026,Apriel-1.6,15.0,15.0,15.0,FALSE,FALSE,TRUE,-5.89,12.1,1.8,0.6,0.5,2.2,3.0,1.5,23.63,37.47,7.93,25.48,8.85,0.3551,0.1421,0.3078,0.208,0.2612,-16.0%,64.9%,41.9%,40.2%,63.2%,44.6%,67.5%,37.9%,36.9%,35.6%,32.7%,40.0%,39.0%,41.7%,61.7%,67.3%,60.6%,Liberalism,True,13176,5,LlavaForConditionalGeneration,27.2,0.69,16.1,9.1,0.248,347.0,98.0,0.785,0.385,0.309,1.363,0.565,0.207,40.4,8287.0,111.4,23.78,2.0,2.8
|