Spaces:
Running
Running
Upload 2 files
Browse files- app.py +9 -3
- fmnb-leaderboard-data.csv +37 -34
app.py
CHANGED
|
@@ -511,6 +511,9 @@ columnDefs = [
|
|
| 511 |
create_numeric_column("16k 🪡", width=100, filterParams={
|
| 512 |
"defaultOption": "greaterThanOrEqual"
|
| 513 |
}),
|
|
|
|
|
|
|
|
|
|
| 514 |
# Misc Columns
|
| 515 |
{
|
| 516 |
"field": "Size",
|
|
@@ -658,17 +661,20 @@ app.layout = html.Div([
|
|
| 658 |
html.Div([
|
| 659 |
html.H3("Info", style={'fontSize': '22px', 'marginBottom': '0px'}),
|
| 660 |
|
| 661 |
-
html.P([html.Strong(""), "
|
|
|
|
|
|
|
|
|
|
| 662 |
style={'marginTop': '7px', 'marginBottom': '4px'}),
|
| 663 |
|
| 664 |
-
html.P([html.Strong("Score:"), " Primarily based on the scoring in the multi-needle test at 8k / 16k context, weighted towards 16k."],
|
| 665 |
style={'marginTop': '7px', 'marginBottom': '4px'}),
|
| 666 |
|
| 667 |
html.P([html.Strong("Behavior:"), " Qualitative assessment of the model's behavior during the evaluation. User discretion is advised, as it only has a minor impact on the final score."], style={'marginTop': '7px', 'marginBottom': '4px'}),
|
| 668 |
|
| 669 |
html.P([html.Strong("Difficulty:"), " The current difficulty is only set at a medium level. (Silver Tier 1)"], style={'marginTop': '7px', 'marginBottom': '4px'}),
|
| 670 |
|
| 671 |
-
html.P([html.Strong("Version:"), " 4.
|
| 672 |
|
| 673 |
html.Br(),
|
| 674 |
|
|
|
|
| 511 |
create_numeric_column("16k 🪡", width=100, filterParams={
|
| 512 |
"defaultOption": "greaterThanOrEqual"
|
| 513 |
}),
|
| 514 |
+
create_numeric_column("32k 🪡", width=100, filterParams={
|
| 515 |
+
"defaultOption": "greaterThanOrEqual"
|
| 516 |
+
}),
|
| 517 |
# Misc Columns
|
| 518 |
{
|
| 519 |
"field": "Size",
|
|
|
|
| 661 |
html.Div([
|
| 662 |
html.H3("Info", style={'fontSize': '22px', 'marginBottom': '0px'}),
|
| 663 |
|
| 664 |
+
html.P([html.Strong("Version 4.1:"), " Thanks to compute generously provided by an anonymous source, this latest version now includes 32k context scoring data (not included in the overall score) and adds a number of larger models into the mix!"],
|
| 665 |
+
style={'marginTop': '7px', 'marginBottom': '4px'}),
|
| 666 |
+
|
| 667 |
+
html.P([html.Strong("Info:"), " This latest iteration of the leaderboard has finally made it to Hugging Face with extended functionality based on the UGI leaderboard, enjoy!"],
|
| 668 |
style={'marginTop': '7px', 'marginBottom': '4px'}),
|
| 669 |
|
| 670 |
+
html.P([html.Strong("Score:"), " Primarily based on the scoring in the multi-needle test at 8k / 16k context, weighted towards 16k. The 32k scoring is not included."],
|
| 671 |
style={'marginTop': '7px', 'marginBottom': '4px'}),
|
| 672 |
|
| 673 |
html.P([html.Strong("Behavior:"), " Qualitative assessment of the model's behavior during the evaluation. User discretion is advised, as it only has a minor impact on the final score."], style={'marginTop': '7px', 'marginBottom': '4px'}),
|
| 674 |
|
| 675 |
html.P([html.Strong("Difficulty:"), " The current difficulty is only set at a medium level. (Silver Tier 1)"], style={'marginTop': '7px', 'marginBottom': '4px'}),
|
| 676 |
|
| 677 |
+
html.P([html.Strong("Version:"), " 4.1"], style={'marginTop': '7px', 'marginBottom': '4px'}),
|
| 678 |
|
| 679 |
html.Br(),
|
| 680 |
|
fmnb-leaderboard-data.csv
CHANGED
|
@@ -1,34 +1,37 @@
|
|
| 1 |
-
author/model_name,Score,Behavior,8k 🪡,16k 🪡,Size,New,Base,Model Link,Settings
|
| 2 |
-
TheDrummer/Cydonia-24B-v4.1,93,10,94,93
|
| 3 |
-
mistralai/Mistral-Small-3.2-24B-Instruct-2506,88,10,92,86
|
| 4 |
-
ConicCat/Mistral-Small-3.2-AntiRep-24B,87,10,94,83
|
| 5 |
-
TheDrummer/Cydonia-R1-24B-v4,84,10,85,83
|
| 6 |
-
TheDrummer/Cydonia-24B-v4,78,10,86,74
|
| 7 |
-
zerofata/MS3.2-PaintedFantasy-v2-24B,78,10,89,72
|
| 8 |
-
kyx0r/Neona-12B,75,9,92,70
|
| 9 |
-
DreadPoor/Irix-12B-Model_Stock,73,8,91,70
|
| 10 |
-
Nitral-AI/CaptainErisNebula-12B-AE-v1,71,9,92,64
|
| 11 |
-
Doctor-Shotgun/MS3.2-24B-Magnum-Diamond,68,9,69,71
|
| 12 |
-
Entropicengine/Pinecone-Rune-12b,68,9,87,61
|
| 13 |
-
DreadPoor/Ward-12B-Model_Stock,67,9,86,61
|
| 14 |
-
yamatazen/LorablatedStock-12B,67,9,88,60
|
| 15 |
-
Nitral-AI/CaptainErisNebula-12B-AE-v1r,67,8,91,61
|
| 16 |
-
Nitral-AI/Irixxed-Magcap-12B-Slerp,66,7,91,62
|
| 17 |
-
TheDrummer/Rocinante-12B-v1.1,66,8,83,63
|
| 18 |
-
Nitral-AI/CaptainErisNebula-12B-Chimera-v1.1,64,8,85,59
|
| 19 |
-
SicariusSicariiStuff/Impish_Longtail_12B_GGUF_HA,63,9,87,54
|
| 20 |
-
mistralai/Mistral-Nemo-Instruct-2407,55,9,76,48
|
| 21 |
-
inflatebot/MN-12B-Mag-Mell-R1,53,7,79,49
|
| 22 |
-
grimjim/MagnaMellRei-v1-12B,52,8,79,45
|
| 23 |
-
ConicCat/NemoPlotter-12B,52,7,71,51
|
| 24 |
-
SicariusSicariiStuff/Impish_Nemo_12B,49,8,72,43
|
| 25 |
-
pot99rta/PatriSlush-DarkRPMax-12B,47,8,69,42
|
| 26 |
-
ReadyArt/The-Omega-Directive-M-12B-v1.0,42,7,67,39
|
| 27 |
-
CrucibleLab/M3.2-24B-Loki-V1.3,82,10,92,77
|
| 28 |
-
LatitudeGames/Wayfarer-2-12B ,43,7,66,41
|
| 29 |
-
LatitudeGames/Muse-2-12B ,63,7,84,62
|
| 30 |
-
Retreatcost/KansenSakura-Radiance-RP-12b,46,6,68,47
|
| 31 |
-
TheDrummer/Cydonia-24B-v4.2.0,94,10,95,94
|
| 32 |
-
mistralai/Magistral-Small-2509,88,10,95,81
|
| 33 |
-
zai-org/GLM-4.5-Air,99,10,100,99,110B,π,TRUE,https://huggingface.co/zai-org/GLM-4.5-Air,
|
| 34 |
-
TheDrummer/Skyfall-31B-v4,87,10,94,83,31B
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
author/model_name,Score,Behavior,8k 🪡,16k 🪡,32k 🪡,Size,New,Base,Model Link,Settings
|
| 2 |
+
TheDrummer/Cydonia-24B-v4.1,93,10,94,93,,24B,,,https://huggingface.co/TheDrummer/Cydonia-24B-v4.1,
|
| 3 |
+
mistralai/Mistral-Small-3.2-24B-Instruct-2506,88,10,92,86,,24B,,TRUE,https://huggingface.co/mistralai/Mistral-Small-3.2-24B-Instruct-2506,
|
| 4 |
+
ConicCat/Mistral-Small-3.2-AntiRep-24B,87,10,94,83,,24B,,,https://huggingface.co/ConicCat/Mistral-Small-3.2-AntiRep-24B,
|
| 5 |
+
TheDrummer/Cydonia-R1-24B-v4,84,10,85,83,,24B,,,https://huggingface.co/TheDrummer/Cydonia-R1-24B-v4,
|
| 6 |
+
TheDrummer/Cydonia-24B-v4,78,10,86,74,,24B,,,https://huggingface.co/TheDrummer/Cydonia-24B-v4,
|
| 7 |
+
zerofata/MS3.2-PaintedFantasy-v2-24B,78,10,89,72,,24B,,,https://huggingface.co/zerofata/MS3.2-PaintedFantasy-v2-24B,
|
| 8 |
+
kyx0r/Neona-12B,75,9,92,70,,12B,,,https://huggingface.co/kyx0r/Neona-12B,1
|
| 9 |
+
DreadPoor/Irix-12B-Model_Stock,73,8,91,70,,12B,,,https://huggingface.co/DreadPoor/Irix-12B-Model_Stock,1
|
| 10 |
+
Nitral-AI/CaptainErisNebula-12B-AE-v1,71,9,92,64,,12B,,,https://huggingface.co/Nitral-AI/CaptainErisNebula-12B-AE-v1,1
|
| 11 |
+
Doctor-Shotgun/MS3.2-24B-Magnum-Diamond,68,9,69,71,,24B,,,https://huggingface.co/Doctor-Shotgun/MS3.2-24B-Magnum-Diamond,
|
| 12 |
+
Entropicengine/Pinecone-Rune-12b,68,9,87,61,,12B,,,https://huggingface.co/Entropicengine/Pinecone-Rune-12b,1 & 2
|
| 13 |
+
DreadPoor/Ward-12B-Model_Stock,67,9,86,61,,12B,,,https://huggingface.co/DreadPoor/Ward-12B-Model_Stock,1
|
| 14 |
+
yamatazen/LorablatedStock-12B,67,9,88,60,,12B,,,https://huggingface.co/yamatazen/LorablatedStock-12B,1
|
| 15 |
+
Nitral-AI/CaptainErisNebula-12B-AE-v1r,67,8,91,61,,12B,,,https://huggingface.co/Nitral-AI/CaptainErisNebula-12B-AE-v1r,1
|
| 16 |
+
Nitral-AI/Irixxed-Magcap-12B-Slerp,66,7,91,62,,12B,,,https://huggingface.co/Nitral-AI/Irixxed-Magcap-12B-Slerp,1
|
| 17 |
+
TheDrummer/Rocinante-12B-v1.1,66,8,83,63,,12B,,,https://huggingface.co/TheDrummer/Rocinante-12B-v1.1,1
|
| 18 |
+
Nitral-AI/CaptainErisNebula-12B-Chimera-v1.1,64,8,85,59,,12B,,,https://huggingface.co/Nitral-AI/CaptainErisNebula-12B-Chimera-v1.1,1
|
| 19 |
+
SicariusSicariiStuff/Impish_Longtail_12B_GGUF_HA,63,9,87,54,,12B,,,https://huggingface.co/SicariusSicariiStuff/Impish_Longtail_12B_GGUF_HA,1
|
| 20 |
+
mistralai/Mistral-Nemo-Instruct-2407,55,9,76,48,,12B,,TRUE,https://huggingface.co/mistralai/Mistral-Nemo-Instruct-2407,1
|
| 21 |
+
inflatebot/MN-12B-Mag-Mell-R1,53,7,79,49,,12B,,,https://huggingface.co/inflatebot/MN-12B-Mag-Mell-R1,1 & 2
|
| 22 |
+
grimjim/MagnaMellRei-v1-12B,52,8,79,45,,12B,,,https://huggingface.co/grimjim/MagnaMellRei-v1-12B,1
|
| 23 |
+
ConicCat/NemoPlotter-12B,52,7,71,51,,12B,,,https://huggingface.co/ConicCat/NemoPlotter-12B,1
|
| 24 |
+
SicariusSicariiStuff/Impish_Nemo_12B,49,8,72,43,,12B,,,https://huggingface.co/SicariusSicariiStuff/Impish_Nemo_12B,1
|
| 25 |
+
pot99rta/PatriSlush-DarkRPMax-12B,47,8,69,42,,12B,,,https://huggingface.co/pot99rta/PatriSlush-DarkRPMax-12B,1
|
| 26 |
+
ReadyArt/The-Omega-Directive-M-12B-v1.0,42,7,67,39,,12B,,,https://huggingface.co/ReadyArt/The-Omega-Directive-M-12B-v1.0,1
|
| 27 |
+
CrucibleLab/M3.2-24B-Loki-V1.3,82,10,92,77,,24B,,,https://huggingface.co/CrucibleLab/M3.2-24B-Loki-V1.3,
|
| 28 |
+
LatitudeGames/Wayfarer-2-12B,43,7,66,41,,12B,,,https://huggingface.co/LatitudeGames/Wayfarer-2-12B,1
|
| 29 |
+
LatitudeGames/Muse-2-12B,63,7,84,62,,12B,,,https://huggingface.co/LatitudeGames/Muse-2-12B,1
|
| 30 |
+
Retreatcost/KansenSakura-Radiance-RP-12b,46,6,68,47,,12B,,,https://huggingface.co/Retreatcost/KansenSakura-Radiance-RP-12b,1
|
| 31 |
+
TheDrummer/Cydonia-24B-v4.2.0,94,10,95,94,,24B,,,https://huggingface.co/TheDrummer/Cydonia-24B-v4.2.0,v4l
|
| 32 |
+
mistralai/Magistral-Small-2509,88,10,95,81,,24B,π,TRUE,https://huggingface.co/mistralai/Magistral-Small-2509,
|
| 33 |
+
zai-org/GLM-4.5-Air,99,10,100,99,92,110B,π,TRUE,https://huggingface.co/zai-org/GLM-4.5-Air,
|
| 34 |
+
TheDrummer/Skyfall-31B-v4,87,10,94,83,54,31B,π,,https://huggingface.co/TheDrummer/Skyfall-31B-v4,
|
| 35 |
+
meta-llama/Llama-3.3-70B-Instruct,100,10,100,100,89,70B,π,TRUE,https://huggingface.co/meta-llama/Llama-3.3-70B-Instruct,
|
| 36 |
+
zerofata/MS3.2-PaintedFantasy-Visage-v3-34B,79,10,80,79,54,34B,π,,https://huggingface.co/zerofata/MS3.2-PaintedFantasy-Visage-v3-34B,
|
| 37 |
+
meta-llama/Llama-4-Scout-17B-16E-Instruct,83,9,100,77,39,109B,π,TRUE,https://huggingface.co/meta-llama/Llama-4-Scout-17B-16E-Instruct,
|