add deprecated
Browse files
app.py
CHANGED
|
@@ -16,10 +16,24 @@ leader_component_values = [None] * 5
|
|
| 16 |
|
| 17 |
promo_banner = """
|
| 18 |
<div style="background-color: #ffcc00; color: black; padding: 10px; text-align: center; font-weight: bold; font-size: 18px; border: 2px solid #000;">
|
| 19 |
-
|
| 20 |
</div>
|
| 21 |
"""
|
| 22 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 23 |
def make_default_md_1():
|
| 24 |
leaderboard_md = f"""
|
| 25 |
# π LLM Arena in Russian: Leaderboard
|
|
@@ -136,14 +150,15 @@ def recompute_final_ranking(arena_df):
|
|
| 136 |
return list(ranking.values())
|
| 137 |
|
| 138 |
|
| 139 |
-
def get_arena_table(arena_df, model_table_df, arena_subset_df=None):
|
| 140 |
arena_df = arena_df.sort_values(
|
| 141 |
by=["final_ranking", "rating"], ascending=[True, False]
|
| 142 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
| 143 |
arena_df["final_ranking"] = recompute_final_ranking(arena_df)
|
| 144 |
-
arena_df = arena_df.sort_values(
|
| 145 |
-
by=["final_ranking", "rating"], ascending=[True, False]
|
| 146 |
-
)
|
| 147 |
|
| 148 |
# sort by rating
|
| 149 |
if arena_subset_df is not None:
|
|
@@ -319,6 +334,13 @@ def build_leaderboard_tab(
|
|
| 319 |
value=selected_category, # Default to selected_category
|
| 320 |
label="Category",
|
| 321 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 322 |
default_category_details = make_category_arena_leaderboard_md(
|
| 323 |
arena_df, arena_df, name=selected_category
|
| 324 |
)
|
|
@@ -458,7 +480,7 @@ def build_leaderboard_tab(
|
|
| 458 |
highlight_rank_max, subset=["Delta"]
|
| 459 |
)
|
| 460 |
|
| 461 |
-
def update_leaderboard_and_plots(category):
|
| 462 |
_, arena_dfs, category_elo_results, _ , model_table_df = read_elo_file(elo_results_file, leaderboard_table_file)
|
| 463 |
|
| 464 |
arena_subset_df = arena_dfs[category]
|
|
@@ -471,6 +493,7 @@ def build_leaderboard_tab(
|
|
| 471 |
arena_df,
|
| 472 |
model_table_df,
|
| 473 |
arena_subset_df=arena_subset_df if category != "Overall" else None,
|
|
|
|
| 474 |
)
|
| 475 |
if category != "Overall":
|
| 476 |
arena_values = update_leaderboard_df(arena_values)
|
|
@@ -546,7 +569,20 @@ def build_leaderboard_tab(
|
|
| 546 |
if leaderboard_table_file:
|
| 547 |
category_dropdown.change(
|
| 548 |
fn=update_leaderboard_and_plots,
|
| 549 |
-
inputs=[category_dropdown],
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 550 |
outputs=[
|
| 551 |
elo_display_df,
|
| 552 |
plot_1,
|
|
@@ -719,4 +755,4 @@ if __name__ == "__main__":
|
|
| 719 |
leaderboard_table_file = leaderboard_table_files[-1]
|
| 720 |
|
| 721 |
demo = build_demo(elo_result_file, leaderboard_table_file)
|
| 722 |
-
demo.launch(show_api=False)
|
|
|
|
| 16 |
|
| 17 |
promo_banner = """
|
| 18 |
<div style="background-color: #ffcc00; color: black; padding: 10px; text-align: center; font-weight: bold; font-size: 18px; border: 2px solid #000;">
|
| 19 |
+
USE THE LATEST VERSIONS OF THE BEST CHATBOTS IN RUSSIAN FOR FREE
|
| 20 |
</div>
|
| 21 |
"""
|
| 22 |
|
| 23 |
+
deprecated_model_name = [
|
| 24 |
+
"GigaChat 3.1.25.3",
|
| 25 |
+
"GigaChat-Pro 2.2.25.3",
|
| 26 |
+
"saiga_llama3_8b_v6",
|
| 27 |
+
"saiga_phi3_medium",
|
| 28 |
+
"GigaChat-Plus 3.1.25.3",
|
| 29 |
+
"GigaChat-Pro 4.0.26.8",
|
| 30 |
+
"GigaChat 4.0.26.8",
|
| 31 |
+
"xAI: Grok 2",
|
| 32 |
+
"GigaChat-Pro 4.0.26.15",
|
| 33 |
+
"GigaChat 4.0.26.15",
|
| 34 |
+
"YandexGPT Experimental", "yandex-gpt-arena"
|
| 35 |
+
]
|
| 36 |
+
|
| 37 |
def make_default_md_1():
|
| 38 |
leaderboard_md = f"""
|
| 39 |
# π LLM Arena in Russian: Leaderboard
|
|
|
|
| 150 |
return list(ranking.values())
|
| 151 |
|
| 152 |
|
| 153 |
+
def get_arena_table(arena_df, model_table_df, arena_subset_df=None, hidden_models=None):
|
| 154 |
arena_df = arena_df.sort_values(
|
| 155 |
by=["final_ranking", "rating"], ascending=[True, False]
|
| 156 |
)
|
| 157 |
+
|
| 158 |
+
if hidden_models:
|
| 159 |
+
arena_df = arena_df[~arena_df.index.isin(hidden_models)].copy() # Filter deprecated models
|
| 160 |
+
|
| 161 |
arena_df["final_ranking"] = recompute_final_ranking(arena_df)
|
|
|
|
|
|
|
|
|
|
| 162 |
|
| 163 |
# sort by rating
|
| 164 |
if arena_subset_df is not None:
|
|
|
|
| 334 |
value=selected_category, # Default to selected_category
|
| 335 |
label="Category",
|
| 336 |
)
|
| 337 |
+
with gr.Column(scale=2): # New CheckboxGroup for deprecated models
|
| 338 |
+
category_checkbox = gr.CheckboxGroup(
|
| 339 |
+
["Show Deprecated Models"],
|
| 340 |
+
label="Filter",
|
| 341 |
+
info="",
|
| 342 |
+
)
|
| 343 |
+
|
| 344 |
default_category_details = make_category_arena_leaderboard_md(
|
| 345 |
arena_df, arena_df, name=selected_category
|
| 346 |
)
|
|
|
|
| 480 |
highlight_rank_max, subset=["Delta"]
|
| 481 |
)
|
| 482 |
|
| 483 |
+
def update_leaderboard_and_plots(category, filters):
|
| 484 |
_, arena_dfs, category_elo_results, _ , model_table_df = read_elo_file(elo_results_file, leaderboard_table_file)
|
| 485 |
|
| 486 |
arena_subset_df = arena_dfs[category]
|
|
|
|
| 493 |
arena_df,
|
| 494 |
model_table_df,
|
| 495 |
arena_subset_df=arena_subset_df if category != "Overall" else None,
|
| 496 |
+
hidden_models=None if "Show Deprecated Models" in filters else deprecated_model_name # Pass filter value
|
| 497 |
)
|
| 498 |
if category != "Overall":
|
| 499 |
arena_values = update_leaderboard_df(arena_values)
|
|
|
|
| 569 |
if leaderboard_table_file:
|
| 570 |
category_dropdown.change(
|
| 571 |
fn=update_leaderboard_and_plots,
|
| 572 |
+
inputs=[category_dropdown, category_checkbox], # Pass checkbox value
|
| 573 |
+
outputs=[
|
| 574 |
+
elo_display_df,
|
| 575 |
+
plot_1,
|
| 576 |
+
plot_2,
|
| 577 |
+
plot_3,
|
| 578 |
+
plot_4,
|
| 579 |
+
more_stats_md,
|
| 580 |
+
category_deets,
|
| 581 |
+
],
|
| 582 |
+
)
|
| 583 |
+
category_checkbox.change( # Add a separate change handler for the checkbox
|
| 584 |
+
fn=update_leaderboard_and_plots,
|
| 585 |
+
inputs=[category_dropdown, category_checkbox],
|
| 586 |
outputs=[
|
| 587 |
elo_display_df,
|
| 588 |
plot_1,
|
|
|
|
| 755 |
leaderboard_table_file = leaderboard_table_files[-1]
|
| 756 |
|
| 757 |
demo = build_demo(elo_result_file, leaderboard_table_file)
|
| 758 |
+
demo.launch(show_api=False)
|