LLMArena committed on
Commit
38cea8b
·
verified ·
1 Parent(s): 1aaa52c

add deprecated

Browse files
Files changed (1) hide show
  1. app.py +44 -8
app.py CHANGED
@@ -16,10 +16,24 @@ leader_component_values = [None] * 5
16
 
17
  promo_banner = """
18
  <div style="background-color: #ffcc00; color: black; padding: 10px; text-align: center; font-weight: bold; font-size: 18px; border: 2px solid #000;">
19
- llmarena.ru - USE THE LATEST VERSIONS OF THE BEST CHATBOTS IN RUSSIAN FOR FREE
20
  </div>
21
  """
22
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
23
  def make_default_md_1():
24
  leaderboard_md = f"""
25
  # πŸ† LLM Arena in Russian: Leaderboard
@@ -136,14 +150,15 @@ def recompute_final_ranking(arena_df):
136
  return list(ranking.values())
137
 
138
 
139
- def get_arena_table(arena_df, model_table_df, arena_subset_df=None):
140
  arena_df = arena_df.sort_values(
141
  by=["final_ranking", "rating"], ascending=[True, False]
142
  )
 
 
 
 
143
  arena_df["final_ranking"] = recompute_final_ranking(arena_df)
144
- arena_df = arena_df.sort_values(
145
- by=["final_ranking", "rating"], ascending=[True, False]
146
- )
147
 
148
  # sort by rating
149
  if arena_subset_df is not None:
@@ -319,6 +334,13 @@ def build_leaderboard_tab(
319
  value=selected_category, # Default to selected_category
320
  label="Category",
321
  )
 
 
 
 
 
 
 
322
  default_category_details = make_category_arena_leaderboard_md(
323
  arena_df, arena_df, name=selected_category
324
  )
@@ -458,7 +480,7 @@ def build_leaderboard_tab(
458
  highlight_rank_max, subset=["Delta"]
459
  )
460
 
461
- def update_leaderboard_and_plots(category):
462
  _, arena_dfs, category_elo_results, _ , model_table_df = read_elo_file(elo_results_file, leaderboard_table_file)
463
 
464
  arena_subset_df = arena_dfs[category]
@@ -471,6 +493,7 @@ def build_leaderboard_tab(
471
  arena_df,
472
  model_table_df,
473
  arena_subset_df=arena_subset_df if category != "Overall" else None,
 
474
  )
475
  if category != "Overall":
476
  arena_values = update_leaderboard_df(arena_values)
@@ -546,7 +569,20 @@ def build_leaderboard_tab(
546
  if leaderboard_table_file:
547
  category_dropdown.change(
548
  fn=update_leaderboard_and_plots,
549
- inputs=[category_dropdown],
 
 
 
 
 
 
 
 
 
 
 
 
 
550
  outputs=[
551
  elo_display_df,
552
  plot_1,
@@ -719,4 +755,4 @@ if __name__ == "__main__":
719
  leaderboard_table_file = leaderboard_table_files[-1]
720
 
721
  demo = build_demo(elo_result_file, leaderboard_table_file)
722
- demo.launch(show_api=False)
 
16
 
17
  promo_banner = """
18
  <div style="background-color: #ffcc00; color: black; padding: 10px; text-align: center; font-weight: bold; font-size: 18px; border: 2px solid #000;">
19
+ USE THE LATEST VERSIONS OF THE BEST CHATBOTS IN RUSSIAN FOR FREE
20
  </div>
21
  """
22
 
23
+ deprecated_model_name = [
24
+ "GigaChat 3.1.25.3",
25
+ "GigaChat-Pro 2.2.25.3",
26
+ "saiga_llama3_8b_v6",
27
+ "saiga_phi3_medium",
28
+ "GigaChat-Plus 3.1.25.3",
29
+ "GigaChat-Pro 4.0.26.8",
30
+ "GigaChat 4.0.26.8",
31
+ "xAI: Grok 2",
32
+ "GigaChat-Pro 4.0.26.15",
33
+ "GigaChat 4.0.26.15",
34
+ "YandexGPT Experimental", "yandex-gpt-arena"
35
+ ]
36
+
37
  def make_default_md_1():
38
  leaderboard_md = f"""
39
  # πŸ† LLM Arena in Russian: Leaderboard
 
150
  return list(ranking.values())
151
 
152
 
153
+ def get_arena_table(arena_df, model_table_df, arena_subset_df=None, hidden_models=None):
154
  arena_df = arena_df.sort_values(
155
  by=["final_ranking", "rating"], ascending=[True, False]
156
  )
157
+
158
+ if hidden_models:
159
+ arena_df = arena_df[~arena_df.index.isin(hidden_models)].copy() # Filter deprecated models
160
+
161
  arena_df["final_ranking"] = recompute_final_ranking(arena_df)
 
 
 
162
 
163
  # sort by rating
164
  if arena_subset_df is not None:
 
334
  value=selected_category, # Default to selected_category
335
  label="Category",
336
  )
337
+ with gr.Column(scale=2): # New CheckboxGroup for deprecated models
338
+ category_checkbox = gr.CheckboxGroup(
339
+ ["Show Deprecated Models"],
340
+ label="Filter",
341
+ info="",
342
+ )
343
+
344
  default_category_details = make_category_arena_leaderboard_md(
345
  arena_df, arena_df, name=selected_category
346
  )
 
480
  highlight_rank_max, subset=["Delta"]
481
  )
482
 
483
+ def update_leaderboard_and_plots(category, filters):
484
  _, arena_dfs, category_elo_results, _ , model_table_df = read_elo_file(elo_results_file, leaderboard_table_file)
485
 
486
  arena_subset_df = arena_dfs[category]
 
493
  arena_df,
494
  model_table_df,
495
  arena_subset_df=arena_subset_df if category != "Overall" else None,
496
+ hidden_models=None if "Show Deprecated Models" in filters else deprecated_model_name # Pass filter value
497
  )
498
  if category != "Overall":
499
  arena_values = update_leaderboard_df(arena_values)
 
569
  if leaderboard_table_file:
570
  category_dropdown.change(
571
  fn=update_leaderboard_and_plots,
572
+ inputs=[category_dropdown, category_checkbox], # Pass checkbox value
573
+ outputs=[
574
+ elo_display_df,
575
+ plot_1,
576
+ plot_2,
577
+ plot_3,
578
+ plot_4,
579
+ more_stats_md,
580
+ category_deets,
581
+ ],
582
+ )
583
+ category_checkbox.change( # Add a separate change handler for the checkbox
584
+ fn=update_leaderboard_and_plots,
585
+ inputs=[category_dropdown, category_checkbox],
586
  outputs=[
587
  elo_display_df,
588
  plot_1,
 
755
  leaderboard_table_file = leaderboard_table_files[-1]
756
 
757
  demo = build_demo(elo_result_file, leaderboard_table_file)
758
+ demo.launch(show_api=False)