Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
|
@@ -252,12 +252,13 @@ with block:
|
|
| 252 |
interactive=True,
|
| 253 |
)
|
| 254 |
|
| 255 |
-
|
| 256 |
-
|
| 257 |
-
|
| 258 |
-
|
| 259 |
-
|
| 260 |
-
|
|
|
|
| 261 |
|
| 262 |
with gr.Accordion("π Metrics", open=False):
|
| 263 |
leaderboard_metric_selector = gr.CheckboxGroup(
|
|
@@ -300,7 +301,6 @@ with block:
|
|
| 300 |
elem_classes="leaderboard-note",
|
| 301 |
)
|
| 302 |
|
| 303 |
-
gr.Markdown("#### If a method name ends with **^**, it suggests potential suspicions of data leakage related to ***similarity***, ***function***, or ***family*** benchmarks.")
|
| 304 |
# ── dataframe ────────────────────────────────────────────────
|
| 305 |
styler = build_leaderboard_styler(base_method_names, metric_names)
|
| 306 |
|
|
@@ -315,6 +315,8 @@ with block:
|
|
| 315 |
max_height=1000,
|
| 316 |
show_fullscreen_button=True,
|
| 317 |
)
|
|
|
|
|
|
|
| 318 |
|
| 319 |
# ── callbacks ────────────────────────────────────────────────
|
| 320 |
leaderboard_method_selector_base.change(
|
|
|
|
| 252 |
interactive=True,
|
| 253 |
)
|
| 254 |
|
| 255 |
+
with gr.Accordion("🧪 Benchmark Types", open=False):
|
| 256 |
+
benchmark_type_selector_lb = gr.CheckboxGroup(
|
| 257 |
+
choices=list(benchmark_metric_mapping.keys()),
|
| 258 |
+
label="Benchmark Types",
|
| 259 |
+
value=list(benchmark_metric_mapping.keys()), # all selected
|
| 260 |
+
interactive=True,
|
| 261 |
+
)
|
| 262 |
|
| 263 |
with gr.Accordion("π Metrics", open=False):
|
| 264 |
leaderboard_metric_selector = gr.CheckboxGroup(
|
|
|
|
| 301 |
elem_classes="leaderboard-note",
|
| 302 |
)
|
| 303 |
|
|
|
|
| 304 |
# ── dataframe ────────────────────────────────────────────────
|
| 305 |
styler = build_leaderboard_styler(base_method_names, metric_names)
|
| 306 |
|
|
|
|
| 315 |
max_height=1000,
|
| 316 |
show_fullscreen_button=True,
|
| 317 |
)
|
| 318 |
+
|
| 319 |
+
gr.Markdown("#### If a method name ends with **^**, it suggests potential suspicions of data leakage related to ***similarity***, ***function***, or ***family*** benchmarks.")
|
| 320 |
|
| 321 |
# ── callbacks ────────────────────────────────────────────────
|
| 322 |
leaderboard_method_selector_base.change(
|