Commit
·
d7a42ca
1
Parent(s):
331f902
Improve setup
Browse files
- Add a checkbox to hide incomplete evaluations.
- Remove the precision filter (no longer needed).
- Add default values for the parameter-size slider.
app.py
CHANGED
|
@@ -34,6 +34,7 @@ def init_leaderboard(source: str, aggregate: bool = False) -> Leaderboard:
|
|
| 34 |
|
| 35 |
df = pd.DataFrame.from_records(all_data_json)
|
| 36 |
df = df.sort_values(by=[AutoEvalColumn.average.name], ascending=False)
|
|
|
|
| 37 |
|
| 38 |
master_columns = []
|
| 39 |
for col in fields(AutoEvalColumn):
|
|
@@ -51,8 +52,8 @@ def init_leaderboard(source: str, aggregate: bool = False) -> Leaderboard:
|
|
| 51 |
for c in fields(AutoEvalColumn)
|
| 52 |
if not c.hidden and c.name in master_columns
|
| 53 |
]
|
|
|
|
| 54 |
df = df[cols].round(decimals=2)
|
| 55 |
-
# df = df[has_no_nan_values(df, benchmark_cols)]
|
| 56 |
|
| 57 |
return Leaderboard(
|
| 58 |
value=df,
|
|
@@ -72,10 +73,11 @@ def init_leaderboard(source: str, aggregate: bool = False) -> Leaderboard:
|
|
| 72 |
),
|
| 73 |
filter_columns=[
|
| 74 |
# fmt: off
|
| 75 |
-
ColumnFilter(
|
|
|
|
| 76 |
ColumnFilter(AutoEvalColumn.model_type.name, type="checkboxgroup", label="Model type"),
|
| 77 |
ColumnFilter(AutoEvalColumn.multilingual.name, type="checkboxgroup", label="Multilinguality"),
|
| 78 |
-
ColumnFilter(AutoEvalColumn.param_size.name, type="slider", min=0.01, max=150, label="Select the number of parameters (B)"),
|
| 79 |
# fmt: on
|
| 80 |
],
|
| 81 |
search_columns=[AutoEvalColumn.model.name],
|
|
@@ -120,6 +122,6 @@ with demo:
|
|
| 120 |
|
| 121 |
|
| 122 |
scheduler = BackgroundScheduler()
|
| 123 |
-
scheduler.add_job(restart_space, "interval", seconds=
|
| 124 |
scheduler.start()
|
| 125 |
demo.queue(default_concurrency_limit=40).launch()
|
|
|
|
| 34 |
|
| 35 |
df = pd.DataFrame.from_records(all_data_json)
|
| 36 |
df = df.sort_values(by=[AutoEvalColumn.average.name], ascending=False)
|
| 37 |
+
df["Incomplete"] = ~df.isna().any(axis=1)
|
| 38 |
|
| 39 |
master_columns = []
|
| 40 |
for col in fields(AutoEvalColumn):
|
|
|
|
| 52 |
for c in fields(AutoEvalColumn)
|
| 53 |
if not c.hidden and c.name in master_columns
|
| 54 |
]
|
| 55 |
+
cols.append("Incomplete")
|
| 56 |
df = df[cols].round(decimals=2)
|
|
|
|
| 57 |
|
| 58 |
return Leaderboard(
|
| 59 |
value=df,
|
|
|
|
| 73 |
),
|
| 74 |
filter_columns=[
|
| 75 |
# fmt: off
|
| 76 |
+
ColumnFilter("Incomplete", type="boolean", label="Hide incomplete evaluations", default=True),
|
| 77 |
+
# ColumnFilter(AutoEvalColumn.precision.name, type="checkboxgroup", label="Precision"),
|
| 78 |
ColumnFilter(AutoEvalColumn.model_type.name, type="checkboxgroup", label="Model type"),
|
| 79 |
ColumnFilter(AutoEvalColumn.multilingual.name, type="checkboxgroup", label="Multilinguality"),
|
| 80 |
+
ColumnFilter(AutoEvalColumn.param_size.name, type="slider", min=0.01, max=150, label="Select the number of parameters (B)", default=[-1, 83]),
|
| 81 |
# fmt: on
|
| 82 |
],
|
| 83 |
search_columns=[AutoEvalColumn.model.name],
|
|
|
|
| 122 |
|
| 123 |
|
| 124 |
scheduler = BackgroundScheduler()
|
| 125 |
+
scheduler.add_job(restart_space, "interval", seconds=3600)
|
| 126 |
scheduler.start()
|
| 127 |
demo.queue(default_concurrency_limit=40).launch()
|