Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
|
@@ -53,7 +53,7 @@ except Exception:
|
|
| 53 |
|
| 54 |
LEADERBOARD_DF = get_leaderboard_df(EVAL_RESULTS_PATH, EVAL_REQUESTS_PATH, COLS, BENCHMARK_COLS)
|
| 55 |
_test_data = pd.DataFrame({"Score": [54,46,53], "Name": ["MageBench", "MageBench", "MageBench"], "BaseModel": ["GPT-4o", "GPT-4o", "LLaMA"], "Env.": ["Sokoban", "Sokoban", "Football"],
|
| 56 |
-
"Target-research": ["Model-Eval-Global", "Model-Eval-Online", "Agent-Eval-Prompt"], "Link": ["xxx", "xxx", "xxx"]})
|
| 57 |
|
| 58 |
|
| 59 |
(
|
|
@@ -79,6 +79,7 @@ def init_leaderboard(dataframe):
|
|
| 79 |
ColumnFilter("Target-research", type="checkboxgroup", label="Comparison settings for target researches (Single Selection)"),
|
| 80 |
ColumnFilter("BaseModel", type="dropdown", label="Select The base lmm model that fultill the task."),
|
| 81 |
ColumnFilter("Env.", type="checkboxgroup", label="Environment (Single Selection)"),
|
|
|
|
| 82 |
# ColumnFilter(AutoEvalColumn.precision.name, type="checkboxgroup", label="Precision"),
|
| 83 |
# ColumnFilter(
|
| 84 |
# AutoEvalColumn.params.name,
|
|
|
|
| 53 |
|
| 54 |
LEADERBOARD_DF = get_leaderboard_df(EVAL_RESULTS_PATH, EVAL_REQUESTS_PATH, COLS, BENCHMARK_COLS)
|
| 55 |
_test_data = pd.DataFrame({"Score": [54,46,53], "Name": ["MageBench", "MageBench", "MageBench"], "BaseModel": ["GPT-4o", "GPT-4o", "LLaMA"], "Env.": ["Sokoban", "Sokoban", "Football"],
|
| 56 |
+
"Target-research": ["Model-Eval-Global", "Model-Eval-Online", "Agent-Eval-Prompt"], "Subset": ["mini", "all", "mini"], "Link": ["xxx", "xxx", "xxx"]})
|
| 57 |
|
| 58 |
|
| 59 |
(
|
|
|
|
| 79 |
ColumnFilter("Target-research", type="checkboxgroup", label="Comparison settings for target researches (Single Selection)"),
|
| 80 |
ColumnFilter("BaseModel", type="dropdown", label="Select The base lmm model that fultill the task."),
|
| 81 |
ColumnFilter("Env.", type="checkboxgroup", label="Environment (Single Selection)"),
|
| 82 |
+
ColumnFilter("Subset", type="checkboxgroup", label="Subset (Single Selection)"),
|
| 83 |
# ColumnFilter(AutoEvalColumn.precision.name, type="checkboxgroup", label="Precision"),
|
| 84 |
# ColumnFilter(
|
| 85 |
# AutoEvalColumn.params.name,
|