Spaces:
Running
Running
Joschka Strueber
committed on
Commit
·
ffacaaa
1
Parent(s):
36159b1
[Add] metric selection
Browse files
app.py
CHANGED
|
@@ -9,7 +9,7 @@ from src.dataloading import get_leaderboard_models_cached, get_leaderboard_datas
|
|
| 9 |
# Set matplotlib backend for non-GUI environments
|
| 10 |
plt.switch_backend('Agg')
|
| 11 |
|
| 12 |
-
def create_heatmap(selected_models, selected_dataset):
|
| 13 |
if not selected_models or not selected_dataset:
|
| 14 |
return None
|
| 15 |
|
|
@@ -78,6 +78,13 @@ with gr.Blocks(title="LLM Similarity Analyzer") as demo:
|
|
| 78 |
allow_custom_value=False,
|
| 79 |
info="Search and select multiple models"
|
| 80 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 81 |
|
| 82 |
generate_btn = gr.Button("Generate Heatmap", variant="primary")
|
| 83 |
heatmap = gr.Image(label="Similarity Heatmap", visible=True)
|
|
@@ -88,7 +95,7 @@ with gr.Blocks(title="LLM Similarity Analyzer") as demo:
|
|
| 88 |
queue=False
|
| 89 |
).then(
|
| 90 |
fn=create_heatmap,
|
| 91 |
-
inputs=[model_dropdown, dataset_dropdown],
|
| 92 |
outputs=heatmap
|
| 93 |
)
|
| 94 |
|
|
|
|
| 9 |
# Set matplotlib backend for non-GUI environments
|
| 10 |
plt.switch_backend('Agg')
|
| 11 |
|
| 12 |
+
def create_heatmap(selected_models, selected_dataset, selected_metric):
|
| 13 |
if not selected_models or not selected_dataset:
|
| 14 |
return None
|
| 15 |
|
|
|
|
| 78 |
allow_custom_value=False,
|
| 79 |
info="Search and select multiple models"
|
| 80 |
)
|
| 81 |
+
|
| 82 |
+
# Similarity metric selector; listed as the third input to create_heatmap.
metric_dropdown = gr.Dropdown(
    choices=["Kappa_p (prob.)", "Kappa_p (det.)", "Error Consistency"],
    label="Select Metric",
    # The initial selection is set through `value`; `default` is not a
    # gr.Dropdown parameter in the Blocks API.
    value="Kappa_p (prob.)",
    info="Select a similarity metric to compute"
)
|
| 88 |
|
| 89 |
generate_btn = gr.Button("Generate Heatmap", variant="primary")
|
| 90 |
heatmap = gr.Image(label="Similarity Heatmap", visible=True)
|
|
|
|
| 95 |
queue=False
|
| 96 |
).then(
|
| 97 |
fn=create_heatmap,
|
| 98 |
+
inputs=[model_dropdown, dataset_dropdown, metric_dropdown],
|
| 99 |
outputs=heatmap
|
| 100 |
)
|
| 101 |
|