danemery-ai2 committed on
Commit
ac9171f
·
unverified ·
1 Parent(s): 2972be9

Add column description tooltip icon to leaderboard legend (#11)

Browse files
Files changed (2) hide show
  1. content.py +34 -0
  2. ui_components.py +15 -0
content.py CHANGED
@@ -287,4 +287,38 @@ html:not(.dark) #legend-markdown .light-mode-icon,
287
  #legend-markdown .light-mode-icon, #legend-markdown .dark-mode-icon {
288
  display: none;
289
  }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
290
  """
 
287
  #legend-markdown .light-mode-icon, #legend-markdown .dark-mode-icon {
288
  display: none;
289
  }
290
+
291
+ /* Column description tooltip styles */
292
+ #legend-markdown,
293
+ #leaderboard-accordion {
294
+ overflow: visible !important;
295
+ }
296
+
297
+ .tooltip-icon {
298
+ display: inline-block;
299
+ margin-left: 6px;
300
+ cursor: help;
301
+ position: relative;
302
+ }
303
+
304
+ .tooltip-icon::after {
305
+ content: attr(data-tooltip);
306
+ position: absolute;
307
+ bottom: 125%;
308
+ background-color: #333;
309
+ color: #fff;
310
+ padding: 12px 16px;
311
+ border-radius: 4px;
312
+ font-size: 12px;
313
+ opacity: 0;
314
+ transition: opacity 0.2s;
315
+ white-space: pre-line;
316
+ width: 500px;
317
+ text-align: left;
318
+ pointer-events: none;
319
+ }
320
+
321
+ .tooltip-icon:hover::after {
322
+ opacity: 1;
323
+ }
324
  """
ui_components.py CHANGED
@@ -175,6 +175,21 @@ legend_markdown = f"""
175
  <div style="display: flex; flex-wrap: wrap; align-items: center; gap: 16px; margin-top: 4px;">{tooling_html}</div>
176
  </div>
177
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
178
  </div>
179
  """
180
 
 
175
  <div style="display: flex; flex-wrap: wrap; align-items: center; gap: 16px; margin-top: 4px;">{tooling_html}</div>
176
  </div>
177
 
178
+ <div><b>Column Descriptions</b><span class="tooltip-icon" data-tooltip="• Pareto: Indicates if agent is on the Pareto frontier
179
+ • Openness: Level of accessibility to model and implementation
180
+ • Agent Tooling: Approach used by the agent
181
+ • Agent: Name of the AI agent
182
+ • Overall Score: Performance across all benchmarks
183
+ • Overall Cost: Cost per task in USD
184
+ • Literature Understanding Score: Performance on scientific literature tasks
185
+ • Literature Understanding Cost: Cost per literature understanding task in USD
186
+ • Data Analysis Score: Performance on data analysis tasks
187
+ • Code Execution Score: Performance on coding tasks
188
+ • Code Execution Cost: Cost per code execution task in USD
189
+ • Discovery Score: Performance on information discovery tasks
190
+ • Discovery Cost: Cost per discovery task in USD
191
+ • Categories Attempted: Number of benchmark categories the agent participated in
192
+ • Logs: Link to detailed evaluation logs">ⓘ</span></div>
193
  </div>
194
  """
195