Commit 44c2a20 · ready hyperlinks for leaderboard
Parent(s): ce4dda5

Files changed:
- utils/arena_df_leaderboard.csv +9 -0
- utils/leaderboard.py +31 -5
- utils/models.py +2 -2
utils/arena_df_leaderboard.csv ADDED

@@ -0,0 +1,9 @@
+model,wins,losses,ties
+Model Alpha,0,0,0
+Model Beta,0,0,0
+Model Delta (Refusal Specialist),0,0,0
+Model Gamma,0,0,0
+Qwen2.5-1.5b-Instruct,1,1,0
+Llama-3.2-1b-Instruct,0,1,0
+Qwen2.5-3b-Instruct,1,0,0
+Llama-3.2-3b-Instruct,0,0,0
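The new CSV seeds the arena leaderboard with per-model win/loss/tie counts. As a rough illustration of how such a file can be consumed, the sketch below loads it with pandas and derives a win rate; the column names come from the file above, but the helper name and the win_rate column are assumptions for illustration, not part of this commit.

import pandas as pd

# Illustrative only: load the seed arena results added in this commit.
def load_leaderboard(path: str = "utils/arena_df_leaderboard.csv") -> pd.DataFrame:
    df = pd.read_csv(path)
    # Guard against division by zero for models that have not played any match yet.
    total_games = (df["wins"] + df["losses"] + df["ties"]).clip(lower=1)
    df["win_rate"] = df["wins"] / total_games
    return df.sort_values(["wins", "win_rate"], ascending=False).reset_index(drop=True)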
utils/leaderboard.py CHANGED

@@ -2,6 +2,7 @@ import os
 import pandas as pd
 import math
 from datetime import datetime
+from .models import models
 
 # Default K-factor (determines how much a single match affects ratings)
 DEFAULT_K_FACTOR = 32
@@ -9,12 +10,37 @@ DEFAULT_K_FACTOR = 32
 # Default starting Elo
 DEFAULT_ELO = 1500
 
+def prepare_url(model_dict: dict):
+    """
+    Prepare the URL for the model based on its name.
+
+    Parameters:
+    - model_dict: Dictionary containing model information
+
+    Returns:
+    - URL string for the model
+    """
+    url_dict = {}
+    # Extract the model name from the dictionary
+    model_names = model_dict.keys()
+    for name in model_names:
+        half_url = model_dict[name]
+
+        # Construct the URL using the model name
+        url = f"https://huggingface.co/{half_url}"
+        url_dict[name] = url
+
+    return url_dict
+
+
 # Mapping of model names to their Hugging Face URLs
-model_to_hf = {
-    "Qwen2.5-1.5b-Instruct": "https://huggingface.co/qwen/qwen2.5-1.5b-instruct",
-    "Qwen2.5-3b-Instruct": "https://huggingface.co/qwen/qwen2.5-3b-instruct",
-    # Add more models and their HF links here
-}
+# model_to_hf = {
+#     "Qwen2.5-1.5b-Instruct": "https://huggingface.co/qwen/qwen2.5-1.5b-instruct",
+#     "Qwen2.5-3b-Instruct": "https://huggingface.co/qwen/qwen2.5-3b-instruct",
+#     # Add more models and their HF links here
+# }
+
+model_to_hf = prepare_url(models)
 
 def calculate_elo_changes(winner_rating, loser_rating, k_factor=DEFAULT_K_FACTOR, draw=False):
     """
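With this change, model_to_hf is no longer maintained by hand; it is generated from the models dict in utils/models.py. A small usage sketch follows, assuming utils is importable as a package (the module itself uses relative imports); the printed URL follows from the f-string in prepare_url, though the exact entries depend on what models currently contains.

from utils.models import models
from utils.leaderboard import prepare_url

# Each display name is mapped to a full Hugging Face URL by prefixing
# the repo id (e.g. "qwen/qwen2.5-1.5b-instruct") with https://huggingface.co/.
model_to_hf = prepare_url(models)
print(model_to_hf["Qwen2.5-1.5b-Instruct"])
# Expected: https://huggingface.co/qwen/qwen2.5-1.5b-instruct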
utils/models.py CHANGED

@@ -13,8 +13,8 @@ from .prompts import format_rag_prompt
 
 models = {
     "Qwen2.5-1.5b-Instruct": "qwen/qwen2.5-1.5b-instruct",
-    "Qwen2.5-3b-Instruct": "qwen/qwen2.5-3b-instruct", # remove gated for now
-    "Llama-3.2-3b-Instruct": "meta-llama/llama-3.2-3b-instruct",
+    #"Qwen2.5-3b-Instruct": "qwen/qwen2.5-3b-instruct", # remove gated for now
+    #"Llama-3.2-3b-Instruct": "meta-llama/llama-3.2-3b-instruct",
     "Llama-3.2-1b-Instruct": "meta-llama/llama-3.2-1b-instruct",
     "Gemma-3-1b-it" : "google/gemma-3-1b-it",
     #"Bitnet-b1.58-2B-4T": "microsoft/bitnet-b1.58-2B-4T",