Commit 
							
							·
						
						2171ba2
	
1
								Parent(s):
							
							ca59093
								
pin the space
Browse files
    	
        FACTS.tsv
    DELETED
    
    | @@ -1,32 +0,0 @@ | |
| 1 | 
            -
            model	size	Separate Grounding Score	Separate Quality Score	Combined Score
         | 
| 2 | 
            -
            deepseek-ai/DeepSeek-R1-Distill-Qwen-14B	14	0.817797	0.542373	0.457627
         | 
| 3 | 
            -
            VIDraft/Gemma-3-R1984-27B	27	0.93617	0.459574	0.434043
         | 
| 4 | 
            -
            meta-llama/Llama-3.3-70B-Instruct	70	0.842553	0.510638	0.425532
         | 
| 5 | 
            -
            Qwen/Qwen3-30B-A3B	30	0.812766	0.540426	0.425532
         | 
| 6 | 
            -
            Qwen/Qwen3-4B	4	0.770213	0.540426	0.425532
         | 
| 7 | 
            -
            Qwen/Qwen3-32B	32	0.740426	0.553191	0.417021
         | 
| 8 | 
            -
            deepseek-ai/DeepSeek-R1-Distill-Llama-8B	8	0.766949	0.516949	0.40678
         | 
| 9 | 
            -
            Qwen/Qwen3-8B	8	0.748936	0.523404	0.4
         | 
| 10 | 
            -
            Qwen/Qwen3-14B	14	0.778723	0.502128	0.382979
         | 
| 11 | 
            -
            google/gemma-3-27b-it	27	0.936	0.391	0.378
         | 
| 12 | 
            -
            Qwen/Qwen2.5-VL-32B-Instruct	32	0.621277	0.570213	0.357447
         | 
| 13 | 
            -
            meta-llama/Llama-3.1-70B-Instruct	70	0.855932	0.389831	0.334746
         | 
| 14 | 
            -
            google/gemma-3-12b-it	12	0.944	0.343	0.313
         | 
| 15 | 
            -
            google/gemma-3-4b-it	4	0.9	0.33	0.3
         | 
| 16 | 
            -
            Qwen/Qwen3-1.7B	1.7	0.702128	0.451064	0.297872
         | 
| 17 | 
            -
            deepseek-ai/DeepSeek-R1-Distill-Qwen-7B	7	0.59322	0.449153	0.275424
         | 
| 18 | 
            -
            Qwen/Qwen3-0.6B	0.6	0.682203	0.330508	0.266949
         | 
| 19 | 
            -
            Qwen/Qwen2.5-7B-Instruct	7	0.731915	0.310638	0.255319
         | 
| 20 | 
            -
            Qwen/Qwen2.5-14B-Instruct-1M	14	0.70339	0.300847	0.254237
         | 
| 21 | 
            -
            nvidia/Llama-Nemotron-Nano-8B	8	0.576271	0.402542	0.241525
         | 
| 22 | 
            -
            OpenScholar/Llama-3.1-OpenScholar-8B	8	0.690678	0.283898	0.241525
         | 
| 23 | 
            -
            Qwen/Qwen2.5-7B-Instruct-1M	7	0.737288	0.271186	0.207627
         | 
| 24 | 
            -
            nvidia/Llama-Nemotron-Nano-4B-v1.1	4	0.548936	0.340426	0.2
         | 
| 25 | 
            -
            google/gemma-3-1b-it	1	0.65	0.28	0.19
         | 
| 26 | 
            -
            mistralai/Ministral-8B-Instruct-2410	8	0.94	0.184	0.175
         | 
| 27 | 
            -
            meta-llama/Llama-3.1-8B-Instruct	8	0.665254	0.194915	0.169492
         | 
| 28 | 
            -
            mistralai/Mistral-Small-3.1-24B-Instruct-2503	24	0.953191	0.165957	0.157447
         | 
| 29 | 
            -
            mistralai/Mistral-Small-24B-Instruct-2501	24	0.95339	0.135593	0.131356
         | 
| 30 | 
            -
            open-thoughts/OpenThinker-7B	7	0.478814	0.152542	0.110169
         | 
| 31 | 
            -
            PleIAs/Pleias-RAG-350M	0.35	0.236264	0.021978	0.010989
         | 
| 32 | 
            -
            PleIAs/Pleias-RAG-1B	1	0.190476	0.037037	0
         | 
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | 
    	
        README.md
    CHANGED
    
    | @@ -6,7 +6,7 @@ colorTo: purple | |
| 6 | 
             
            sdk: gradio
         | 
| 7 | 
             
            sdk_version: 5.31.0
         | 
| 8 | 
             
            app_file: app.py
         | 
| 9 | 
            -
            pinned:  | 
| 10 | 
             
            license: apache-2.0
         | 
| 11 | 
             
            short_description: This is FACTS Grounding Leaderboard, but for Open LLMs!
         | 
| 12 | 
             
            ---
         | 
|  | |
| 6 | 
             
            sdk: gradio
         | 
| 7 | 
             
            sdk_version: 5.31.0
         | 
| 8 | 
             
            app_file: app.py
         | 
| 9 | 
            +
            pinned: true
         | 
| 10 | 
             
            license: apache-2.0
         | 
| 11 | 
             
            short_description: This is FACTS Grounding Leaderboard, but for Open LLMs!
         | 
| 12 | 
             
            ---
         | 
