Spaces:
Running
Running
# Maps each model name (as it appears in the "Model" column of the results
# CSV) to a coarse parameter-count bucket used for grouping/filtering.
#
# Buckets in use: "<1b", "1b", "1b-7b", "7b", "8b", "13b", "30b", "70b",
# and "Unknown" for models whose size is not listed here.
SIZE_MAP = {
    "Airavata": "7b",
    "CCK-v2.0-DPO": "13b",
    "GEITje-7B": "7b",
    "Heimer-dpo-TinyLlama-1.1B": "1b",
    "Heimer-kto-TinyLlama-1.1B": "1b",
    "Heimer-ipo-TinyLlama-1.1B": "1b",
    "HuggingFaceH4": "7b",
    "Llama-2-13b-chat-hf": "13b",
    "Llama-2-13b-hf": "13b",
    "Llama-2-70b-chat-hf": "70b",
    "Llama-2-7b-chat-hf": "7b",
    "Llama-2-7b-hf": "7b",
    "Mistral-7B-Instruct-v0.1": "7b",
    "Mistral-7B-Instruct-v0.2": "7b",
    "OLMo-7B-Instruct": "7b",
    "OpenHathi-7B-Hi-v0.1-Base": "7b",
    "Qwen-7B-Chat": "7b",
    "Swallow-13b-instruct-hf": "13b",
    "Swallow-70b-instruct-hf": "70b",
    "Swallow-7b-hf": "7b",
    "Swallow-7b-instruct-hf": "7b",
    "Yi-6B-Chat": "1b-7b",
    "archangel_dpo_llama13b": "13b",
    "archangel_dpo_llama7b": "7b",
    "archangel_kto_llama13b": "13b",
    "archangel_kto_llama7b": "7b",
    "archangel_ppo_llama13b": "13b",
    "archangel_ppo_llama7b": "7b",
    "archangel_sft-dpo_llama13b": "13b",
    "archangel_sft-dpo_llama7b": "7b",
    "archangel_sft-kto_llama13b": "13b",
    "archangel_sft-kto_llama7b": "7b",
    "archangel_sft-ppo_llama13b": "13b",
    "archangel_sft-ppo_llama7b": "7b",
    "bloomz-1b1": "1b",
    # Was "7b": the name denotes 1.7B parameters, which belongs in the same
    # bucket as the other 1.4B-1.6B entries in this table.
    "bloomz-1b7": "1b-7b",
    "bloomz-3b": "1b-7b",
    "bloomz-560m": "<1b",
    "bloomz-7b1": "7b",
    "gemma-7b-it": "7b",
    "llama-30b": "30b",
    "mpt-7b": "7b",
    "mpt-7b-instruct": "7b",
    "pythia-1.4b": "1b-7b",
    "pythia-12b": "13b",
    "pythia-160m": "<1b",
    "pythia-1b": "1b",
    "pythia-2.8b": "1b-7b",
    # Was "1b": sub-billion models use "<1b" (see pythia-160m, bloomz-560m).
    "pythia-410m": "<1b",
    "pythia-6.9b": "7b",
    # Was "1b": sub-billion models use "<1b" (see pythia-160m, bloomz-560m).
    "pythia-70m": "<1b",
    "ruGPT-3.5-13B": "13b",
    "stablelm-2-1_6b": "1b-7b",
    "stablelm-2-zephyr-1_6b": "1b-7b",
    "tulu-2-13b": "13b",
    "tulu-2-7b": "7b",
    "tulu-2-dpo-13b": "13b",
    "tulu-2-dpo-70b": "70b",
    "tulu-2-dpo-7b": "7b",
    "zephyr-7b-beta": "7b",
    "gpt-35-turbo": "Unknown",
    "Aya101": "13b",
    "zephyr-7b-gemma-v0.1": "7b",
    "Mistral-7B-v0.1": "7b",
    "Meta-Llama-3-8B-Instruct": "8b",
    "Meta-Llama-3-8B": "8b",
}
# Maps each model name to the family label it is grouped under.
# "NA" marks a model with no family assigned in this table.
MODEL_FAMILY = {
    "Airavata": "OpenHathi",
    "CCK-v2.0-DPO": "NA",
    "GEITje-7B": "Mistral-GEITje",
    # TinyLlama fine-tunes
    "Heimer-dpo-TinyLlama-1.1B": "Llama-Tiny",
    "Heimer-kto-TinyLlama-1.1B": "Llama-Tiny",
    "Heimer-ipo-TinyLlama-1.1B": "Llama-Tiny",
    "HuggingFaceH4": "Mistral-CAI",
    # Llama 2
    "Llama-2-13b-chat-hf": "Llama",
    "Llama-2-13b-hf": "Llama",
    "Llama-2-70b-chat-hf": "Llama",
    "Llama-2-7b-chat-hf": "Llama",
    "Llama-2-7b-hf": "Llama",
    "Mistral-7B-Instruct-v0.1": "Mistral",
    "Mistral-7B-Instruct-v0.2": "Mistral",
    "OLMo-7B-Instruct": "OLMo",
    "OpenHathi-7B-Hi-v0.1-Base": "OpenHathi",
    "Qwen-7B-Chat": "Qwen",
    # Swallow
    "Swallow-13b-instruct-hf": "Llama-Swallow",
    "Swallow-70b-instruct-hf": "Llama-Swallow",
    "Swallow-7b-hf": "Llama-Swallow",
    "Swallow-7b-instruct-hf": "Llama-Swallow",
    "Yi-6B-Chat": "Yi",
    # Archangel
    "archangel_dpo_llama13b": "Llama-Archangel",
    "archangel_dpo_llama7b": "Llama-Archangel",
    "archangel_kto_llama13b": "Llama-Archangel",
    "archangel_kto_llama7b": "Llama-Archangel",
    "archangel_ppo_llama13b": "Llama-Archangel",
    "archangel_ppo_llama7b": "Llama-Archangel",
    "archangel_sft-dpo_llama13b": "Llama-Archangel",
    "archangel_sft-dpo_llama7b": "Llama-Archangel",
    "archangel_sft-kto_llama13b": "Llama-Archangel",
    "archangel_sft-kto_llama7b": "Llama-Archangel",
    "archangel_sft-ppo_llama13b": "Llama-Archangel",
    "archangel_sft-ppo_llama7b": "Llama-Archangel",
    # Bloomz
    "bloomz-1b1": "Bloomz",
    "bloomz-1b7": "Bloomz",
    "bloomz-3b": "Bloomz",
    "bloomz-560m": "Bloomz",
    "bloomz-7b1": "Bloomz",
    "gemma-7b-it": "Gemma",
    "llama-30b": "Llama",
    "mpt-7b": "MPT",
    "mpt-7b-instruct": "MPT",
    # Pythia
    "pythia-1.4b": "Pythia",
    "pythia-12b": "Pythia",
    "pythia-160m": "Pythia",
    "pythia-1b": "Pythia",
    "pythia-2.8b": "Pythia",
    "pythia-410m": "Pythia",
    "pythia-6.9b": "Pythia",
    "pythia-70m": "Pythia",
    "ruGPT-3.5-13B": "GPT",
    "stablelm-2-1_6b": "StableLM",
    "stablelm-2-zephyr-1_6b": "StableLM",
    # Tulu 2
    "tulu-2-13b": "Llama-Tulu",
    "tulu-2-7b": "Llama-Tulu",
    "tulu-2-dpo-13b": "Llama-Tulu",
    "tulu-2-dpo-70b": "Llama-Tulu",
    "tulu-2-dpo-7b": "Llama-Tulu",
    "zephyr-7b-beta": "Mistral",
    "gpt-35-turbo": "GPT-OAI",
    "Aya101": "Aya101",
    "zephyr-7b-gemma-v0.1": "Gemma",
    "Mistral-7B-v0.1": "Mistral",
    "Meta-Llama-3-8B-Instruct": "Llama",
    "Meta-Llama-3-8B": "Llama",
}
# Maps each model name to its training-stage label.
# Labels in use: "base", "instruct", "preference".
MODEL_TYPE = {
    "Airavata": "instruct",
    "CCK-v2.0-DPO": "preference",
    "GEITje-7B": "base",
    "Heimer-dpo-TinyLlama-1.1B": "preference",
    "Heimer-kto-TinyLlama-1.1B": "preference",
    "Heimer-ipo-TinyLlama-1.1B": "preference",
    "HuggingFaceH4": "preference",
    "Llama-2-13b-chat-hf": "preference",
    "Llama-2-13b-hf": "base",
    "Llama-2-70b-chat-hf": "preference",
    "Llama-2-7b-chat-hf": "preference",
    "Llama-2-7b-hf": "base",
    "Mistral-7B-Instruct-v0.1": "instruct",
    "Mistral-7B-Instruct-v0.2": "instruct",
    "OLMo-7B-Instruct": "preference",
    # NOTE(review): the name ends in "-Base" but the label is "instruct" —
    # confirm this is intentional.
    "OpenHathi-7B-Hi-v0.1-Base": "instruct",
    "Qwen-7B-Chat": "preference",
    "Swallow-13b-instruct-hf": "instruct",
    "Swallow-70b-instruct-hf": "instruct",
    "Swallow-7b-hf": "base",
    "Swallow-7b-instruct-hf": "instruct",
    "Yi-6B-Chat": "preference",
    # Archangel
    "archangel_dpo_llama13b": "preference",
    "archangel_dpo_llama7b": "preference",
    "archangel_kto_llama13b": "preference",
    "archangel_kto_llama7b": "preference",
    "archangel_ppo_llama13b": "preference",
    "archangel_ppo_llama7b": "preference",
    "archangel_sft-dpo_llama13b": "preference",
    "archangel_sft-dpo_llama7b": "preference",
    "archangel_sft-kto_llama13b": "preference",
    "archangel_sft-kto_llama7b": "preference",
    "archangel_sft-ppo_llama13b": "preference",
    "archangel_sft-ppo_llama7b": "preference",
    # Bloomz
    "bloomz-1b1": "base",
    "bloomz-1b7": "base",
    "bloomz-3b": "base",
    "bloomz-560m": "base",
    "bloomz-7b1": "base",
    "gemma-7b-it": "instruct",
    "llama-30b": "base",
    "mpt-7b": "base",
    "mpt-7b-instruct": "instruct",
    # Pythia
    "pythia-1.4b": "base",
    "pythia-12b": "base",
    "pythia-160m": "base",
    "pythia-1b": "base",
    "pythia-2.8b": "base",
    "pythia-410m": "base",
    "pythia-6.9b": "base",
    "pythia-70m": "base",
    "ruGPT-3.5-13B": "base",
    "stablelm-2-1_6b": "instruct",
    "stablelm-2-zephyr-1_6b": "preference",
    # Tulu 2
    "tulu-2-13b": "preference",
    "tulu-2-7b": "preference",
    "tulu-2-dpo-13b": "preference",
    "tulu-2-dpo-70b": "preference",
    "tulu-2-dpo-7b": "preference",
    "zephyr-7b-beta": "preference",
    "gpt-35-turbo": "preference",
    "Aya101": "instruct",
    "zephyr-7b-gemma-v0.1": "preference",
    "Mistral-7B-v0.1": "base",
    "Meta-Llama-3-8B-Instruct": "preference",
    "Meta-Llama-3-8B": "base",
}
# Family labels (values of MODEL_FAMILY) that load_main_table marks as
# multilingual in the "Multilingual" column.
MULTILINGUAL_FAMILY = [
    "Aya101",
    "GPT-OAI",
    "Bloomz",
]
| import pandas as pd | |
def load_main_table(path: str = "./data/data.csv") -> pd.DataFrame:
    """Load the results CSV and attach per-model metadata columns.

    The CSV is read, numeric values are rounded to 3 decimals, rows for the
    model 'CCK-v2.0-DPO' are dropped, and four columns are added:
    'Model Size', 'Model Type', 'Model Family' (looked up from SIZE_MAP,
    MODEL_TYPE and MODEL_FAMILY by the 'Model' column) and 'Multilingual'
    (True when the family is listed in MULTILINGUAL_FAMILY).

    Args:
        path: Location of the CSV file. It must contain the columns
            'Model' and 'Average Toxicity'.

    Returns:
        The augmented DataFrame, sorted ascending by 'Average Toxicity'.

    Raises:
        ValueError: If a model in the CSV has no entry in SIZE_MAP,
            MODEL_TYPE or MODEL_FAMILY.
    """
    df = pd.read_csv(path).round(3)

    # .copy() gives an independent frame, so the column assignments below do
    # not write into a filtered slice (avoids SettingWithCopyWarning).
    df = df[df["Model"] != "CCK-v2.0-DPO"].copy()

    # Explicit check instead of `assert`: assertions are stripped under
    # `python -O`, and an unmapped model would otherwise silently become NaN.
    models = set(df["Model"].unique())
    lookups = (
        ("SIZE_MAP", SIZE_MAP),
        ("MODEL_TYPE", MODEL_TYPE),
        ("MODEL_FAMILY", MODEL_FAMILY),
    )
    for label, mapping in lookups:
        # key=str keeps the sort safe if the column holds non-string values.
        missing = sorted(models.difference(mapping), key=str)
        if missing:
            raise ValueError(f"Models missing from {label}: {missing}")

    df["Model Size"] = df["Model"].map(SIZE_MAP)
    df["Model Type"] = df["Model"].map(MODEL_TYPE)
    df["Model Family"] = df["Model"].map(MODEL_FAMILY)
    df["Multilingual"] = df["Model Family"].isin(MULTILINGUAL_FAMILY)

    return df.sort_values(by="Average Toxicity")