Spaces:
Runtime error
Runtime error
Thomas G. Lopes
committed on
Commit
·
aa8170a
1
Parent(s):
33e2c0d
fix types
Browse files
src/lib/components/inference-playground/code-snippets.svelte
CHANGED
|
@@ -112,6 +112,7 @@
|
|
| 112 |
python: getSnippet({ lang: "python", tokenStr, conversation }),
|
| 113 |
http: getSnippet({ lang: "sh", tokenStr, conversation }),
|
| 114 |
} as Record<Language, GetInferenceSnippetReturn>);
|
|
|
|
| 115 |
|
| 116 |
const selectedSnippet = $derived(snippetsByLang[lang][selectedSnippetIdxByLang[lang]]);
|
| 117 |
|
|
|
|
| 112 |
python: getSnippet({ lang: "python", tokenStr, conversation }),
|
| 113 |
http: getSnippet({ lang: "sh", tokenStr, conversation }),
|
| 114 |
} as Record<Language, GetInferenceSnippetReturn>);
|
| 115 |
+
$inspect(snippetsByLang);
|
| 116 |
|
| 117 |
const selectedSnippet = $derived(snippetsByLang[lang][selectedSnippetIdxByLang[lang]]);
|
| 118 |
|
src/lib/components/inference-playground/model-selector.svelte
CHANGED
|
@@ -6,6 +6,7 @@
|
|
| 6 |
import Avatar from "../avatar.svelte";
|
| 7 |
import ModelSelectorModal from "./model-selector-modal.svelte";
|
| 8 |
import ProviderSelect from "./provider-select.svelte";
|
|
|
|
| 9 |
|
| 10 |
interface Props {
|
| 11 |
conversation: ConversationClass;
|
|
@@ -32,6 +33,7 @@
|
|
| 32 |
const nameSpace = $derived(isCustom ? "Custom endpoint" : (model.id.split("/")[0] ?? ""));
|
| 33 |
const modelName = $derived(isCustom ? model.id : (model.id.split("/")[1] ?? ""));
|
| 34 |
const id = $props.id();
|
|
|
|
| 35 |
</script>
|
| 36 |
|
| 37 |
<div class="flex flex-col gap-2">
|
|
|
|
| 6 |
import Avatar from "../avatar.svelte";
|
| 7 |
import ModelSelectorModal from "./model-selector-modal.svelte";
|
| 8 |
import ProviderSelect from "./provider-select.svelte";
|
| 9 |
+
import typia from "typia";
|
| 10 |
|
| 11 |
interface Props {
|
| 12 |
conversation: ConversationClass;
|
|
|
|
| 33 |
const nameSpace = $derived(isCustom ? "Custom endpoint" : (model.id.split("/")[0] ?? ""));
|
| 34 |
const modelName = $derived(isCustom ? model.id : (model.id.split("/")[1] ?? ""));
|
| 35 |
const id = $props.id();
|
| 36 |
+
$inspect(conversation.model, isHFModel(conversation.model), typia.validate<Model>(conversation.model));
|
| 37 |
</script>
|
| 38 |
|
| 39 |
<div class="flex flex-col gap-2">
|
src/lib/data/context_length.json
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
{
|
| 2 |
"replicate": {},
|
| 3 |
"sambanova": {
|
| 4 |
-
"DeepSeek-R1": 32768,
|
| 5 |
"DeepSeek-R1-Distill-Llama-70B": 131072,
|
| 6 |
"DeepSeek-V3-0324": 32768,
|
| 7 |
"E5-Mistral-7B-Instruct": 4096,
|
|
@@ -15,7 +15,7 @@
|
|
| 15 |
"Meta-Llama-Guard-3-8B": 16384,
|
| 16 |
"QwQ-32B": 16384,
|
| 17 |
"Qwen2-Audio-7B-Instruct": 4096,
|
| 18 |
-
"Qwen3-32B":
|
| 19 |
"Whisper-Large-v3": 4096
|
| 20 |
},
|
| 21 |
"nebius": {
|
|
@@ -46,6 +46,7 @@
|
|
| 46 |
"microsoft/phi-4": 16384,
|
| 47 |
"deepseek-ai/DeepSeek-V3": 163840,
|
| 48 |
"deepseek-ai/DeepSeek-R1": 163840,
|
|
|
|
| 49 |
"NousResearch/Hermes-3-Llama-405B": 131072,
|
| 50 |
"deepseek-ai/DeepSeek-R1-Distill-Llama-70B": 131072,
|
| 51 |
"deepseek-ai/DeepSeek-R1-fast": 163840,
|
|
@@ -70,15 +71,16 @@
|
|
| 70 |
"stability-ai/sdxl": 0
|
| 71 |
},
|
| 72 |
"novita": {
|
|
|
|
|
|
|
| 73 |
"deepseek/deepseek-v3-0324": 128000,
|
| 74 |
"qwen/qwen3-235b-a22b-fp8": 40960,
|
| 75 |
"qwen/qwen3-30b-a3b-fp8": 40960,
|
| 76 |
"qwen/qwen3-32b-fp8": 40960,
|
| 77 |
-
"qwen/qwen2.5-vl-72b-instruct":
|
| 78 |
"deepseek/deepseek-v3-turbo": 64000,
|
| 79 |
"meta-llama/llama-4-maverick-17b-128e-instruct-fp8": 1048576,
|
| 80 |
"google/gemma-3-27b-it": 32000,
|
| 81 |
-
"qwen/qwq-32b": 32768,
|
| 82 |
"deepseek/deepseek-r1-turbo": 64000,
|
| 83 |
"Sao10K/L3-8B-Stheno-v3.2": 8192,
|
| 84 |
"gryphe/mythomax-l2-13b": 4096,
|
|
@@ -89,13 +91,11 @@
|
|
| 89 |
"deepseek/deepseek-r1-distill-qwen-14b": 64000,
|
| 90 |
"meta-llama/llama-3.3-70b-instruct": 131072,
|
| 91 |
"qwen/qwen-2.5-72b-instruct": 32000,
|
| 92 |
-
"mistralai/mistral-nemo":
|
| 93 |
"deepseek/deepseek-r1-distill-qwen-32b": 64000,
|
| 94 |
"meta-llama/llama-3-8b-instruct": 8192,
|
| 95 |
"microsoft/wizardlm-2-8x22b": 65535,
|
| 96 |
"deepseek/deepseek-r1-distill-llama-70b": 32000,
|
| 97 |
-
"meta-llama/llama-3.1-70b-instruct": 32768,
|
| 98 |
-
"google/gemma-2-9b-it": 8192,
|
| 99 |
"mistralai/mistral-7b-instruct": 32768,
|
| 100 |
"meta-llama/llama-3-70b-instruct": 8192,
|
| 101 |
"nousresearch/hermes-2-pro-llama-3-8b": 8192,
|
|
@@ -103,12 +103,8 @@
|
|
| 103 |
"cognitivecomputations/dolphin-mixtral-8x22b": 16000,
|
| 104 |
"sophosympatheia/midnight-rose-70b": 4096,
|
| 105 |
"sao10k/l3-8b-lunaris": 8192,
|
| 106 |
-
"pa/cd-op-4-20250514": 200000,
|
| 107 |
-
"qwen/qwen3-0.6b-fp8": 32000,
|
| 108 |
-
"qwen/qwen3-1.7b-fp8": 32000,
|
| 109 |
"qwen/qwen3-8b-fp8": 128000,
|
| 110 |
"qwen/qwen3-4b-fp8": 128000,
|
| 111 |
-
"qwen/qwen3-14b-fp8": 40960,
|
| 112 |
"thudm/glm-4-9b-0414": 32000,
|
| 113 |
"thudm/glm-z1-9b-0414": 32000,
|
| 114 |
"thudm/glm-z1-32b-0414": 32000,
|
|
@@ -116,7 +112,6 @@
|
|
| 116 |
"thudm/glm-z1-rumination-32b-0414": 32000,
|
| 117 |
"qwen/qwen2.5-7b-instruct": 32000,
|
| 118 |
"meta-llama/llama-3.2-1b-instruct": 131000,
|
| 119 |
-
"meta-llama/llama-3.2-11b-vision-instruct": 32768,
|
| 120 |
"meta-llama/llama-3.2-3b-instruct": 32768,
|
| 121 |
"meta-llama/llama-3.1-8b-instruct-bf16": 8192,
|
| 122 |
"sao10k/l31-70b-euryale-v2.2": 8192
|
|
@@ -138,7 +133,6 @@
|
|
| 138 |
"deepseek-ai/DeepSeek-V3": 131072,
|
| 139 |
"deepseek-ai/DeepSeek-V3-0324": 163840,
|
| 140 |
"meta-llama/Llama-3.3-70B-Instruct": 131072,
|
| 141 |
-
"Qwen/QwQ-32B-Preview": 32768,
|
| 142 |
"Qwen/Qwen2.5-Coder-32B-Instruct": 32768,
|
| 143 |
"meta-llama/Llama-3.2-3B-Instruct": 131072,
|
| 144 |
"NousResearch/Hermes-3-Llama-3.1-70B": 12288,
|
|
@@ -147,7 +141,6 @@
|
|
| 147 |
"meta-llama/Meta-Llama-3.1-8B-Instruct": 131072,
|
| 148 |
"mistralai/Pixtral-12B-2409": 32768,
|
| 149 |
"Qwen/Qwen2.5-VL-7B-Instruct": 32768,
|
| 150 |
-
"meta-llama/Meta-Llama-3.1-405B": 32768,
|
| 151 |
"meta-llama/Meta-Llama-3.1-405B-FP8": 32768,
|
| 152 |
"deepseek-ai/DeepSeek-R1": 163840,
|
| 153 |
"Qwen/QwQ-32B": 131072
|
|
@@ -176,77 +169,79 @@
|
|
| 176 |
"command": 4096
|
| 177 |
},
|
| 178 |
"together": {
|
| 179 |
-
"meta-llama/Llama-Guard-4-12B": 1048576,
|
| 180 |
"togethercomputer/m2-bert-80M-32k-retrieval": 32768,
|
| 181 |
"cartesia/sonic": 0,
|
| 182 |
-
"scb10x/scb10x-llama3-1-typhoon2-8b-instruct": 8192,
|
| 183 |
"meta-llama-llama-2-70b-hf": 4096,
|
| 184 |
-
"togethercomputer/Refuel-Llm-V2": 16384,
|
| 185 |
"intfloat/multilingual-e5-large-instruct": 514,
|
| 186 |
-
"BAAI/bge-base-en-v1.5": 512,
|
| 187 |
-
"meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo": 130815,
|
| 188 |
"Gryphe/MythoMax-L2-13b": 4096,
|
| 189 |
"Alibaba-NLP/gte-modernbert-base": 8192,
|
| 190 |
-
"mistralai/Mistral-7B-Instruct-v0.1": 32768,
|
| 191 |
-
"Qwen/Qwen2.5-7B-Instruct-Turbo": 32768,
|
| 192 |
-
"Qwen/Qwen2.5-72B-Instruct-Turbo": 131072,
|
| 193 |
-
"Qwen/QwQ-32B": 131072,
|
| 194 |
-
"mistralai/Mixtral-8x7B-Instruct-v0.1": 32768,
|
| 195 |
-
"google/gemma-2-27b-it": 8192,
|
| 196 |
-
"Qwen/Qwen2-VL-72B-Instruct": 32768,
|
| 197 |
-
"meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo": 131072,
|
| 198 |
"meta-llama/LlamaGuard-2-8b": 8192,
|
| 199 |
"cartesia/sonic-2": 0,
|
| 200 |
"togethercomputer/m2-bert-80M-8k-retrieval": 8192,
|
| 201 |
-
"deepseek-ai/DeepSeek-R1
|
| 202 |
-
"deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B": 131072,
|
| 203 |
-
"deepseek-ai/DeepSeek-R1-Distill-Llama-70B-free": 8192,
|
| 204 |
-
"meta-llama/Llama-3.3-70B-Instruct-Turbo-Free": 131072,
|
| 205 |
-
"deepseek-ai/DeepSeek-R1-Distill-Llama-70B": 131072,
|
| 206 |
-
"deepseek-ai/DeepSeek-V3": 131072,
|
| 207 |
-
"togethercomputer/Refuel-Llm-V2-Small": 8192,
|
| 208 |
"togethercomputer/MoA-1": 32768,
|
| 209 |
"meta-llama/Meta-Llama-3-70B-Instruct-Turbo": 8192,
|
| 210 |
-
"google/gemma-2b-it": 8192,
|
| 211 |
-
"meta-llama/Llama-3.2-11B-Vision-Instruct-Turbo": 131072,
|
| 212 |
"Gryphe/MythoMax-L2-13b-Lite": 4096,
|
| 213 |
"meta-llama/Meta-Llama-Guard-3-8B": 8192,
|
| 214 |
-
"
|
| 215 |
-
"
|
| 216 |
-
"
|
| 217 |
-
"arcee-ai/arcee-blitz": 32768,
|
| 218 |
-
"arcee-ai/caller": 32768,
|
| 219 |
-
"arcee-ai/coder-large": 32768,
|
| 220 |
-
"arcee-ai/maestro-reasoning": 131072,
|
| 221 |
-
"arcee-ai/virtuoso-large": 131072,
|
| 222 |
-
"arcee-ai/virtuoso-medium-v2": 131072,
|
| 223 |
-
"meta-llama/Llama-3.2-90B-Vision-Instruct-Turbo": 131072,
|
| 224 |
-
"meta-llama/Llama-3-70b-chat-hf": 8192,
|
| 225 |
"meta-llama/Llama-3-8b-chat-hf": 8192,
|
| 226 |
-
"mistralai/Mistral-
|
| 227 |
-
"
|
|
|
|
| 228 |
"togethercomputer/MoA-1-Turbo": 32768,
|
| 229 |
-
"perplexity-ai/r1-1776": 163840,
|
| 230 |
-
"NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO": 32768,
|
| 231 |
"meta-llama/Meta-Llama-3-8B-Instruct-Lite": 8192,
|
| 232 |
-
"
|
| 233 |
-
"Qwen/Qwen3-235B-A22B-fp8-tput": 40960,
|
| 234 |
-
"meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo": 131072,
|
| 235 |
-
"nvidia/Llama-3.1-Nemotron-70B-Instruct-HF": 32768,
|
| 236 |
-
"scb10x/scb10x-llama3-1-typhoon2-70b-instruct": 8192,
|
| 237 |
"mistralai/Mistral-7B-Instruct-v0.2": 32768,
|
| 238 |
"deepseek-ai/DeepSeek-V3-p-dp": 131072,
|
| 239 |
-
"Qwen/Qwen2.5-Coder-32B-Instruct": 16384,
|
| 240 |
"Qwen/Qwen2-72B-Instruct": 32768,
|
| 241 |
"mistralai/Mistral-7B-Instruct-v0.3": 32768,
|
| 242 |
-
"
|
| 243 |
-
"meta-llama/Llama-Vision-
|
| 244 |
"meta-llama/Llama-Guard-3-11B-Vision-Turbo": 131072,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 245 |
"meta-llama/Llama-3.2-3B-Instruct-Turbo": 131072,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 246 |
"meta-llama/Llama-3.3-70B-Instruct-Turbo": 131072,
|
| 247 |
-
"meta-llama/Llama-
|
| 248 |
-
"
|
| 249 |
-
"
|
|
|
|
|
|
|
|
|
|
| 250 |
},
|
| 251 |
"fireworks-ai": {
|
| 252 |
"accounts/fireworks/models/qwq-32b": 131072,
|
|
@@ -258,6 +253,7 @@
|
|
| 258 |
"accounts/fireworks/models/llama4-scout-instruct-basic": 1048576,
|
| 259 |
"accounts/fireworks/models/qwen2-vl-72b-instruct": 32768,
|
| 260 |
"accounts/fireworks/models/firesearch-ocr-v6": 131072,
|
|
|
|
| 261 |
"accounts/fireworks/models/deepseek-v3": 131072,
|
| 262 |
"accounts/fireworks/models/llama-v3p1-8b-instruct": 131072,
|
| 263 |
"accounts/fireworks/models/llama-v3p1-70b-instruct": 131072,
|
|
@@ -267,6 +263,7 @@
|
|
| 267 |
"accounts/fireworks/models/deepseek-r1": 163840,
|
| 268 |
"accounts/sentientfoundation/models/dobby-unhinged-llama-3-3-70b-new": 131072,
|
| 269 |
"accounts/perplexity/models/r1-1776": 163840,
|
|
|
|
| 270 |
"accounts/fireworks/models/llama-v3p1-405b-instruct": 131072,
|
| 271 |
"accounts/fireworks/models/mixtral-8x22b-instruct": 65536,
|
| 272 |
"accounts/fireworks/models/qwen2p5-72b-instruct": 32768
|
|
|
|
| 1 |
{
|
| 2 |
"replicate": {},
|
| 3 |
"sambanova": {
|
| 4 |
+
"DeepSeek-R1-0528": 32768,
|
| 5 |
"DeepSeek-R1-Distill-Llama-70B": 131072,
|
| 6 |
"DeepSeek-V3-0324": 32768,
|
| 7 |
"E5-Mistral-7B-Instruct": 4096,
|
|
|
|
| 15 |
"Meta-Llama-Guard-3-8B": 16384,
|
| 16 |
"QwQ-32B": 16384,
|
| 17 |
"Qwen2-Audio-7B-Instruct": 4096,
|
| 18 |
+
"Qwen3-32B": 32768,
|
| 19 |
"Whisper-Large-v3": 4096
|
| 20 |
},
|
| 21 |
"nebius": {
|
|
|
|
| 46 |
"microsoft/phi-4": 16384,
|
| 47 |
"deepseek-ai/DeepSeek-V3": 163840,
|
| 48 |
"deepseek-ai/DeepSeek-R1": 163840,
|
| 49 |
+
"deepseek-ai/DeepSeek-R1-0528": 163840,
|
| 50 |
"NousResearch/Hermes-3-Llama-405B": 131072,
|
| 51 |
"deepseek-ai/DeepSeek-R1-Distill-Llama-70B": 131072,
|
| 52 |
"deepseek-ai/DeepSeek-R1-fast": 163840,
|
|
|
|
| 71 |
"stability-ai/sdxl": 0
|
| 72 |
},
|
| 73 |
"novita": {
|
| 74 |
+
"deepseek/deepseek-r1-0528": 128000,
|
| 75 |
+
"deepseek/deepseek-r1-0528-qwen3-8b": 128000,
|
| 76 |
"deepseek/deepseek-v3-0324": 128000,
|
| 77 |
"qwen/qwen3-235b-a22b-fp8": 40960,
|
| 78 |
"qwen/qwen3-30b-a3b-fp8": 40960,
|
| 79 |
"qwen/qwen3-32b-fp8": 40960,
|
| 80 |
+
"qwen/qwen2.5-vl-72b-instruct": 32768,
|
| 81 |
"deepseek/deepseek-v3-turbo": 64000,
|
| 82 |
"meta-llama/llama-4-maverick-17b-128e-instruct-fp8": 1048576,
|
| 83 |
"google/gemma-3-27b-it": 32000,
|
|
|
|
| 84 |
"deepseek/deepseek-r1-turbo": 64000,
|
| 85 |
"Sao10K/L3-8B-Stheno-v3.2": 8192,
|
| 86 |
"gryphe/mythomax-l2-13b": 4096,
|
|
|
|
| 91 |
"deepseek/deepseek-r1-distill-qwen-14b": 64000,
|
| 92 |
"meta-llama/llama-3.3-70b-instruct": 131072,
|
| 93 |
"qwen/qwen-2.5-72b-instruct": 32000,
|
| 94 |
+
"mistralai/mistral-nemo": 60288,
|
| 95 |
"deepseek/deepseek-r1-distill-qwen-32b": 64000,
|
| 96 |
"meta-llama/llama-3-8b-instruct": 8192,
|
| 97 |
"microsoft/wizardlm-2-8x22b": 65535,
|
| 98 |
"deepseek/deepseek-r1-distill-llama-70b": 32000,
|
|
|
|
|
|
|
| 99 |
"mistralai/mistral-7b-instruct": 32768,
|
| 100 |
"meta-llama/llama-3-70b-instruct": 8192,
|
| 101 |
"nousresearch/hermes-2-pro-llama-3-8b": 8192,
|
|
|
|
| 103 |
"cognitivecomputations/dolphin-mixtral-8x22b": 16000,
|
| 104 |
"sophosympatheia/midnight-rose-70b": 4096,
|
| 105 |
"sao10k/l3-8b-lunaris": 8192,
|
|
|
|
|
|
|
|
|
|
| 106 |
"qwen/qwen3-8b-fp8": 128000,
|
| 107 |
"qwen/qwen3-4b-fp8": 128000,
|
|
|
|
| 108 |
"thudm/glm-4-9b-0414": 32000,
|
| 109 |
"thudm/glm-z1-9b-0414": 32000,
|
| 110 |
"thudm/glm-z1-32b-0414": 32000,
|
|
|
|
| 112 |
"thudm/glm-z1-rumination-32b-0414": 32000,
|
| 113 |
"qwen/qwen2.5-7b-instruct": 32000,
|
| 114 |
"meta-llama/llama-3.2-1b-instruct": 131000,
|
|
|
|
| 115 |
"meta-llama/llama-3.2-3b-instruct": 32768,
|
| 116 |
"meta-llama/llama-3.1-8b-instruct-bf16": 8192,
|
| 117 |
"sao10k/l31-70b-euryale-v2.2": 8192
|
|
|
|
| 133 |
"deepseek-ai/DeepSeek-V3": 131072,
|
| 134 |
"deepseek-ai/DeepSeek-V3-0324": 163840,
|
| 135 |
"meta-llama/Llama-3.3-70B-Instruct": 131072,
|
|
|
|
| 136 |
"Qwen/Qwen2.5-Coder-32B-Instruct": 32768,
|
| 137 |
"meta-llama/Llama-3.2-3B-Instruct": 131072,
|
| 138 |
"NousResearch/Hermes-3-Llama-3.1-70B": 12288,
|
|
|
|
| 141 |
"meta-llama/Meta-Llama-3.1-8B-Instruct": 131072,
|
| 142 |
"mistralai/Pixtral-12B-2409": 32768,
|
| 143 |
"Qwen/Qwen2.5-VL-7B-Instruct": 32768,
|
|
|
|
| 144 |
"meta-llama/Meta-Llama-3.1-405B-FP8": 32768,
|
| 145 |
"deepseek-ai/DeepSeek-R1": 163840,
|
| 146 |
"Qwen/QwQ-32B": 131072
|
|
|
|
| 169 |
"command": 4096
|
| 170 |
},
|
| 171 |
"together": {
|
|
|
|
| 172 |
"togethercomputer/m2-bert-80M-32k-retrieval": 32768,
|
| 173 |
"cartesia/sonic": 0,
|
|
|
|
| 174 |
"meta-llama-llama-2-70b-hf": 4096,
|
|
|
|
| 175 |
"intfloat/multilingual-e5-large-instruct": 514,
|
|
|
|
|
|
|
| 176 |
"Gryphe/MythoMax-L2-13b": 4096,
|
| 177 |
"Alibaba-NLP/gte-modernbert-base": 8192,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 178 |
"meta-llama/LlamaGuard-2-8b": 8192,
|
| 179 |
"cartesia/sonic-2": 0,
|
| 180 |
"togethercomputer/m2-bert-80M-8k-retrieval": 8192,
|
| 181 |
+
"deepseek-ai/DeepSeek-R1": 163840,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 182 |
"togethercomputer/MoA-1": 32768,
|
| 183 |
"meta-llama/Meta-Llama-3-70B-Instruct-Turbo": 8192,
|
|
|
|
|
|
|
| 184 |
"Gryphe/MythoMax-L2-13b-Lite": 4096,
|
| 185 |
"meta-llama/Meta-Llama-Guard-3-8B": 8192,
|
| 186 |
+
"deepseek-ai/DeepSeek-V3": 131072,
|
| 187 |
+
"mistralai/Mixtral-8x7B-Instruct-v0.1": 32768,
|
| 188 |
+
"meta-llama/Llama-Vision-Free": 131072,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 189 |
"meta-llama/Llama-3-8b-chat-hf": 8192,
|
| 190 |
+
"mistralai/Mistral-7B-Instruct-v0.1": 32768,
|
| 191 |
+
"BAAI/bge-base-en-v1.5-vllm": 512,
|
| 192 |
+
"meta-llama/Llama-2-70b-hf": 4096,
|
| 193 |
"togethercomputer/MoA-1-Turbo": 32768,
|
|
|
|
|
|
|
| 194 |
"meta-llama/Meta-Llama-3-8B-Instruct-Lite": 8192,
|
| 195 |
+
"black-forest-labs/FLUX.1-kontext-max": 0,
|
|
|
|
|
|
|
|
|
|
|
|
|
| 196 |
"mistralai/Mistral-7B-Instruct-v0.2": 32768,
|
| 197 |
"deepseek-ai/DeepSeek-V3-p-dp": 131072,
|
|
|
|
| 198 |
"Qwen/Qwen2-72B-Instruct": 32768,
|
| 199 |
"mistralai/Mistral-7B-Instruct-v0.3": 32768,
|
| 200 |
+
"NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO": 32768,
|
| 201 |
+
"meta-llama/Llama-3.2-11B-Vision-Instruct-Turbo": 131072,
|
| 202 |
"meta-llama/Llama-Guard-3-11B-Vision-Turbo": 131072,
|
| 203 |
+
"google/gemma-2-27b-it": 8192,
|
| 204 |
+
"togethercomputer/Refuel-Llm-V2-Small": 8192,
|
| 205 |
+
"Qwen/Qwen2-VL-72B-Instruct": 32768,
|
| 206 |
+
"meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo": 131072,
|
| 207 |
+
"meta-llama/Llama-3.2-90B-Vision-Instruct-Turbo": 131072,
|
| 208 |
+
"scb10x/scb10x-llama3-1-typhoon2-70b-instruct": 8192,
|
| 209 |
+
"arcee-ai/maestro-reasoning": 131072,
|
| 210 |
+
"arcee_ai/arcee-spotlight": 131072,
|
| 211 |
+
"togethercomputer/Refuel-Llm-V2": 16384,
|
| 212 |
+
"arcee-ai/arcee-blitz": 32768,
|
| 213 |
+
"perplexity-ai/r1-1776": 163840,
|
| 214 |
+
"meta-llama/Llama-4-Scout-17B-16E-Instruct": 1048576,
|
| 215 |
+
"Salesforce/Llama-Rank-V1": 8192,
|
| 216 |
+
"Qwen/Qwen2.5-Coder-32B-Instruct": 16384,
|
| 217 |
"meta-llama/Llama-3.2-3B-Instruct-Turbo": 131072,
|
| 218 |
+
"arcee-ai/virtuoso-medium-v2": 131072,
|
| 219 |
+
"arcee-ai/coder-large": 32768,
|
| 220 |
+
"meta-llama/Llama-Guard-4-12B": 1048576,
|
| 221 |
+
"deepseek-ai/DeepSeek-R1-Distill-Qwen-14B": 131072,
|
| 222 |
+
"arcee-ai/virtuoso-large": 131072,
|
| 223 |
+
"Qwen/Qwen2.5-VL-72B-Instruct": 32768,
|
| 224 |
+
"Qwen/Qwen2.5-72B-Instruct-Turbo": 131072,
|
| 225 |
+
"meta-llama/Llama-3-70b-chat-hf": 8192,
|
| 226 |
+
"deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B": 131072,
|
| 227 |
+
"deepseek-ai/DeepSeek-R1-Distill-Llama-70B": 131072,
|
| 228 |
+
"meta-llama/Llama-3.3-70B-Instruct-Turbo-Free": 131072,
|
| 229 |
+
"nvidia/Llama-3.1-Nemotron-70B-Instruct-HF": 32768,
|
| 230 |
+
"Qwen/QwQ-32B": 131072,
|
| 231 |
+
"deepseek-ai/DeepSeek-R1-Distill-Llama-70B-free": 8192,
|
| 232 |
+
"Qwen/Qwen3-235B-A22B-fp8-tput": 40960,
|
| 233 |
+
"mistralai/Mistral-Small-24B-Instruct-2501": 32768,
|
| 234 |
+
"meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8": 1048576,
|
| 235 |
+
"marin-community/marin-8b-instruct": 131072,
|
| 236 |
+
"Qwen/Qwen2.5-7B-Instruct-Turbo": 32768,
|
| 237 |
+
"meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo": 131072,
|
| 238 |
"meta-llama/Llama-3.3-70B-Instruct-Turbo": 131072,
|
| 239 |
+
"meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo": 130815,
|
| 240 |
+
"scb10x/scb10x-typhoon-2-1-gemma3-12b": 8192,
|
| 241 |
+
"arcee-ai/caller": 32768,
|
| 242 |
+
"black-forest-labs/FLUX.1-kontext-pro": 0,
|
| 243 |
+
"lgai/exaone-deep-32b": 32768,
|
| 244 |
+
"lgai/exaone-3-5-32b-instruct": 32768
|
| 245 |
},
|
| 246 |
"fireworks-ai": {
|
| 247 |
"accounts/fireworks/models/qwq-32b": 131072,
|
|
|
|
| 253 |
"accounts/fireworks/models/llama4-scout-instruct-basic": 1048576,
|
| 254 |
"accounts/fireworks/models/qwen2-vl-72b-instruct": 32768,
|
| 255 |
"accounts/fireworks/models/firesearch-ocr-v6": 131072,
|
| 256 |
+
"accounts/fireworks/models/deepseek-r1-0528": 163840,
|
| 257 |
"accounts/fireworks/models/deepseek-v3": 131072,
|
| 258 |
"accounts/fireworks/models/llama-v3p1-8b-instruct": 131072,
|
| 259 |
"accounts/fireworks/models/llama-v3p1-70b-instruct": 131072,
|
|
|
|
| 263 |
"accounts/fireworks/models/deepseek-r1": 163840,
|
| 264 |
"accounts/sentientfoundation/models/dobby-unhinged-llama-3-3-70b-new": 131072,
|
| 265 |
"accounts/perplexity/models/r1-1776": 163840,
|
| 266 |
+
"accounts/sentientfoundation-serverless/models/dobby-mini-unhinged-plus-llama-3-1-8b": 131072,
|
| 267 |
"accounts/fireworks/models/llama-v3p1-405b-instruct": 131072,
|
| 268 |
"accounts/fireworks/models/mixtral-8x22b-instruct": 65536,
|
| 269 |
"accounts/fireworks/models/qwen2p5-72b-instruct": 32768
|
src/lib/types.ts
CHANGED
|
@@ -62,7 +62,7 @@ export type CustomModel = {
|
|
| 62 |
export type Config = {
|
| 63 |
architectures: string[];
|
| 64 |
model_type: string;
|
| 65 |
-
tokenizer_config
|
| 66 |
auto_map?: AutoMap;
|
| 67 |
quantization_config?: QuantizationConfig;
|
| 68 |
};
|
|
@@ -165,6 +165,7 @@ export enum Provider {
|
|
| 165 |
export enum Status {
|
| 166 |
Live = "live",
|
| 167 |
Staging = "staging",
|
|
|
|
| 168 |
}
|
| 169 |
|
| 170 |
export enum Task {
|
|
|
|
| 62 |
export type Config = {
|
| 63 |
architectures: string[];
|
| 64 |
model_type: string;
|
| 65 |
+
tokenizer_config?: TokenizerConfig;
|
| 66 |
auto_map?: AutoMap;
|
| 67 |
quantization_config?: QuantizationConfig;
|
| 68 |
};
|
|
|
|
| 165 |
export enum Status {
|
| 166 |
Live = "live",
|
| 167 |
Staging = "staging",
|
| 168 |
+
Error = "error",
|
| 169 |
}
|
| 170 |
|
| 171 |
export enum Task {
|
src/lib/utils/business.svelte.ts
CHANGED
|
@@ -342,25 +342,11 @@ export function getInferenceSnippet(
|
|
| 342 |
{ ...model, inference: "" },
|
| 343 |
accessToken,
|
| 344 |
provider,
|
| 345 |
-
|
|
|
|
| 346 |
opts
|
| 347 |
);
|
| 348 |
|
| 349 |
-
if (opts?.structured_output && !structuredForbiddenProviders.includes(provider as Provider)) {
|
| 350 |
-
allSnippets.forEach(s => {
|
| 351 |
-
const modified = modifySnippet(s.content, { prop: "hi" });
|
| 352 |
-
if (s.content === modified) {
|
| 353 |
-
console.log("Failed for", s.language, "\n");
|
| 354 |
-
} else {
|
| 355 |
-
console.log("Original snippet");
|
| 356 |
-
console.log(s.content);
|
| 357 |
-
console.log("\nModified");
|
| 358 |
-
console.log(modified);
|
| 359 |
-
console.log();
|
| 360 |
-
}
|
| 361 |
-
});
|
| 362 |
-
}
|
| 363 |
-
|
| 364 |
return allSnippets
|
| 365 |
.filter(s => s.language === language)
|
| 366 |
.map(s => {
|
|
|
|
| 342 |
{ ...model, inference: "" },
|
| 343 |
accessToken,
|
| 344 |
provider,
|
| 345 |
+
// eslint-disable-next-line @typescript-eslint/no-explicit-any
|
| 346 |
+
{ ...providerMapping, hfModelId: model.id } as any,
|
| 347 |
opts
|
| 348 |
);
|
| 349 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 350 |
return allSnippets
|
| 351 |
.filter(s => s.language === language)
|
| 352 |
.map(s => {
|