Thomas G. Lopes
committed on
Commit
·
33e2c0d
1
Parent(s):
893b0be
ctrl g shortcut
Browse files
src/lib/components/inference-playground/message.svelte
CHANGED
@@ -16,6 +16,7 @@
|
|
16 |
import LocalToasts from "../local-toasts.svelte";
|
17 |
import ImgPreview from "./img-preview.svelte";
|
18 |
import { TEST_IDS } from "$lib/constants.js";
|
|
|
19 |
|
20 |
type Props = {
|
21 |
conversation: ConversationClass;
|
@@ -103,6 +104,13 @@
|
|
103 |
if (!message || !content) return;
|
104 |
conversation.updateMessage({ index, message: { ...message, content } });
|
105 |
}}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
106 |
placeholder="Enter {message?.role} message"
|
107 |
class="grow resize-none overflow-hidden rounded-lg bg-transparent px-2 py-2.5 ring-gray-100 outline-none group-hover/message:ring-3 hover:bg-white focus:bg-white focus:ring-3 @2xl:px-3 dark:ring-gray-600 dark:hover:bg-gray-900 dark:focus:bg-gray-900"
|
108 |
rows="1"
|
@@ -182,7 +190,15 @@
|
|
182 |
<IconCustom icon={message.role === "user" ? "regen" : "refresh"} />
|
183 |
</button>
|
184 |
{/snippet}
|
185 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
186 |
</Tooltip>
|
187 |
|
188 |
<Tooltip>
|
|
|
16 |
import LocalToasts from "../local-toasts.svelte";
|
17 |
import ImgPreview from "./img-preview.svelte";
|
18 |
import { TEST_IDS } from "$lib/constants.js";
|
19 |
+
import { cmdOrCtrl } from "$lib/utils/platform.js";
|
20 |
|
21 |
type Props = {
|
22 |
conversation: ConversationClass;
|
|
|
104 |
if (!message || !content) return;
|
105 |
conversation.updateMessage({ index, message: { ...message, content } });
|
106 |
}}
|
107 |
+
onkeydown={e => {
|
108 |
+
if ((e.ctrlKey || e.metaKey) && e.key === "g") {
|
109 |
+
e.preventDefault();
|
110 |
+
e.stopPropagation();
|
111 |
+
onRegen?.();
|
112 |
+
}
|
113 |
+
}}
|
114 |
placeholder="Enter {message?.role} message"
|
115 |
class="grow resize-none overflow-hidden rounded-lg bg-transparent px-2 py-2.5 ring-gray-100 outline-none group-hover/message:ring-3 hover:bg-white focus:bg-white focus:ring-3 @2xl:px-3 dark:ring-gray-600 dark:hover:bg-gray-900 dark:focus:bg-gray-900"
|
116 |
rows="1"
|
|
|
190 |
<IconCustom icon={message.role === "user" ? "regen" : "refresh"} />
|
191 |
</button>
|
192 |
{/snippet}
|
193 |
+
<div class="flex items-center gap-2">
|
194 |
+
{regenLabel}
|
195 |
+
|
196 |
+
<span
|
197 |
+
class="inline-flex items-center gap-0.5 rounded-sm border border-white/20 bg-white/10 px-0.5 text-xs text-white/70"
|
198 |
+
>
|
199 |
+
{cmdOrCtrl}<span class="">G</span>
|
200 |
+
</span>
|
201 |
+
</div>
|
202 |
</Tooltip>
|
203 |
|
204 |
<Tooltip>
|
src/lib/data/context_length.json
CHANGED
@@ -21,36 +21,15 @@
|
|
21 |
"nebius": {
|
22 |
"meta-llama/Meta-Llama-3.1-8B-Instruct-fast": 131072,
|
23 |
"meta-llama/Meta-Llama-3.1-8B-Instruct": 131072,
|
24 |
-
"meta-llama/Meta-Llama-3.1-70B-Instruct-fast": 131072,
|
25 |
"meta-llama/Meta-Llama-3.1-70B-Instruct": 131072,
|
26 |
"meta-llama/Meta-Llama-3.1-405B-Instruct": 131072,
|
27 |
"meta-llama/Llama-Guard-3-8B": 131072,
|
28 |
-
"nvidia/Llama-3.1-Nemotron-70B-Instruct-HF-fast": 131072,
|
29 |
-
"nvidia/Llama-3.1-Nemotron-70B-Instruct-HF": 131072,
|
30 |
"nvidia/Llama-3_1-Nemotron-Ultra-253B-v1": 131072,
|
31 |
-
"mistralai/Mistral-Nemo-Instruct-2407-fast": 128000,
|
32 |
"mistralai/Mistral-Nemo-Instruct-2407": 128000,
|
33 |
-
"mistralai/Mixtral-8x7B-Instruct-v0.1-fast": 32768,
|
34 |
-
"mistralai/Mixtral-8x7B-Instruct-v0.1": 32768,
|
35 |
-
"mistralai/Mixtral-8x22B-Instruct-v0.1-fast": 65536,
|
36 |
-
"mistralai/Mixtral-8x22B-Instruct-v0.1": 65536,
|
37 |
-
"allenai/OLMo-7B-Instruct-hf": 2048,
|
38 |
-
"microsoft/Phi-3-mini-4k-instruct-fast": 4096,
|
39 |
-
"microsoft/Phi-3-mini-4k-instruct": 4096,
|
40 |
-
"microsoft/Phi-3-medium-128k-instruct-fast": 131072,
|
41 |
-
"microsoft/Phi-3-medium-128k-instruct": 131072,
|
42 |
-
"google/gemma-2-2b-it-fast": 8192,
|
43 |
"google/gemma-2-2b-it": 8192,
|
44 |
"google/gemma-2-9b-it-fast": 8192,
|
45 |
-
"google/gemma-2-9b-it": 8192,
|
46 |
-
"google/gemma-2-27b-it-fast": 8192,
|
47 |
-
"google/gemma-2-27b-it": 8192,
|
48 |
-
"deepseek-ai/DeepSeek-Coder-V2-Lite-Instruct-fast": 128000,
|
49 |
-
"deepseek-ai/DeepSeek-Coder-V2-Lite-Instruct": 128000,
|
50 |
"Qwen/Qwen2.5-Coder-7B-fast": 32768,
|
51 |
"Qwen/Qwen2.5-Coder-7B": 32768,
|
52 |
-
"Qwen/Qwen2.5-Coder-7B-Instruct-fast": 32768,
|
53 |
-
"Qwen/Qwen2.5-Coder-7B-Instruct": 32768,
|
54 |
"Qwen/Qwen2.5-Coder-32B-Instruct-fast": 131072,
|
55 |
"Qwen/Qwen2.5-Coder-32B-Instruct": 131072,
|
56 |
"Qwen/Qwen2.5-32B-Instruct-fast": 131072,
|
@@ -58,24 +37,12 @@
|
|
58 |
"Qwen/Qwen2.5-72B-Instruct-fast": 131072,
|
59 |
"Qwen/Qwen2.5-72B-Instruct": 131072,
|
60 |
"Qwen/Qwen2-VL-72B-Instruct": 32768,
|
61 |
-
"Qwen/Qwen2-VL-7B-Instruct": 32768,
|
62 |
-
"llava-hf/llava-1.5-7b-hf": 4096,
|
63 |
-
"llava-hf/llava-1.5-13b-hf": 4096,
|
64 |
-
"aaditya/Llama3-OpenBioLLM-8B": 8192,
|
65 |
"aaditya/Llama3-OpenBioLLM-70B": 8192,
|
66 |
"BAAI/bge-en-icl": 32768,
|
67 |
"BAAI/bge-multilingual-gemma2": 8192,
|
68 |
"intfloat/e5-mistral-7b-instruct": 32768,
|
69 |
-
"cognitivecomputations/dolphin-2.9.2-mixtral-8x22b": 65536,
|
70 |
-
"microsoft/Phi-3.5-MoE-instruct": 131072,
|
71 |
-
"microsoft/Phi-3.5-mini-instruct": 131072,
|
72 |
-
"Qwen/Qwen2.5-1.5B-Instruct": 32768,
|
73 |
"meta-llama/Llama-3.3-70B-Instruct": 131072,
|
74 |
"meta-llama/Llama-3.3-70B-Instruct-fast": 131072,
|
75 |
-
"meta-llama/Llama-3.2-1B-Instruct": 131072,
|
76 |
-
"meta-llama/Llama-3.2-3B-Instruct": 131072,
|
77 |
-
"Qwen/QwQ-32B-Preview": 32768,
|
78 |
-
"Qwen/QVQ-72B-preview": 128000,
|
79 |
"microsoft/phi-4": 16384,
|
80 |
"deepseek-ai/DeepSeek-V3": 163840,
|
81 |
"deepseek-ai/DeepSeek-R1": 163840,
|
@@ -88,6 +55,7 @@
|
|
88 |
"Qwen/Qwen3-30B-A3B": 40960,
|
89 |
"Qwen/Qwen3-30B-A3B-fast": 40960,
|
90 |
"Qwen/Qwen3-32B": 40960,
|
|
|
91 |
"Qwen/Qwen3-14B": 40960,
|
92 |
"Qwen/Qwen3-4B-fast": 40960,
|
93 |
"nvidia/Llama-3_3-Nemotron-Super-49B-v1": 131072,
|
@@ -117,7 +85,6 @@
|
|
117 |
"deepseek/deepseek-prover-v2-671b": 160000,
|
118 |
"meta-llama/llama-4-scout-17b-16e-instruct": 131072,
|
119 |
"deepseek/deepseek-r1-distill-llama-8b": 32000,
|
120 |
-
"deepseek/deepseek_v3": 64000,
|
121 |
"meta-llama/llama-3.1-8b-instruct": 16384,
|
122 |
"deepseek/deepseek-r1-distill-qwen-14b": 64000,
|
123 |
"meta-llama/llama-3.3-70b-instruct": 131072,
|
@@ -131,7 +98,6 @@
|
|
131 |
"google/gemma-2-9b-it": 8192,
|
132 |
"mistralai/mistral-7b-instruct": 32768,
|
133 |
"meta-llama/llama-3-70b-instruct": 8192,
|
134 |
-
"deepseek/deepseek-r1": 64000,
|
135 |
"nousresearch/hermes-2-pro-llama-3-8b": 8192,
|
136 |
"sao10k/l3-70b-euryale-v2.1": 8192,
|
137 |
"cognitivecomputations/dolphin-mixtral-8x22b": 16000,
|
@@ -210,13 +176,12 @@
|
|
210 |
"command": 4096
|
211 |
},
|
212 |
"together": {
|
213 |
-
"meta-llama/Llama-4-Scout-17B-16E-Instruct": 1048576,
|
214 |
"meta-llama/Llama-Guard-4-12B": 1048576,
|
215 |
"togethercomputer/m2-bert-80M-32k-retrieval": 32768,
|
216 |
"cartesia/sonic": 0,
|
217 |
"scb10x/scb10x-llama3-1-typhoon2-8b-instruct": 8192,
|
218 |
-
"deepseek-ai/DeepSeek-R1-Distill-Llama-70B-free": 8192,
|
219 |
"meta-llama-llama-2-70b-hf": 4096,
|
|
|
220 |
"intfloat/multilingual-e5-large-instruct": 514,
|
221 |
"BAAI/bge-base-en-v1.5": 512,
|
222 |
"meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo": 130815,
|
@@ -233,8 +198,11 @@
|
|
233 |
"meta-llama/LlamaGuard-2-8b": 8192,
|
234 |
"cartesia/sonic-2": 0,
|
235 |
"togethercomputer/m2-bert-80M-8k-retrieval": 8192,
|
|
|
|
|
|
|
236 |
"meta-llama/Llama-3.3-70B-Instruct-Turbo-Free": 131072,
|
237 |
-
"
|
238 |
"deepseek-ai/DeepSeek-V3": 131072,
|
239 |
"togethercomputer/Refuel-Llm-V2-Small": 8192,
|
240 |
"togethercomputer/MoA-1": 32768,
|
@@ -260,8 +228,6 @@
|
|
260 |
"togethercomputer/MoA-1-Turbo": 32768,
|
261 |
"perplexity-ai/r1-1776": 163840,
|
262 |
"NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO": 32768,
|
263 |
-
"deepseek-ai/DeepSeek-R1-Distill-Llama-70B": 131072,
|
264 |
-
"deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B": 131072,
|
265 |
"meta-llama/Meta-Llama-3-8B-Instruct-Lite": 8192,
|
266 |
"Qwen/Qwen3-235B-A22B-fp8": 40960,
|
267 |
"Qwen/Qwen3-235B-A22B-fp8-tput": 40960,
|
@@ -270,7 +236,6 @@
|
|
270 |
"scb10x/scb10x-llama3-1-typhoon2-70b-instruct": 8192,
|
271 |
"mistralai/Mistral-7B-Instruct-v0.2": 32768,
|
272 |
"deepseek-ai/DeepSeek-V3-p-dp": 131072,
|
273 |
-
"deepseek-ai/DeepSeek-R1-Distill-Qwen-14B": 131072,
|
274 |
"Qwen/Qwen2.5-Coder-32B-Instruct": 16384,
|
275 |
"Qwen/Qwen2-72B-Instruct": 32768,
|
276 |
"mistralai/Mistral-7B-Instruct-v0.3": 32768,
|
@@ -278,9 +243,10 @@
|
|
278 |
"meta-llama/Llama-Vision-Free": 131072,
|
279 |
"meta-llama/Llama-Guard-3-11B-Vision-Turbo": 131072,
|
280 |
"meta-llama/Llama-3.2-3B-Instruct-Turbo": 131072,
|
281 |
-
"arcee_ai/arcee-spotlight": 131072,
|
282 |
"meta-llama/Llama-3.3-70B-Instruct-Turbo": 131072,
|
283 |
-
"meta-llama/Llama-
|
|
|
|
|
284 |
},
|
285 |
"fireworks-ai": {
|
286 |
"accounts/fireworks/models/qwq-32b": 131072,
|
|
|
21 |
"nebius": {
|
22 |
"meta-llama/Meta-Llama-3.1-8B-Instruct-fast": 131072,
|
23 |
"meta-llama/Meta-Llama-3.1-8B-Instruct": 131072,
|
|
|
24 |
"meta-llama/Meta-Llama-3.1-70B-Instruct": 131072,
|
25 |
"meta-llama/Meta-Llama-3.1-405B-Instruct": 131072,
|
26 |
"meta-llama/Llama-Guard-3-8B": 131072,
|
|
|
|
|
27 |
"nvidia/Llama-3_1-Nemotron-Ultra-253B-v1": 131072,
|
|
|
28 |
"mistralai/Mistral-Nemo-Instruct-2407": 128000,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
29 |
"google/gemma-2-2b-it": 8192,
|
30 |
"google/gemma-2-9b-it-fast": 8192,
|
|
|
|
|
|
|
|
|
|
|
31 |
"Qwen/Qwen2.5-Coder-7B-fast": 32768,
|
32 |
"Qwen/Qwen2.5-Coder-7B": 32768,
|
|
|
|
|
33 |
"Qwen/Qwen2.5-Coder-32B-Instruct-fast": 131072,
|
34 |
"Qwen/Qwen2.5-Coder-32B-Instruct": 131072,
|
35 |
"Qwen/Qwen2.5-32B-Instruct-fast": 131072,
|
|
|
37 |
"Qwen/Qwen2.5-72B-Instruct-fast": 131072,
|
38 |
"Qwen/Qwen2.5-72B-Instruct": 131072,
|
39 |
"Qwen/Qwen2-VL-72B-Instruct": 32768,
|
|
|
|
|
|
|
|
|
40 |
"aaditya/Llama3-OpenBioLLM-70B": 8192,
|
41 |
"BAAI/bge-en-icl": 32768,
|
42 |
"BAAI/bge-multilingual-gemma2": 8192,
|
43 |
"intfloat/e5-mistral-7b-instruct": 32768,
|
|
|
|
|
|
|
|
|
44 |
"meta-llama/Llama-3.3-70B-Instruct": 131072,
|
45 |
"meta-llama/Llama-3.3-70B-Instruct-fast": 131072,
|
|
|
|
|
|
|
|
|
46 |
"microsoft/phi-4": 16384,
|
47 |
"deepseek-ai/DeepSeek-V3": 163840,
|
48 |
"deepseek-ai/DeepSeek-R1": 163840,
|
|
|
55 |
"Qwen/Qwen3-30B-A3B": 40960,
|
56 |
"Qwen/Qwen3-30B-A3B-fast": 40960,
|
57 |
"Qwen/Qwen3-32B": 40960,
|
58 |
+
"Qwen/Qwen3-32B-fast": 40960,
|
59 |
"Qwen/Qwen3-14B": 40960,
|
60 |
"Qwen/Qwen3-4B-fast": 40960,
|
61 |
"nvidia/Llama-3_3-Nemotron-Super-49B-v1": 131072,
|
|
|
85 |
"deepseek/deepseek-prover-v2-671b": 160000,
|
86 |
"meta-llama/llama-4-scout-17b-16e-instruct": 131072,
|
87 |
"deepseek/deepseek-r1-distill-llama-8b": 32000,
|
|
|
88 |
"meta-llama/llama-3.1-8b-instruct": 16384,
|
89 |
"deepseek/deepseek-r1-distill-qwen-14b": 64000,
|
90 |
"meta-llama/llama-3.3-70b-instruct": 131072,
|
|
|
98 |
"google/gemma-2-9b-it": 8192,
|
99 |
"mistralai/mistral-7b-instruct": 32768,
|
100 |
"meta-llama/llama-3-70b-instruct": 8192,
|
|
|
101 |
"nousresearch/hermes-2-pro-llama-3-8b": 8192,
|
102 |
"sao10k/l3-70b-euryale-v2.1": 8192,
|
103 |
"cognitivecomputations/dolphin-mixtral-8x22b": 16000,
|
|
|
176 |
"command": 4096
|
177 |
},
|
178 |
"together": {
|
|
|
179 |
"meta-llama/Llama-Guard-4-12B": 1048576,
|
180 |
"togethercomputer/m2-bert-80M-32k-retrieval": 32768,
|
181 |
"cartesia/sonic": 0,
|
182 |
"scb10x/scb10x-llama3-1-typhoon2-8b-instruct": 8192,
|
|
|
183 |
"meta-llama-llama-2-70b-hf": 4096,
|
184 |
+
"togethercomputer/Refuel-Llm-V2": 16384,
|
185 |
"intfloat/multilingual-e5-large-instruct": 514,
|
186 |
"BAAI/bge-base-en-v1.5": 512,
|
187 |
"meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo": 130815,
|
|
|
198 |
"meta-llama/LlamaGuard-2-8b": 8192,
|
199 |
"cartesia/sonic-2": 0,
|
200 |
"togethercomputer/m2-bert-80M-8k-retrieval": 8192,
|
201 |
+
"deepseek-ai/DeepSeek-R1-Distill-Qwen-14B": 131072,
|
202 |
+
"deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B": 131072,
|
203 |
+
"deepseek-ai/DeepSeek-R1-Distill-Llama-70B-free": 8192,
|
204 |
"meta-llama/Llama-3.3-70B-Instruct-Turbo-Free": 131072,
|
205 |
+
"deepseek-ai/DeepSeek-R1-Distill-Llama-70B": 131072,
|
206 |
"deepseek-ai/DeepSeek-V3": 131072,
|
207 |
"togethercomputer/Refuel-Llm-V2-Small": 8192,
|
208 |
"togethercomputer/MoA-1": 32768,
|
|
|
228 |
"togethercomputer/MoA-1-Turbo": 32768,
|
229 |
"perplexity-ai/r1-1776": 163840,
|
230 |
"NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO": 32768,
|
|
|
|
|
231 |
"meta-llama/Meta-Llama-3-8B-Instruct-Lite": 8192,
|
232 |
"Qwen/Qwen3-235B-A22B-fp8": 40960,
|
233 |
"Qwen/Qwen3-235B-A22B-fp8-tput": 40960,
|
|
|
236 |
"scb10x/scb10x-llama3-1-typhoon2-70b-instruct": 8192,
|
237 |
"mistralai/Mistral-7B-Instruct-v0.2": 32768,
|
238 |
"deepseek-ai/DeepSeek-V3-p-dp": 131072,
|
|
|
239 |
"Qwen/Qwen2.5-Coder-32B-Instruct": 16384,
|
240 |
"Qwen/Qwen2-72B-Instruct": 32768,
|
241 |
"mistralai/Mistral-7B-Instruct-v0.3": 32768,
|
|
|
243 |
"meta-llama/Llama-Vision-Free": 131072,
|
244 |
"meta-llama/Llama-Guard-3-11B-Vision-Turbo": 131072,
|
245 |
"meta-llama/Llama-3.2-3B-Instruct-Turbo": 131072,
|
|
|
246 |
"meta-llama/Llama-3.3-70B-Instruct-Turbo": 131072,
|
247 |
+
"meta-llama/Llama-4-Scout-17B-16E-Instruct": 1048576,
|
248 |
+
"meta-llama/Llama-2-70b-hf": 4096,
|
249 |
+
"arcee_ai/arcee-spotlight": 131072
|
250 |
},
|
251 |
"fireworks-ai": {
|
252 |
"accounts/fireworks/models/qwq-32b": 131072,
|