Thomas G. Lopes committed on
Commit
33e2c0d
·
1 Parent(s): 893b0be

ctrl g shortcut

Browse files
src/lib/components/inference-playground/message.svelte CHANGED
@@ -16,6 +16,7 @@
16
  import LocalToasts from "../local-toasts.svelte";
17
  import ImgPreview from "./img-preview.svelte";
18
  import { TEST_IDS } from "$lib/constants.js";
 
19
 
20
  type Props = {
21
  conversation: ConversationClass;
@@ -103,6 +104,13 @@
103
  if (!message || !content) return;
104
  conversation.updateMessage({ index, message: { ...message, content } });
105
  }}
 
 
 
 
 
 
 
106
  placeholder="Enter {message?.role} message"
107
  class="grow resize-none overflow-hidden rounded-lg bg-transparent px-2 py-2.5 ring-gray-100 outline-none group-hover/message:ring-3 hover:bg-white focus:bg-white focus:ring-3 @2xl:px-3 dark:ring-gray-600 dark:hover:bg-gray-900 dark:focus:bg-gray-900"
108
  rows="1"
@@ -182,7 +190,15 @@
182
  <IconCustom icon={message.role === "user" ? "regen" : "refresh"} />
183
  </button>
184
  {/snippet}
185
- {regenLabel}
 
 
 
 
 
 
 
 
186
  </Tooltip>
187
 
188
  <Tooltip>
 
16
  import LocalToasts from "../local-toasts.svelte";
17
  import ImgPreview from "./img-preview.svelte";
18
  import { TEST_IDS } from "$lib/constants.js";
19
+ import { cmdOrCtrl } from "$lib/utils/platform.js";
20
 
21
  type Props = {
22
  conversation: ConversationClass;
 
104
  if (!message || !content) return;
105
  conversation.updateMessage({ index, message: { ...message, content } });
106
  }}
107
+ onkeydown={e => {
108
+ if ((e.ctrlKey || e.metaKey) && e.key === "g") {
109
+ e.preventDefault();
110
+ e.stopPropagation();
111
+ onRegen?.();
112
+ }
113
+ }}
114
  placeholder="Enter {message?.role} message"
115
  class="grow resize-none overflow-hidden rounded-lg bg-transparent px-2 py-2.5 ring-gray-100 outline-none group-hover/message:ring-3 hover:bg-white focus:bg-white focus:ring-3 @2xl:px-3 dark:ring-gray-600 dark:hover:bg-gray-900 dark:focus:bg-gray-900"
116
  rows="1"
 
190
  <IconCustom icon={message.role === "user" ? "regen" : "refresh"} />
191
  </button>
192
  {/snippet}
193
+ <div class="flex items-center gap-2">
194
+ {regenLabel}
195
+
196
+ <span
197
+ class="inline-flex items-center gap-0.5 rounded-sm border border-white/20 bg-white/10 px-0.5 text-xs text-white/70"
198
+ >
199
+ {cmdOrCtrl}<span class="">G</span>
200
+ </span>
201
+ </div>
202
  </Tooltip>
203
 
204
  <Tooltip>
src/lib/data/context_length.json CHANGED
@@ -21,36 +21,15 @@
21
  "nebius": {
22
  "meta-llama/Meta-Llama-3.1-8B-Instruct-fast": 131072,
23
  "meta-llama/Meta-Llama-3.1-8B-Instruct": 131072,
24
- "meta-llama/Meta-Llama-3.1-70B-Instruct-fast": 131072,
25
  "meta-llama/Meta-Llama-3.1-70B-Instruct": 131072,
26
  "meta-llama/Meta-Llama-3.1-405B-Instruct": 131072,
27
  "meta-llama/Llama-Guard-3-8B": 131072,
28
- "nvidia/Llama-3.1-Nemotron-70B-Instruct-HF-fast": 131072,
29
- "nvidia/Llama-3.1-Nemotron-70B-Instruct-HF": 131072,
30
  "nvidia/Llama-3_1-Nemotron-Ultra-253B-v1": 131072,
31
- "mistralai/Mistral-Nemo-Instruct-2407-fast": 128000,
32
  "mistralai/Mistral-Nemo-Instruct-2407": 128000,
33
- "mistralai/Mixtral-8x7B-Instruct-v0.1-fast": 32768,
34
- "mistralai/Mixtral-8x7B-Instruct-v0.1": 32768,
35
- "mistralai/Mixtral-8x22B-Instruct-v0.1-fast": 65536,
36
- "mistralai/Mixtral-8x22B-Instruct-v0.1": 65536,
37
- "allenai/OLMo-7B-Instruct-hf": 2048,
38
- "microsoft/Phi-3-mini-4k-instruct-fast": 4096,
39
- "microsoft/Phi-3-mini-4k-instruct": 4096,
40
- "microsoft/Phi-3-medium-128k-instruct-fast": 131072,
41
- "microsoft/Phi-3-medium-128k-instruct": 131072,
42
- "google/gemma-2-2b-it-fast": 8192,
43
  "google/gemma-2-2b-it": 8192,
44
  "google/gemma-2-9b-it-fast": 8192,
45
- "google/gemma-2-9b-it": 8192,
46
- "google/gemma-2-27b-it-fast": 8192,
47
- "google/gemma-2-27b-it": 8192,
48
- "deepseek-ai/DeepSeek-Coder-V2-Lite-Instruct-fast": 128000,
49
- "deepseek-ai/DeepSeek-Coder-V2-Lite-Instruct": 128000,
50
  "Qwen/Qwen2.5-Coder-7B-fast": 32768,
51
  "Qwen/Qwen2.5-Coder-7B": 32768,
52
- "Qwen/Qwen2.5-Coder-7B-Instruct-fast": 32768,
53
- "Qwen/Qwen2.5-Coder-7B-Instruct": 32768,
54
  "Qwen/Qwen2.5-Coder-32B-Instruct-fast": 131072,
55
  "Qwen/Qwen2.5-Coder-32B-Instruct": 131072,
56
  "Qwen/Qwen2.5-32B-Instruct-fast": 131072,
@@ -58,24 +37,12 @@
58
  "Qwen/Qwen2.5-72B-Instruct-fast": 131072,
59
  "Qwen/Qwen2.5-72B-Instruct": 131072,
60
  "Qwen/Qwen2-VL-72B-Instruct": 32768,
61
- "Qwen/Qwen2-VL-7B-Instruct": 32768,
62
- "llava-hf/llava-1.5-7b-hf": 4096,
63
- "llava-hf/llava-1.5-13b-hf": 4096,
64
- "aaditya/Llama3-OpenBioLLM-8B": 8192,
65
  "aaditya/Llama3-OpenBioLLM-70B": 8192,
66
  "BAAI/bge-en-icl": 32768,
67
  "BAAI/bge-multilingual-gemma2": 8192,
68
  "intfloat/e5-mistral-7b-instruct": 32768,
69
- "cognitivecomputations/dolphin-2.9.2-mixtral-8x22b": 65536,
70
- "microsoft/Phi-3.5-MoE-instruct": 131072,
71
- "microsoft/Phi-3.5-mini-instruct": 131072,
72
- "Qwen/Qwen2.5-1.5B-Instruct": 32768,
73
  "meta-llama/Llama-3.3-70B-Instruct": 131072,
74
  "meta-llama/Llama-3.3-70B-Instruct-fast": 131072,
75
- "meta-llama/Llama-3.2-1B-Instruct": 131072,
76
- "meta-llama/Llama-3.2-3B-Instruct": 131072,
77
- "Qwen/QwQ-32B-Preview": 32768,
78
- "Qwen/QVQ-72B-preview": 128000,
79
  "microsoft/phi-4": 16384,
80
  "deepseek-ai/DeepSeek-V3": 163840,
81
  "deepseek-ai/DeepSeek-R1": 163840,
@@ -88,6 +55,7 @@
88
  "Qwen/Qwen3-30B-A3B": 40960,
89
  "Qwen/Qwen3-30B-A3B-fast": 40960,
90
  "Qwen/Qwen3-32B": 40960,
 
91
  "Qwen/Qwen3-14B": 40960,
92
  "Qwen/Qwen3-4B-fast": 40960,
93
  "nvidia/Llama-3_3-Nemotron-Super-49B-v1": 131072,
@@ -117,7 +85,6 @@
117
  "deepseek/deepseek-prover-v2-671b": 160000,
118
  "meta-llama/llama-4-scout-17b-16e-instruct": 131072,
119
  "deepseek/deepseek-r1-distill-llama-8b": 32000,
120
- "deepseek/deepseek_v3": 64000,
121
  "meta-llama/llama-3.1-8b-instruct": 16384,
122
  "deepseek/deepseek-r1-distill-qwen-14b": 64000,
123
  "meta-llama/llama-3.3-70b-instruct": 131072,
@@ -131,7 +98,6 @@
131
  "google/gemma-2-9b-it": 8192,
132
  "mistralai/mistral-7b-instruct": 32768,
133
  "meta-llama/llama-3-70b-instruct": 8192,
134
- "deepseek/deepseek-r1": 64000,
135
  "nousresearch/hermes-2-pro-llama-3-8b": 8192,
136
  "sao10k/l3-70b-euryale-v2.1": 8192,
137
  "cognitivecomputations/dolphin-mixtral-8x22b": 16000,
@@ -210,13 +176,12 @@
210
  "command": 4096
211
  },
212
  "together": {
213
- "meta-llama/Llama-4-Scout-17B-16E-Instruct": 1048576,
214
  "meta-llama/Llama-Guard-4-12B": 1048576,
215
  "togethercomputer/m2-bert-80M-32k-retrieval": 32768,
216
  "cartesia/sonic": 0,
217
  "scb10x/scb10x-llama3-1-typhoon2-8b-instruct": 8192,
218
- "deepseek-ai/DeepSeek-R1-Distill-Llama-70B-free": 8192,
219
  "meta-llama-llama-2-70b-hf": 4096,
 
220
  "intfloat/multilingual-e5-large-instruct": 514,
221
  "BAAI/bge-base-en-v1.5": 512,
222
  "meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo": 130815,
@@ -233,8 +198,11 @@
233
  "meta-llama/LlamaGuard-2-8b": 8192,
234
  "cartesia/sonic-2": 0,
235
  "togethercomputer/m2-bert-80M-8k-retrieval": 8192,
 
 
 
236
  "meta-llama/Llama-3.3-70B-Instruct-Turbo-Free": 131072,
237
- "togethercomputer/Refuel-Llm-V2": 16384,
238
  "deepseek-ai/DeepSeek-V3": 131072,
239
  "togethercomputer/Refuel-Llm-V2-Small": 8192,
240
  "togethercomputer/MoA-1": 32768,
@@ -260,8 +228,6 @@
260
  "togethercomputer/MoA-1-Turbo": 32768,
261
  "perplexity-ai/r1-1776": 163840,
262
  "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO": 32768,
263
- "deepseek-ai/DeepSeek-R1-Distill-Llama-70B": 131072,
264
- "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B": 131072,
265
  "meta-llama/Meta-Llama-3-8B-Instruct-Lite": 8192,
266
  "Qwen/Qwen3-235B-A22B-fp8": 40960,
267
  "Qwen/Qwen3-235B-A22B-fp8-tput": 40960,
@@ -270,7 +236,6 @@
270
  "scb10x/scb10x-llama3-1-typhoon2-70b-instruct": 8192,
271
  "mistralai/Mistral-7B-Instruct-v0.2": 32768,
272
  "deepseek-ai/DeepSeek-V3-p-dp": 131072,
273
- "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B": 131072,
274
  "Qwen/Qwen2.5-Coder-32B-Instruct": 16384,
275
  "Qwen/Qwen2-72B-Instruct": 32768,
276
  "mistralai/Mistral-7B-Instruct-v0.3": 32768,
@@ -278,9 +243,10 @@
278
  "meta-llama/Llama-Vision-Free": 131072,
279
  "meta-llama/Llama-Guard-3-11B-Vision-Turbo": 131072,
280
  "meta-llama/Llama-3.2-3B-Instruct-Turbo": 131072,
281
- "arcee_ai/arcee-spotlight": 131072,
282
  "meta-llama/Llama-3.3-70B-Instruct-Turbo": 131072,
283
- "meta-llama/Llama-2-70b-hf": 4096
 
 
284
  },
285
  "fireworks-ai": {
286
  "accounts/fireworks/models/qwq-32b": 131072,
 
21
  "nebius": {
22
  "meta-llama/Meta-Llama-3.1-8B-Instruct-fast": 131072,
23
  "meta-llama/Meta-Llama-3.1-8B-Instruct": 131072,
 
24
  "meta-llama/Meta-Llama-3.1-70B-Instruct": 131072,
25
  "meta-llama/Meta-Llama-3.1-405B-Instruct": 131072,
26
  "meta-llama/Llama-Guard-3-8B": 131072,
 
 
27
  "nvidia/Llama-3_1-Nemotron-Ultra-253B-v1": 131072,
 
28
  "mistralai/Mistral-Nemo-Instruct-2407": 128000,
 
 
 
 
 
 
 
 
 
 
29
  "google/gemma-2-2b-it": 8192,
30
  "google/gemma-2-9b-it-fast": 8192,
 
 
 
 
 
31
  "Qwen/Qwen2.5-Coder-7B-fast": 32768,
32
  "Qwen/Qwen2.5-Coder-7B": 32768,
 
 
33
  "Qwen/Qwen2.5-Coder-32B-Instruct-fast": 131072,
34
  "Qwen/Qwen2.5-Coder-32B-Instruct": 131072,
35
  "Qwen/Qwen2.5-32B-Instruct-fast": 131072,
 
37
  "Qwen/Qwen2.5-72B-Instruct-fast": 131072,
38
  "Qwen/Qwen2.5-72B-Instruct": 131072,
39
  "Qwen/Qwen2-VL-72B-Instruct": 32768,
 
 
 
 
40
  "aaditya/Llama3-OpenBioLLM-70B": 8192,
41
  "BAAI/bge-en-icl": 32768,
42
  "BAAI/bge-multilingual-gemma2": 8192,
43
  "intfloat/e5-mistral-7b-instruct": 32768,
 
 
 
 
44
  "meta-llama/Llama-3.3-70B-Instruct": 131072,
45
  "meta-llama/Llama-3.3-70B-Instruct-fast": 131072,
 
 
 
 
46
  "microsoft/phi-4": 16384,
47
  "deepseek-ai/DeepSeek-V3": 163840,
48
  "deepseek-ai/DeepSeek-R1": 163840,
 
55
  "Qwen/Qwen3-30B-A3B": 40960,
56
  "Qwen/Qwen3-30B-A3B-fast": 40960,
57
  "Qwen/Qwen3-32B": 40960,
58
+ "Qwen/Qwen3-32B-fast": 40960,
59
  "Qwen/Qwen3-14B": 40960,
60
  "Qwen/Qwen3-4B-fast": 40960,
61
  "nvidia/Llama-3_3-Nemotron-Super-49B-v1": 131072,
 
85
  "deepseek/deepseek-prover-v2-671b": 160000,
86
  "meta-llama/llama-4-scout-17b-16e-instruct": 131072,
87
  "deepseek/deepseek-r1-distill-llama-8b": 32000,
 
88
  "meta-llama/llama-3.1-8b-instruct": 16384,
89
  "deepseek/deepseek-r1-distill-qwen-14b": 64000,
90
  "meta-llama/llama-3.3-70b-instruct": 131072,
 
98
  "google/gemma-2-9b-it": 8192,
99
  "mistralai/mistral-7b-instruct": 32768,
100
  "meta-llama/llama-3-70b-instruct": 8192,
 
101
  "nousresearch/hermes-2-pro-llama-3-8b": 8192,
102
  "sao10k/l3-70b-euryale-v2.1": 8192,
103
  "cognitivecomputations/dolphin-mixtral-8x22b": 16000,
 
176
  "command": 4096
177
  },
178
  "together": {
 
179
  "meta-llama/Llama-Guard-4-12B": 1048576,
180
  "togethercomputer/m2-bert-80M-32k-retrieval": 32768,
181
  "cartesia/sonic": 0,
182
  "scb10x/scb10x-llama3-1-typhoon2-8b-instruct": 8192,
 
183
  "meta-llama-llama-2-70b-hf": 4096,
184
+ "togethercomputer/Refuel-Llm-V2": 16384,
185
  "intfloat/multilingual-e5-large-instruct": 514,
186
  "BAAI/bge-base-en-v1.5": 512,
187
  "meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo": 130815,
 
198
  "meta-llama/LlamaGuard-2-8b": 8192,
199
  "cartesia/sonic-2": 0,
200
  "togethercomputer/m2-bert-80M-8k-retrieval": 8192,
201
+ "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B": 131072,
202
+ "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B": 131072,
203
+ "deepseek-ai/DeepSeek-R1-Distill-Llama-70B-free": 8192,
204
  "meta-llama/Llama-3.3-70B-Instruct-Turbo-Free": 131072,
205
+ "deepseek-ai/DeepSeek-R1-Distill-Llama-70B": 131072,
206
  "deepseek-ai/DeepSeek-V3": 131072,
207
  "togethercomputer/Refuel-Llm-V2-Small": 8192,
208
  "togethercomputer/MoA-1": 32768,
 
228
  "togethercomputer/MoA-1-Turbo": 32768,
229
  "perplexity-ai/r1-1776": 163840,
230
  "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO": 32768,
 
 
231
  "meta-llama/Meta-Llama-3-8B-Instruct-Lite": 8192,
232
  "Qwen/Qwen3-235B-A22B-fp8": 40960,
233
  "Qwen/Qwen3-235B-A22B-fp8-tput": 40960,
 
236
  "scb10x/scb10x-llama3-1-typhoon2-70b-instruct": 8192,
237
  "mistralai/Mistral-7B-Instruct-v0.2": 32768,
238
  "deepseek-ai/DeepSeek-V3-p-dp": 131072,
 
239
  "Qwen/Qwen2.5-Coder-32B-Instruct": 16384,
240
  "Qwen/Qwen2-72B-Instruct": 32768,
241
  "mistralai/Mistral-7B-Instruct-v0.3": 32768,
 
243
  "meta-llama/Llama-Vision-Free": 131072,
244
  "meta-llama/Llama-Guard-3-11B-Vision-Turbo": 131072,
245
  "meta-llama/Llama-3.2-3B-Instruct-Turbo": 131072,
 
246
  "meta-llama/Llama-3.3-70B-Instruct-Turbo": 131072,
247
+ "meta-llama/Llama-4-Scout-17B-16E-Instruct": 1048576,
248
+ "meta-llama/Llama-2-70b-hf": 4096,
249
+ "arcee_ai/arcee-spotlight": 131072
250
  },
251
  "fireworks-ai": {
252
  "accounts/fireworks/models/qwq-32b": 131072,