Thomas G. Lopes committed on
Commit
4148351
·
1 Parent(s): a76eef5

update ctx length

Browse files
Files changed (1) hide show
  1. src/lib/data/context_length.json +13 -12
src/lib/data/context_length.json CHANGED
@@ -15,7 +15,8 @@
15
  "Meta-Llama-Guard-3-8B": 16384,
16
  "QwQ-32B": 16384,
17
  "Qwen2-Audio-7B-Instruct": 4096,
18
- "Qwen3-32B": 8192
 
19
  },
20
  "nebius": {
21
  "meta-llama/Meta-Llama-3.1-8B-Instruct-fast": 131072,
@@ -121,7 +122,7 @@
121
  "deepseek/deepseek-r1-distill-qwen-14b": 64000,
122
  "meta-llama/llama-3.3-70b-instruct": 131072,
123
  "qwen/qwen-2.5-72b-instruct": 32000,
124
- "mistralai/mistral-nemo": 131072,
125
  "deepseek/deepseek-r1-distill-qwen-32b": 64000,
126
  "meta-llama/llama-3-8b-instruct": 8192,
127
  "microsoft/wizardlm-2-8x22b": 65535,
@@ -136,6 +137,7 @@
136
  "cognitivecomputations/dolphin-mixtral-8x22b": 16000,
137
  "sophosympatheia/midnight-rose-70b": 4096,
138
  "sao10k/l3-8b-lunaris": 8192,
 
139
  "qwen/qwen3-0.6b-fp8": 32000,
140
  "qwen/qwen3-1.7b-fp8": 32000,
141
  "qwen/qwen3-8b-fp8": 128000,
@@ -208,23 +210,28 @@
208
  "command": 4096
209
  },
210
  "together": {
211
- "Qwen/QwQ-32B": 131072,
212
  "meta-llama/Llama-4-Scout-17B-16E-Instruct": 1048576,
213
- "mistralai/Mistral-7B-Instruct-v0.1": 32768,
214
  "meta-llama/Llama-Guard-4-12B": 1048576,
215
  "togethercomputer/m2-bert-80M-32k-retrieval": 32768,
216
  "cartesia/sonic": 0,
217
  "scb10x/scb10x-llama3-1-typhoon2-8b-instruct": 8192,
218
- "Qwen/Qwen2.5-7B-Instruct-Turbo": 32768,
219
  "deepseek-ai/DeepSeek-R1-Distill-Llama-70B-free": 8192,
220
  "meta-llama-llama-2-70b-hf": 4096,
221
  "intfloat/multilingual-e5-large-instruct": 514,
222
  "BAAI/bge-base-en-v1.5": 512,
 
223
  "Gryphe/MythoMax-L2-13b": 4096,
224
  "Alibaba-NLP/gte-modernbert-base": 8192,
 
 
 
 
 
 
225
  "mistralai/Mixtral-8x7B-Instruct-v0.1": 32768,
226
  "google/gemma-2-27b-it": 8192,
227
  "Qwen/Qwen2-VL-72B-Instruct": 32768,
 
228
  "meta-llama/LlamaGuard-2-8b": 8192,
229
  "cartesia/sonic-2": 0,
230
  "togethercomputer/m2-bert-80M-8k-retrieval": 8192,
@@ -240,7 +247,6 @@
240
  "meta-llama/Meta-Llama-Guard-3-8B": 8192,
241
  "marin-community/marin-8b-instruct": 131072,
242
  "deepseek-ai/DeepSeek-R1": 163840,
243
- "meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo": 131072,
244
  "Qwen/Qwen2.5-VL-72B-Instruct": 32768,
245
  "arcee-ai/arcee-blitz": 32768,
246
  "arcee-ai/caller": 32768,
@@ -253,7 +259,6 @@
253
  "mistralai/Mistral-Small-24B-Instruct-2501": 32768,
254
  "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8": 1048576,
255
  "togethercomputer/MoA-1-Turbo": 32768,
256
- "meta-llama/Llama-3.3-70B-Instruct-Turbo": 131072,
257
  "perplexity-ai/r1-1776": 163840,
258
  "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO": 32768,
259
  "deepseek-ai/DeepSeek-R1-Distill-Llama-70B": 131072,
@@ -261,23 +266,19 @@
261
  "meta-llama/Meta-Llama-3-8B-Instruct-Lite": 8192,
262
  "Qwen/Qwen3-235B-A22B-fp8": 40960,
263
  "Qwen/Qwen3-235B-A22B-fp8-tput": 40960,
 
264
  "nvidia/Llama-3.1-Nemotron-70B-Instruct-HF": 32768,
265
- "arcee_ai/arcee-spotlight": 131072,
266
- "meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo": 130815,
267
  "scb10x/scb10x-llama3-1-typhoon2-70b-instruct": 8192,
268
- "meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo": 131072,
269
  "mistralai/Mistral-7B-Instruct-v0.2": 32768,
270
  "deepseek-ai/DeepSeek-V3-p-dp": 131072,
271
  "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B": 131072,
272
  "Qwen/Qwen2.5-Coder-32B-Instruct": 16384,
273
  "Qwen/Qwen2-72B-Instruct": 32768,
274
- "meta-llama/Llama-3-70b-chat-hf": 8192,
275
  "mistralai/Mistral-7B-Instruct-v0.3": 32768,
276
  "Salesforce/Llama-Rank-V1": 8192,
277
  "meta-llama/Llama-Vision-Free": 131072,
278
  "meta-llama/Llama-Guard-3-11B-Vision-Turbo": 131072,
279
  "meta-llama/Llama-3.2-3B-Instruct-Turbo": 131072,
280
- "Qwen/Qwen2.5-72B-Instruct-Turbo": 131072,
281
  "meta-llama/Llama-2-70b-hf": 4096
282
  },
283
  "fireworks-ai": {
 
15
  "Meta-Llama-Guard-3-8B": 16384,
16
  "QwQ-32B": 16384,
17
  "Qwen2-Audio-7B-Instruct": 4096,
18
+ "Qwen3-32B": 8192,
19
+ "Whisper-Large-v3": 4096
20
  },
21
  "nebius": {
22
  "meta-llama/Meta-Llama-3.1-8B-Instruct-fast": 131072,
 
122
  "deepseek/deepseek-r1-distill-qwen-14b": 64000,
123
  "meta-llama/llama-3.3-70b-instruct": 131072,
124
  "qwen/qwen-2.5-72b-instruct": 32000,
125
+ "mistralai/mistral-nemo": 64000,
126
  "deepseek/deepseek-r1-distill-qwen-32b": 64000,
127
  "meta-llama/llama-3-8b-instruct": 8192,
128
  "microsoft/wizardlm-2-8x22b": 65535,
 
137
  "cognitivecomputations/dolphin-mixtral-8x22b": 16000,
138
  "sophosympatheia/midnight-rose-70b": 4096,
139
  "sao10k/l3-8b-lunaris": 8192,
140
+ "pa/cd-op-4-20250514": 200000,
141
  "qwen/qwen3-0.6b-fp8": 32000,
142
  "qwen/qwen3-1.7b-fp8": 32000,
143
  "qwen/qwen3-8b-fp8": 128000,
 
210
  "command": 4096
211
  },
212
  "together": {
 
213
  "meta-llama/Llama-4-Scout-17B-16E-Instruct": 1048576,
 
214
  "meta-llama/Llama-Guard-4-12B": 1048576,
215
  "togethercomputer/m2-bert-80M-32k-retrieval": 32768,
216
  "cartesia/sonic": 0,
217
  "scb10x/scb10x-llama3-1-typhoon2-8b-instruct": 8192,
 
218
  "deepseek-ai/DeepSeek-R1-Distill-Llama-70B-free": 8192,
219
  "meta-llama-llama-2-70b-hf": 4096,
220
  "intfloat/multilingual-e5-large-instruct": 514,
221
  "BAAI/bge-base-en-v1.5": 512,
222
+ "meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo": 130815,
223
  "Gryphe/MythoMax-L2-13b": 4096,
224
  "Alibaba-NLP/gte-modernbert-base": 8192,
225
+ "mistralai/Mistral-7B-Instruct-v0.1": 32768,
226
+ "Qwen/Qwen2.5-7B-Instruct-Turbo": 32768,
227
+ "Qwen/Qwen2.5-72B-Instruct-Turbo": 131072,
228
+ "meta-llama/Llama-3.3-70B-Instruct-Turbo": 131072,
229
+ "Qwen/QwQ-32B": 131072,
230
+ "meta-llama/Llama-3-70b-chat-hf": 8192,
231
  "mistralai/Mixtral-8x7B-Instruct-v0.1": 32768,
232
  "google/gemma-2-27b-it": 8192,
233
  "Qwen/Qwen2-VL-72B-Instruct": 32768,
234
+ "meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo": 131072,
235
  "meta-llama/LlamaGuard-2-8b": 8192,
236
  "cartesia/sonic-2": 0,
237
  "togethercomputer/m2-bert-80M-8k-retrieval": 8192,
 
247
  "meta-llama/Meta-Llama-Guard-3-8B": 8192,
248
  "marin-community/marin-8b-instruct": 131072,
249
  "deepseek-ai/DeepSeek-R1": 163840,
 
250
  "Qwen/Qwen2.5-VL-72B-Instruct": 32768,
251
  "arcee-ai/arcee-blitz": 32768,
252
  "arcee-ai/caller": 32768,
 
259
  "mistralai/Mistral-Small-24B-Instruct-2501": 32768,
260
  "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8": 1048576,
261
  "togethercomputer/MoA-1-Turbo": 32768,
 
262
  "perplexity-ai/r1-1776": 163840,
263
  "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO": 32768,
264
  "deepseek-ai/DeepSeek-R1-Distill-Llama-70B": 131072,
 
266
  "meta-llama/Meta-Llama-3-8B-Instruct-Lite": 8192,
267
  "Qwen/Qwen3-235B-A22B-fp8": 40960,
268
  "Qwen/Qwen3-235B-A22B-fp8-tput": 40960,
269
+ "meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo": 131072,
270
  "nvidia/Llama-3.1-Nemotron-70B-Instruct-HF": 32768,
 
 
271
  "scb10x/scb10x-llama3-1-typhoon2-70b-instruct": 8192,
 
272
  "mistralai/Mistral-7B-Instruct-v0.2": 32768,
273
  "deepseek-ai/DeepSeek-V3-p-dp": 131072,
274
  "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B": 131072,
275
  "Qwen/Qwen2.5-Coder-32B-Instruct": 16384,
276
  "Qwen/Qwen2-72B-Instruct": 32768,
 
277
  "mistralai/Mistral-7B-Instruct-v0.3": 32768,
278
  "Salesforce/Llama-Rank-V1": 8192,
279
  "meta-llama/Llama-Vision-Free": 131072,
280
  "meta-llama/Llama-Guard-3-11B-Vision-Turbo": 131072,
281
  "meta-llama/Llama-3.2-3B-Instruct-Turbo": 131072,
 
282
  "meta-llama/Llama-2-70b-hf": 4096
283
  },
284
  "fireworks-ai": {