Spaces:
Sleeping
Sleeping
Update server.py
Browse files
server.py
CHANGED
@@ -20,8 +20,8 @@ def launch_vllm_server(beta=1.0):
|
|
20 |
"Qwen/Qwen3-4B",
|
21 |
"--tensor-parallel-size", "1",
|
22 |
"--enforce-eager",
|
23 |
-
"--max-model-len", "
|
24 |
-
"--max-seq-len-to-capture", "
|
25 |
"--max-num-seqs", "36",
|
26 |
"--host", "0.0.0.0",
|
27 |
"--port", "8000",
|
|
|
20 |
"Qwen/Qwen3-4B",
|
21 |
"--tensor-parallel-size", "1",
|
22 |
"--enforce-eager",
|
23 |
+
"--max-model-len", "4096",
|
24 |
+
"--max-seq-len-to-capture", "4096",
|
25 |
"--max-num-seqs", "36",
|
26 |
"--host", "0.0.0.0",
|
27 |
"--port", "8000",
|