yzhuang committed on
Commit
9bb13ea
·
verified ·
1 Parent(s): 81f72df

Update server.py

Browse files
Files changed (1) hide show
  1. server.py +2 -2
server.py CHANGED
@@ -20,8 +20,8 @@ def launch_vllm_server(beta=1.0):
20
  "Qwen/Qwen3-4B",
21
  "--tensor-parallel-size", "1",
22
  "--enforce-eager",
23
- "--max-model-len", "2048",
24
- "--max-seq-len-to-capture", "2048",
25
  "--max-num-seqs", "36",
26
  "--host", "0.0.0.0",
27
  "--port", "8000",
 
20
  "Qwen/Qwen3-4B",
21
  "--tensor-parallel-size", "1",
22
  "--enforce-eager",
23
+ "--max-model-len", "4096",
24
+ "--max-seq-len-to-capture", "4096",
25
  "--max-num-seqs", "36",
26
  "--host", "0.0.0.0",
27
  "--port", "8000",