Spaces:
Sleeping
Sleeping
update
Browse files
server.py
CHANGED
@@ -24,7 +24,8 @@ def launch_vllm_server(beta=1.0):
|
|
24 |
"--max-model-len", "2048",
|
25 |
"--max-seq-len-to-capture", "2048",
|
26 |
"--max-num-seqs", "1",
|
27 |
-
"--port", "8000"
|
|
|
28 |
]
|
29 |
subprocess.run(cmd, env=env)
|
30 |
|
|
|
24 |
"--max-model-len", "2048",
|
25 |
"--max-seq-len-to-capture", "2048",
|
26 |
"--max-num-seqs", "1",
|
27 |
+
"--port", "8000",
|
28 |
+
"--disable-async-output-proc"
|
29 |
]
|
30 |
subprocess.run(cmd, env=env)
|
31 |
|