Spaces:
Sleeping
Sleeping
update
Browse files
app.py
CHANGED
@@ -12,8 +12,8 @@ def chat_with_moi(message, history, temperature, top_p, beta):
|
|
12 |
# Set the MIXINPUTS_BETA env var *per request*
|
13 |
os.environ["MIXINPUTS_BETA"] = str(beta)
|
14 |
|
15 |
-
setup_mixinputs()
|
16 |
-
launch_vllm_server(beta=beta)
|
17 |
|
18 |
payload = {
|
19 |
"model": "Qwen/QwQ-32B", # match what your vLLM server expects
|
|
|
12 |
# Set the MIXINPUTS_BETA env var *per request*
|
13 |
os.environ["MIXINPUTS_BETA"] = str(beta)
|
14 |
|
15 |
+
# setup_mixinputs()
|
16 |
+
# launch_vllm_server(beta=beta)
|
17 |
|
18 |
payload = {
|
19 |
"model": "Qwen/QwQ-32B", # match what your vLLM server expects
|
server.py
CHANGED
@@ -7,6 +7,7 @@ def setup_mixinputs():
|
|
7 |
# Step 1: Run mixinputs setup
|
8 |
subprocess.run(["mixinputs", "setup"], check=True)
|
9 |
|
|
|
10 |
def launch_vllm_server(beta=1.0):
|
11 |
# Step 2: Set environment variables
|
12 |
env = os.environ.copy()
|
@@ -24,11 +25,11 @@ def launch_vllm_server(beta=1.0):
|
|
24 |
]
|
25 |
subprocess.run(cmd, env=env)
|
26 |
|
27 |
-
#
|
28 |
-
|
29 |
|
30 |
-
#
|
31 |
-
|
32 |
|
33 |
-
#
|
34 |
-
|
|
|
7 |
# Step 1: Run mixinputs setup
|
8 |
subprocess.run(["mixinputs", "setup"], check=True)
|
9 |
|
10 |
+
@spaces.GPU(duration=240)
|
11 |
def launch_vllm_server(beta=1.0):
|
12 |
# Step 2: Set environment variables
|
13 |
env = os.environ.copy()
|
|
|
25 |
]
|
26 |
subprocess.run(cmd, env=env)
|
27 |
|
28 |
+
# Step 1: Setup
|
29 |
+
setup_mixinputs()
|
30 |
|
31 |
+
# Step 2: Launch vLLM server in background
|
32 |
+
threading.Thread(target=launch_vllm_server, daemon=True).start()
|
33 |
|
34 |
+
# Step 3: Give time for server to initialize
|
35 |
+
time.sleep(20)
|