yzhuang committed on
Commit
952fd8e
·
1 Parent(s): 873d420
Files changed (2) hide show
  1. app.py +2 -2
  2. server.py +7 -6
app.py CHANGED
@@ -12,8 +12,8 @@ def chat_with_moi(message, history, temperature, top_p, beta):
12
  # Set the MIXINPUTS_BETA env var *per request*
13
  os.environ["MIXINPUTS_BETA"] = str(beta)
14
 
15
- setup_mixinputs()
16
- launch_vllm_server(beta=beta)
17
 
18
  payload = {
19
  "model": "Qwen/QwQ-32B", # match what your vLLM server expects
 
12
  # Set the MIXINPUTS_BETA env var *per request*
13
  os.environ["MIXINPUTS_BETA"] = str(beta)
14
 
15
+ # setup_mixinputs()
16
+ # launch_vllm_server(beta=beta)
17
 
18
  payload = {
19
  "model": "Qwen/QwQ-32B", # match what your vLLM server expects
server.py CHANGED
@@ -7,6 +7,7 @@ def setup_mixinputs():
7
  # Step 1: Run mixinputs setup
8
  subprocess.run(["mixinputs", "setup"], check=True)
9
 
 
10
  def launch_vllm_server(beta=1.0):
11
  # Step 2: Set environment variables
12
  env = os.environ.copy()
@@ -24,11 +25,11 @@ def launch_vllm_server(beta=1.0):
24
  ]
25
  subprocess.run(cmd, env=env)
26
 
27
- # # Step 1: Setup
28
- # setup_mixinputs()
29
 
30
- # # Step 2: Launch vLLM server in background
31
- # threading.Thread(target=launch_vllm_server, daemon=True).start()
32
 
33
- # # Step 3: Give time for server to initialize
34
- # time.sleep(20)
 
7
  # Step 1: Run mixinputs setup
8
  subprocess.run(["mixinputs", "setup"], check=True)
9
 
10
+ @spaces.GPU(duration=240)
11
  def launch_vllm_server(beta=1.0):
12
  # Step 2: Set environment variables
13
  env = os.environ.copy()
 
25
  ]
26
  subprocess.run(cmd, env=env)
27
 
28
+ # Step 1: Setup
29
+ setup_mixinputs()
30
 
31
+ # Step 2: Launch vLLM server in background
32
+ threading.Thread(target=launch_vllm_server, daemon=True).start()
33
 
34
+ # Step 3: Give time for server to initialize
35
+ time.sleep(20)