Spaces:

hsuwill000
/

ESP01LLMSample

Sleeping

hsuwill000 committed 18 days ago

Commit

844f989

verified ·

1 Parent(s): bbd2fc4

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -209,7 +209,7 @@ async def root():
 # --- 7. FastAPI 路由: /infer4 (極簡版) ---
-@app.post("/infer4", summary="執行 LLM 推論 (v4: 極簡輸入/僅回傳 response 欄位)")
 async def infer4_endpoint(request: InferenceRequestMinimal):
     FIXED_SYSTEM_MESSAGE = "You are a friendly and concise assistant."
     FIXED_MAX_TOKENS = 4096
@@ -239,7 +239,7 @@ async def infer4_endpoint(request: InferenceRequestMinimal):
 # --- 8. FastAPI 路由: /infer_amd (使用 Gradio Client) ---
-@app.post("/infer_amd", summary="使用 Gradio Client 呼叫外部 AMD LLM Space")
 async def infer_amd_endpoint(request: InferenceRequestMinimal):
     """
     使用 gradio_client 呼叫 AMD_SPACE_ID 所指定的 Space 的 /chat API。

 # --- 7. FastAPI 路由: /infer4 (極簡版) ---
+@app.post("/local/qwen-0-6b", summary="執行 LLM 推論 (v4: 極簡輸入/僅回傳 response 欄位)")
 async def infer4_endpoint(request: InferenceRequestMinimal):
     FIXED_SYSTEM_MESSAGE = "You are a friendly and concise assistant."
     FIXED_MAX_TOKENS = 4096
 # --- 8. FastAPI 路由: /infer_amd (使用 Gradio Client) ---
+@app.post("/remote/amd", summary="使用 Gradio Client 呼叫外部 AMD LLM Space")
 async def infer_amd_endpoint(request: InferenceRequestMinimal):
     """
     使用 gradio_client 呼叫 AMD_SPACE_ID 所指定的 Space 的 /chat API。