Spaces:

nuernie
/

ai-server

Paused

App Files Files Community

nuernie committed on May 17

Commit

0c553fd

1 Parent(s): bb2aa1c

adjust

Browse files

Files changed (2) hide show

app.py +25 -99
requirements.txt +5 -4

app.py CHANGED Viewed

@@ -4,6 +4,7 @@ import uvicorn
 from whisper_live.server import TranscriptionServer
 import logging
 import numpy as np
 # —————————————————————————————
 # Logging
@@ -11,17 +12,29 @@ import numpy as np
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
-# —————————————————————————————
-# Instantiate the shared TranscriptionServer
-# (e.g. this loads your model once)
-# —————————————————————————————
-transcription_server = TranscriptionServer()
 @asynccontextmanager
 async def lifespan(app: FastAPI):
-    # any startup logic here (e.g. preload models)
     yield
-    # any cleanup logic here
 app = FastAPI(
     title="Whisper Live Server",
@@ -33,103 +46,16 @@ app = FastAPI(
 async def root():
     return {
         "message": "Welcome to Whisper Live Server",
-        "websocket_endpoint": "/ws",
         "health_endpoint": "/health"
     }
 @app.get("/health")
 async def health_check():
-    return {"status": "healthy"}
-@app.websocket("/ws")
-async def websocket_endpoint(websocket: WebSocket):
-    await websocket.accept()
-    client_uid = None
-    config = {}
-    try:
-        # —————————————————————————————
-        # 1) Read the per‑client config JSON
-        #—————————————————————————————
-        config = await websocket.receive_json()
-        client_uid = config.get("uid")
-        if not client_uid:
-            await websocket.close(code=4000, reason="No client UID provided")
-            return
-        logger.info(f"Client connected: {client_uid} | Config: {config}")
-        # —————————————————————————————
-        # 2) Send back a SERVER_READY message
-        #—————————————————————————————
-        await websocket.send_json({
-            "uid": client_uid,
-            "message": "SERVER_READY",
-            "backend": "faster_whisper"
-        })
-        # —————————————————————————————
-        # 3) Configure the shared server for this client
-        #    (you can also patch transcription_server attributes here)
-        #—————————————————————————————
-        language = config.get("language", "de")
-        task     = config.get("task",     "transcribe")
-        model    = config.get("model",    "tiny")
-        use_vad  = config.get("use_vad",  True)
-        # If your TranscriptionServer.process_audio takes kwargs, you can pass them directly.
-        # Otherwise, you may need to set transcription_server.language = language, etc.
-        # —————————————————————————————
-        # 4) Enter the receive‑loop
-        #—————————————————————————————
-        while True:
-            msg = await websocket.receive()
-            # client closed connection
-            if msg["type"] == "websocket.disconnect":
-                break
-            # binary audio frames
-            if "bytes" in msg and msg["bytes"] is not None:
-                audio_data = np.frombuffer(msg["bytes"], dtype=np.float32)
-                # pass per‑client params into process_audio
-                segments = transcription_server.process_audio(
-                    audio_data,
-                    language=language,
-                    task=task,
-                    model=model,
-                    use_vad=use_vad
-                )
-                if segments:
-                    await websocket.send_json({
-                        "uid": client_uid,
-                        "segments": segments
-                    })
-            # text control messages
-            elif "text" in msg and msg["text"] == "END_OF_AUDIO":
-                logger.info(f"Client {client_uid} ended stream.")
-                break
-    except WebSocketDisconnect:
-        logger.warning(f"WebSocket disconnected: {client_uid}")
-    except Exception as e:
-        logger.error(f"WebSocket error: {e}")
-        if client_uid:
-            try:
-                await websocket.send_json({
-                    "uid": client_uid,
-                    "error": str(e)
-                })
-            except:
-                pass
-    finally:
-        await websocket.close()
 if __name__ == "__main__":
     uvicorn.run(app, host="0.0.0.0", port=7860)

 from whisper_live.server import TranscriptionServer
 import logging
 import numpy as np
+import threading
 # —————————————————————————————
 # Logging
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
+# Global server instance
+transcription_server = None
+server_thread = None
 @asynccontextmanager
 async def lifespan(app: FastAPI):
     """Run the transcription server for the lifetime of the FastAPI app.

     On startup a ``TranscriptionServer`` is created and its ``run`` method is
     started in a background daemon thread (host ``0.0.0.0``, port ``9090``,
     backend ``faster_whisper``). On shutdown ``cleanup()`` is called on the
     server instance.

     Args:
         app: The FastAPI application this lifespan is attached to (unused).
     """
     global transcription_server, server_thread

     # Startup: create and start the transcription server
     transcription_server = TranscriptionServer()
     server_thread = threading.Thread(
         target=transcription_server.run,
         kwargs={
             'host': '0.0.0.0',
             'port': 9090,  # WebSocket port for transcription
             'backend': 'faster_whisper',
         },
         name="whisper-live-server",
         # Daemon thread: a blocking run() must not keep the process alive
         # once the main thread exits.
         daemon=True,
     )
     server_thread.start()

     try:
         yield
     finally:
         # Cleanup runs even when the application exits through an exception,
         # and a failing cleanup is logged instead of aborting shutdown.
         if transcription_server is not None:
             try:
                 transcription_server.cleanup()
             except Exception:
                 # NOTE(review): confirm that the installed whisper_live
                 # version accepts cleanup() without arguments.
                 logger.exception("Transcription server cleanup failed")
 app = FastAPI(
     title="Whisper Live Server",
 async def root():
     return {
         "message": "Welcome to Whisper Live Server",
+        "websocket_endpoint": "ws://localhost:9090",  # Direct WebSocket connection
         "health_endpoint": "/health"
     }
 @app.get("/health")
 async def health_check():
     """Report whether the background transcription server is running.

     Returns:
         ``{"status": "healthy"}`` when the server instance exists and its
         thread is alive, otherwise ``{"status": "unhealthy"}``.
     """
     # The module globals are only read here, so no ``global`` statement is
     # needed. Both start out as None; the thread is checked explicitly so a
     # missing thread reports "unhealthy" instead of raising AttributeError.
     server_running = (
         transcription_server is not None
         and server_thread is not None
         and server_thread.is_alive()
     )
     return {"status": "healthy" if server_running else "unhealthy"}
 if __name__ == "__main__":
     # When this file is executed directly, serve the FastAPI app with
     # uvicorn on all interfaces, port 7860.
     uvicorn.run(app, host="0.0.0.0", port=7860)

requirements.txt CHANGED Viewed

@@ -1,7 +1,8 @@
-fastapi>=0.68.0
-uvicorn>=0.15.0
-websockets>=10.0
-numpy>=1.21.0
 faster-whisper==1.1.0
 PyAudio
 websocket-client

+fastapi==0.109.2
+uvicorn==0.27.1
+websockets==12.0
+numpy==1.26.4
+python-multipart==0.0.9
 faster-whisper==1.1.0
 PyAudio
 websocket-client