Spaces:

Luigi
/

Streaming-Zipformer

Running

App Files Files Community

Luigi committed on Jun 8

Commit

a1d489d

1 Parent(s): 2632b6f

Remove the final transcript, as this demo performs ASR forever

Browse files

Files changed (3) hide show

app/asr_worker.py +1 -10
app/main.py +6 -25
app/static/index.html +1 -11

app/asr_worker.py CHANGED Viewed

@@ -170,13 +170,4 @@ def stream_audio(raw_pcm_bytes, stream, recognizer, orig_sr):
     if recognizer.is_ready(stream):
         recognizer.decode_streams([stream])
     result = recognizer.get_result(stream)
-    return converter.convert(result), rms
-def finalize_stream(stream, recognizer):
-    tail = np.zeros(int(0.66 * 16000), dtype=np.float32)
-    stream.accept_waveform(16000, tail)
-    stream.input_finished()
-    while recognizer.is_ready(stream):
-        recognizer.decode_streams([stream])
-    result = recognizer.get_result(stream)
-    return converter.convert(result)

     if recognizer.is_ready(stream):
         recognizer.decode_streams([stream])
     result = recognizer.get_result(stream)
+    return converter.convert(result), rms

app/main.py CHANGED Viewed

@@ -1,7 +1,7 @@
 from fastapi import FastAPI, WebSocket
 from fastapi.staticfiles import StaticFiles
 from fastapi.responses import HTMLResponse
-from app.asr_worker import create_recognizer, stream_audio, finalize_stream
 import json
 from starlette.websockets import WebSocketDisconnect
@@ -30,22 +30,10 @@ async def websocket_endpoint(websocket: WebSocket):
             data = await websocket.receive()
             kind = data.get("type")
-            # Handle control frames
             if kind not in ("websocket.receive", "websocket.receive_bytes"):
-                print(f"[DEBUG main] Received control/frame: {data}")
-                if kind == "websocket.disconnect":
-                    # On client disconnect, flush final transcript if possible
-                    if stream and recognizer:
-                        print(f"[INFO main] Client disconnected (code={data.get('code')}). Flushing final transcript...")
-                        final = finalize_stream(stream, recognizer)
-                        try:
-                            await websocket.send_json({"final": final})
-                        except (WebSocketDisconnect, RuntimeError):
-                            pass
-                    break
-                continue
-            # Handle text (config) frame
             if kind == "websocket.receive" and "text" in data:
                 raw = data["text"]
                 try:
@@ -81,7 +69,7 @@ async def websocket_endpoint(websocket: WebSocket):
                 await websocket.send_json({"partial": result, "volume": vol_to_send})
                 continue
-            elif isinstance(data, dict) and data.get("type") == "websocket.receive_bytes":
                 raw_audio = data["bytes"]
                 print(f"[INFO main] Received audio chunk: {len(raw_audio)} bytes")
@@ -93,17 +81,10 @@ async def websocket_endpoint(websocket: WebSocket):
                 await websocket.send_json({
                     "partial": result,
-                    "volume": vol_to_send
                 })
     except Exception as e:
         print(f"[ERROR main] Unexpected exception: {e}")
-        if stream and recognizer:
-            final = finalize_stream(stream, recognizer)
-            try:
-                await websocket.send_json({"final": final})
-            except (WebSocketDisconnect, RuntimeError):
-                pass
-        # Ensure connection is closed
         try:
             await websocket.close()
         except:

 from fastapi import FastAPI, WebSocket
 from fastapi.staticfiles import StaticFiles
 from fastapi.responses import HTMLResponse
+from app.asr_worker import create_recognizer, stream_audio
 import json
 from starlette.websockets import WebSocketDisconnect
             data = await websocket.receive()
             kind = data.get("type")
+            # Handle config messages
             if kind not in ("websocket.receive", "websocket.receive_bytes"):
+                            print(f"[DEBUG main] Received control/frame: {data}")
+                            continue
             if kind == "websocket.receive" and "text" in data:
                 raw = data["text"]
                 try:
                 await websocket.send_json({"partial": result, "volume": vol_to_send})
                 continue
+            elif kind == "websocket.receive_bytes":
                 raw_audio = data["bytes"]
                 print(f"[INFO main] Received audio chunk: {len(raw_audio)} bytes")
                 await websocket.send_json({
                     "partial": result,
+                    "volume": min(rms * 20.0, 1.0)
                 })
     except Exception as e:
         print(f"[ERROR main] Unexpected exception: {e}")
         try:
             await websocket.close()
         except:

app/static/index.html CHANGED Viewed

@@ -66,11 +66,6 @@
       color: #353b48;
     }
-    #final {
-      font-size: 1.4rem;
-      color: #e84118;
-    }
     .controls {
       display: flex;
       gap: 1rem;
@@ -132,8 +127,7 @@
   <progress id="vol" max="1" value="0"></progress>
   <div class="output">
-    <div><span class="label">Partial:</span> <span id="partial">...</span></div>
-    <div><span class="label">Final:</span> <b id="final">...</b></div>
   </div>
   <script>
@@ -157,7 +151,6 @@
     const vol = document.getElementById("vol");
     const partial = document.getElementById("partial");
-    const finalText = document.getElementById("final");
     const modelSelect = document.getElementById("modelSelect");
     const precisionSelect = document.getElementById("precisionSelect");
     const modelLangs = document.getElementById("modelLangs");
@@ -218,9 +211,6 @@
         if (msg.partial) {
           partial.textContent = msg.partial;
         }
-        if (msg.final) {
-          finalText.textContent = msg.final;
-        }
       };
     });
   </script>

       color: #353b48;
     }
     .controls {
       display: flex;
       gap: 1rem;
   <progress id="vol" max="1" value="0"></progress>
   <div class="output">
+    <div><span class="label">Transcript:</span> <span id="partial">...</span></div>
   </div>
   <script>
     const vol = document.getElementById("vol");
     const partial = document.getElementById("partial");
     const modelSelect = document.getElementById("modelSelect");
     const precisionSelect = document.getElementById("precisionSelect");
     const modelLangs = document.getElementById("modelLangs");
         if (msg.partial) {
           partial.textContent = msg.partial;
         }
       };
     });
   </script>