Spaces:

langtech-innovation
/

WhisperLiveKitDiarization

Paused

qfuxa committed on Feb 12

Commit

2ebc949

2 Parent(s): 022a086 bd1016f

Merge pull request #45 from QuentinFuxa/solving-ffmpeg-process-freezing-unexpectedly

Files changed (2) hide show

src/whisper_streaming/online_asr.py CHANGED Viewed

@@ -85,6 +85,7 @@ class HypothesisBuffer:
             self.committed_in_buffer.pop(0)
 class OnlineASRProcessor:
     """
     Processes incoming audio in a streaming fashion, calling the ASR system
@@ -163,6 +164,13 @@ class OnlineASRProcessor:
         context_text = self.asr.sep.join(token.text for token in non_prompt_tokens)
         return self.asr.sep.join(prompt_list[::-1]), context_text
     def process_iter(self) -> Transcript:
         """
         Processes the current audio buffer.
@@ -413,4 +421,10 @@ class VACOnlineASRProcessor:
         result = self.online.finish()
         self.current_online_chunk_buffer_size = 0
         self.is_currently_final = False
-        return result

             self.committed_in_buffer.pop(0)
 class OnlineASRProcessor:
     """
     Processes incoming audio in a streaming fashion, calling the ASR system
         context_text = self.asr.sep.join(token.text for token in non_prompt_tokens)
         return self.asr.sep.join(prompt_list[::-1]), context_text
+    def get_buffer(self):
+        """
+        Get the unvalidated buffer in string format.
+        """
+        return self.concatenate_tokens(self.transcript_buffer.buffer).text
     def process_iter(self) -> Transcript:
         """
         Processes the current audio buffer.
         result = self.online.finish()
         self.current_online_chunk_buffer_size = 0
         self.is_currently_final = False
+        return result
+    def get_buffer(self):
+        """
+        Get the unvalidated buffer in string format.
+        """
+        return self.online.concatenate_tokens(self.online.transcript_buffer.buffer).text

whisper_fastapi_online_server.py CHANGED Viewed

@@ -158,12 +158,8 @@ async def websocket_endpoint(websocket: WebSocket):
                         })
                     full_transcription += transcription.text
-                    if args.vac:
-                        transcript = online.online.concatenate_tokens(online.online.transcript_buffer.buffer)
-                    else:
-                        transcript = online.concatenate_tokens(online.transcript_buffer.buffer)
-                    buffer = transcript.text
                     if buffer in full_transcription: # With VAC, the buffer is not updated until the next chunk is processed
                         buffer = ""

                         })
                     full_transcription += transcription.text
+                    buffer = online.get_buffer()
                     if buffer in full_transcription: # With VAC, the buffer is not updated until the next chunk is processed
                         buffer = ""