Dominik Macháček
committed on
Commit
·
c812334
1
Parent(s):
6b968c6
increasing timestamps fixed
Browse files
but the code needs to be simplified and cleaned before merging
- whisper_online.py +8 -4
- whisper_online_vac.py +1 -1
whisper_online.py
CHANGED
@@ -235,16 +235,19 @@ class OnlineASRProcessor:
|
|
235 |
|
236 |
self.buffer_trimming_way, self.buffer_trimming_sec = buffer_trimming
|
237 |
|
238 |
-
def init(self):
|
239 |
"""run this when starting or restarting processing"""
|
240 |
self.audio_buffer = np.array([],dtype=np.float32)
|
241 |
-
self.buffer_time_offset = 0
|
242 |
-
|
243 |
self.transcript_buffer = HypothesisBuffer(logfile=self.logfile)
|
|
|
|
|
|
|
|
|
|
|
|
|
244 |
self.commited = []
|
245 |
self.last_chunked_at = 0
|
246 |
|
247 |
-
self.silence_iters = 0
|
248 |
|
249 |
def insert_audio_chunk(self, audio):
|
250 |
self.audio_buffer = np.append(self.audio_buffer, audio)
|
@@ -400,6 +403,7 @@ class OnlineASRProcessor:
|
|
400 |
o = self.transcript_buffer.complete()
|
401 |
f = self.to_flush(o)
|
402 |
print("last, noncommited:",f,file=self.logfile)
|
|
|
403 |
return f
|
404 |
|
405 |
|
|
|
235 |
|
236 |
self.buffer_trimming_way, self.buffer_trimming_sec = buffer_trimming
|
237 |
|
238 |
+
def init(self, keep_offset=False):
|
239 |
"""run this when starting or restarting processing"""
|
240 |
self.audio_buffer = np.array([],dtype=np.float32)
|
|
|
|
|
241 |
self.transcript_buffer = HypothesisBuffer(logfile=self.logfile)
|
242 |
+
if not keep_offset:
|
243 |
+
self.buffer_time_offset = 0
|
244 |
+
self.transcript_buffer.last_commited_time = 0
|
245 |
+
else:
|
246 |
+
self.transcript_buffer.last_commited_time = self.buffer_time_offset
|
247 |
+
|
248 |
self.commited = []
|
249 |
self.last_chunked_at = 0
|
250 |
|
|
|
251 |
|
252 |
def insert_audio_chunk(self, audio):
|
253 |
self.audio_buffer = np.append(self.audio_buffer, audio)
|
|
|
403 |
o = self.transcript_buffer.complete()
|
404 |
f = self.to_flush(o)
|
405 |
print("last, noncommited:",f,file=self.logfile)
|
406 |
+
self.buffer_time_offset += len(self.audio_buffer)/16000
|
407 |
return f
|
408 |
|
409 |
|
whisper_online_vac.py
CHANGED
@@ -45,7 +45,7 @@ class VACOnlineASRProcessor(OnlineASRProcessor):
|
|
45 |
|
46 |
def finish(self):
|
47 |
ret = self.online.finish()
|
48 |
-
self.online.init()
|
49 |
self.current_online_chunk_buffer_size = 0
|
50 |
return ret
|
51 |
|
|
|
45 |
|
46 |
def finish(self):
|
47 |
ret = self.online.finish()
|
48 |
+
self.online.init(keep_offset=True)
|
49 |
self.current_online_chunk_buffer_size = 0
|
50 |
return ret
|
51 |
|