Specify dtype in librosa.load instead of casting
Browse files
- whisper_online.py +2 -2
- whisper_online_server.py +3 -2
whisper_online.py
CHANGED
@@ -10,8 +10,8 @@ import math
|
|
10 |
|
11 |
@lru_cache
|
12 |
def load_audio(fname):
|
13 |
-
a, _ = librosa.load(fname, sr=16000)
|
14 |
-
return a
|
15 |
|
16 |
def load_audio_chunk(fname, beg, end):
|
17 |
audio = load_audio(fname)
|
|
|
10 |
|
11 |
@lru_cache
|
12 |
def load_audio(fname):
|
13 |
+
a, _ = librosa.load(fname, sr=16000, dtype=np.float32)
|
14 |
+
return a
|
15 |
|
16 |
def load_audio_chunk(fname, beg, end):
|
17 |
audio = load_audio(fname)
|
whisper_online_server.py
CHANGED
@@ -4,6 +4,7 @@ from whisper_online import *
|
|
4 |
import sys
|
5 |
import argparse
|
6 |
import os
|
|
|
7 |
parser = argparse.ArgumentParser()
|
8 |
|
9 |
# server options
|
@@ -137,8 +138,8 @@ class ServerProcessor:
|
|
137 |
if not raw_bytes:
|
138 |
break
|
139 |
sf = soundfile.SoundFile(io.BytesIO(raw_bytes), channels=1,endian="LITTLE",samplerate=SAMPLING_RATE, subtype="PCM_16",format="RAW")
|
140 |
-
audio, _ = librosa.load(sf,sr=SAMPLING_RATE)
|
141 |
-
out.append(audio
|
142 |
if not out:
|
143 |
return None
|
144 |
return np.concatenate(out)
|
|
|
4 |
import sys
|
5 |
import argparse
|
6 |
import os
|
7 |
+
import numpy as np
|
8 |
parser = argparse.ArgumentParser()
|
9 |
|
10 |
# server options
|
|
|
138 |
if not raw_bytes:
|
139 |
break
|
140 |
sf = soundfile.SoundFile(io.BytesIO(raw_bytes), channels=1,endian="LITTLE",samplerate=SAMPLING_RATE, subtype="PCM_16",format="RAW")
|
141 |
+
audio, _ = librosa.load(sf,sr=SAMPLING_RATE,dtype=np.float32)
|
142 |
+
out.append(audio)
|
143 |
if not out:
|
144 |
return None
|
145 |
return np.concatenate(out)
|