fujii committed on
Commit
4405c45
·
1 Parent(s): 24926c9

specify dtype for librosa.load instead of casting afterwards

Browse files
Files changed (2) hide show
  1. whisper_online.py +2 -2
  2. whisper_online_server.py +3 -2
whisper_online.py CHANGED
@@ -10,8 +10,8 @@ import math
10
 
11
  @lru_cache
12
  def load_audio(fname):
13
- a, _ = librosa.load(fname, sr=16000)
14
- return a.astype('float32')
15
 
16
  def load_audio_chunk(fname, beg, end):
17
  audio = load_audio(fname)
 
10
 
11
  @lru_cache
12
  def load_audio(fname):
13
+ a, _ = librosa.load(fname, sr=16000, dtype=np.float32)
14
+ return a
15
 
16
  def load_audio_chunk(fname, beg, end):
17
  audio = load_audio(fname)
whisper_online_server.py CHANGED
@@ -4,6 +4,7 @@ from whisper_online import *
4
  import sys
5
  import argparse
6
  import os
 
7
  parser = argparse.ArgumentParser()
8
 
9
  # server options
@@ -137,8 +138,8 @@ class ServerProcessor:
137
  if not raw_bytes:
138
  break
139
  sf = soundfile.SoundFile(io.BytesIO(raw_bytes), channels=1,endian="LITTLE",samplerate=SAMPLING_RATE, subtype="PCM_16",format="RAW")
140
- audio, _ = librosa.load(sf,sr=SAMPLING_RATE)
141
- out.append(audio.astype('float32'))
142
  if not out:
143
  return None
144
  return np.concatenate(out)
 
4
  import sys
5
  import argparse
6
  import os
7
+ import numpy as np
8
  parser = argparse.ArgumentParser()
9
 
10
  # server options
 
138
  if not raw_bytes:
139
  break
140
  sf = soundfile.SoundFile(io.BytesIO(raw_bytes), channels=1,endian="LITTLE",samplerate=SAMPLING_RATE, subtype="PCM_16",format="RAW")
141
+ audio, _ = librosa.load(sf,sr=SAMPLING_RATE,dtype=np.float32)
142
+ out.append(audio)
143
  if not out:
144
  return None
145
  return np.concatenate(out)