Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -20,7 +20,12 @@ pipe = pipeline(task="automatic-speech-recognition", model=model_repo_id, device
|
|
20 |
def infer(
|
21 |
audio
|
22 |
):
|
23 |
-
|
|
|
|
|
|
|
|
|
|
|
24 |
|
25 |
css = """
|
26 |
#col-container {
|
|
|
20 |
def infer(
    audio
):
    """Transcribe an audio clip to text with the module-level ASR pipeline.

    Args:
        audio: A ``(sampling_rate, samples)`` pair. ``samples`` is a NumPy
            array; when it has more than one dimension it is averaged over
            axis 1 (assumes a (num_samples, num_channels) layout -- TODO
            confirm against the caller).

    Returns:
        The ``'text'`` entry of the pipeline result.
    """
    sampling_rate, wav = audio
    if wav.ndim > 1:
        # Collapse to a single channel by averaging across axis 1.
        wav = wav.mean(axis=1)
    # astype() returns a new array by default, so the in-place scaling below
    # does not modify the array object handed in by the caller.
    wav = wav.astype(np.float32)
    # Peak-normalize. `initial=0.0` keeps a zero-length clip from raising, and
    # the `> 0` guard skips silent clips, where dividing by a zero peak would
    # turn every sample into NaN.
    peak = np.max(np.abs(wav), initial=0.0)
    if peak > 0:
        wav /= peak
    return pipe({"sampling_rate": sampling_rate, "raw": wav}, generate_kwargs={'language': 'chinese'})['text']
|
29 |
|
30 |
css = """
|
31 |
#col-container {
|